gcc/optabs.c

   1 /* Expand the basic unary and binary arithmetic operations, for GNU compiler.
   2    Copyright (C) 1987-2014 Free Software Foundation, Inc.
   3
   4 This file is part of GCC.
   5
   6 GCC is free software; you can redistribute it and/or modify it under
   7 the terms of the GNU General Public License as published by the Free
   8 Software Foundation; either version 3, or (at your option) any later
   9 version.
  10
  11 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  13 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  14 for more details.
  15
  16 You should have received a copy of the GNU General Public License
  17 along with GCC; see the file COPYING3.  If not see
  18 <http://www.gnu.org/licenses/>.  */
  19
  20
  21 #include "config.h"
  22 #include "system.h"
  23 #include "coretypes.h"
  24 #include "tm.h"
  25 #include "diagnostic-core.h"
  26
  27 /* Include insn-config.h before expr.h so that HAVE_conditional_move
  28    is properly defined.  */
  29 #include "insn-config.h"
  30 #include "rtl.h"
  31 #include "tree.h"
  32 #include "tree-hasher.h"
  33 #include "stor-layout.h"
  34 #include "stringpool.h"
  35 #include "varasm.h"
  36 #include "tm_p.h"
  37 #include "flags.h"
  38 #include "hashtab.h"
  39 #include "hash-set.h"
  40 #include "vec.h"
  41 #include "machmode.h"
  42 #include "hard-reg-set.h"
  43 #include "input.h"
  44 #include "function.h"
  45 #include "except.h"
  46 #include "expr.h"
  47 #include "insn-codes.h"
  48 #include "optabs.h"
  49 #include "libfuncs.h"
  50 #include "recog.h"
  51 #include "reload.h"
  52 #include "ggc.h"
  53 #include "predict.h"
  54 #include "dominance.h"
  55 #include "cfg.h"
  56 #include "basic-block.h"
  57 #include "target.h"
  58
  59 struct target_optabs default_target_optabs;
  60 struct target_libfuncs default_target_libfuncs;
  61 struct target_optabs *this_fn_optabs = &default_target_optabs;
  62 #if SWITCHABLE_TARGET
  63 struct target_optabs *this_target_optabs = &default_target_optabs;
  64 struct target_libfuncs *this_target_libfuncs = &default_target_libfuncs;
  65 #endif
  66
  67 #define libfunc_hash \
  68   (this_target_libfuncs->x_libfunc_hash)
  69
  70 static void prepare_float_lib_cmp (rtx, rtx, enum rtx_code, rtx *,
  71                                    machine_mode *);
  72 static rtx expand_unop_direct (machine_mode, optab, rtx, rtx, int);
  73 static void emit_libcall_block_1 (rtx_insn *, rtx, rtx, rtx, bool);
  74
  75 /* Debug facility for use in GDB.  */
  76 void debug_optab_libfuncs (void);
  77
  78 /* Prefixes for the current version of decimal floating point (BID vs. DPD) */
  79 #if ENABLE_DECIMAL_BID_FORMAT
  80 #define DECIMAL_PREFIX "bid_"
  81 #else
  82 #define DECIMAL_PREFIX "dpd_"
  83 #endif
  84 \f
  85 /* Used for libfunc_hash.  */
  86
  87 hashval_t
  88 libfunc_hasher::hash (libfunc_entry *e)
  89 {
  90   return ((e->mode1 + e->mode2 * NUM_MACHINE_MODES) ^ e->op);
  91 }
  92
  93 /* Used for libfunc_hash.  */
  94
  95 bool
  96 libfunc_hasher::equal (libfunc_entry *e1, libfunc_entry *e2)
  97 {
  98   return e1->op == e2->op && e1->mode1 == e2->mode1 && e1->mode2 == e2->mode2;
  99 }
 100
 101 /* Return libfunc corresponding operation defined by OPTAB converting
 102    from MODE2 to MODE1.  Trigger lazy initialization if needed, return NULL
 103    if no libfunc is available.  */
 104 rtx
 105 convert_optab_libfunc (convert_optab optab, machine_mode mode1,
 106                        machine_mode mode2)
 107 {
 108   struct libfunc_entry e;
 109   struct libfunc_entry **slot;
 110
 111   /* ??? This ought to be an assert, but not all of the places
 112      that we expand optabs know about the optabs that got moved
 113      to being direct.  */
 114   if (!(optab >= FIRST_CONV_OPTAB && optab <= LAST_CONVLIB_OPTAB))
 115     return NULL_RTX;
 116
 117   e.op = optab;
 118   e.mode1 = mode1;
 119   e.mode2 = mode2;
 120   slot = libfunc_hash->find_slot (&e, NO_INSERT);
 121   if (!slot)
 122     {
 123       const struct convert_optab_libcall_d *d
 124         = &convlib_def[optab - FIRST_CONV_OPTAB];
 125
 126       if (d->libcall_gen == NULL)
 127         return NULL;
 128
 129       d->libcall_gen (optab, d->libcall_basename, mode1, mode2);
 130       slot = libfunc_hash->find_slot (&e, NO_INSERT);
 131       if (!slot)
 132         return NULL;
 133     }
 134   return (*slot)->libfunc;
 135 }
 136
 137 /* Return libfunc corresponding operation defined by OPTAB in MODE.
 138    Trigger lazy initialization if needed, return NULL if no libfunc is
 139    available.  */
 140 rtx
 141 optab_libfunc (optab optab, machine_mode mode)
 142 {
 143   struct libfunc_entry e;
 144   struct libfunc_entry **slot;
 145
 146   /* ??? This ought to be an assert, but not all of the places
 147      that we expand optabs know about the optabs that got moved
 148      to being direct.  */
 149   if (!(optab >= FIRST_NORM_OPTAB && optab <= LAST_NORMLIB_OPTAB))
 150     return NULL_RTX;
 151
 152   e.op = optab;
 153   e.mode1 = mode;
 154   e.mode2 = VOIDmode;
 155   slot = libfunc_hash->find_slot (&e, NO_INSERT);
 156   if (!slot)
 157     {
 158       const struct optab_libcall_d *d
 159         = &normlib_def[optab - FIRST_NORM_OPTAB];
 160
 161       if (d->libcall_gen == NULL)
 162         return NULL;
 163
 164       d->libcall_gen (optab, d->libcall_basename, d->libcall_suffix, mode);
 165       slot = libfunc_hash->find_slot (&e, NO_INSERT);
 166       if (!slot)
 167         return NULL;
 168     }
 169   return (*slot)->libfunc;
 170 }
 171
 172 \f
 173 /* Add a REG_EQUAL note to the last insn in INSNS.  TARGET is being set to
 174    the result of operation CODE applied to OP0 (and OP1 if it is a binary
 175    operation).
 176
 177    If the last insn does not set TARGET, don't do anything, but return 1.
 178
 179    If the last insn or a previous insn sets TARGET and TARGET is one of OP0
 180    or OP1, don't add the REG_EQUAL note but return 0.  Our caller can then
 181    try again, ensuring that TARGET is not one of the operands.  */
 182
 183 static int
 184 add_equal_note (rtx_insn *insns, rtx target, enum rtx_code code, rtx op0, rtx op1)
 185 {
 186   rtx_insn *last_insn;
 187   rtx set;
 188   rtx note;
 189
 190   gcc_assert (insns && INSN_P (insns) && NEXT_INSN (insns));
 191
 192   if (GET_RTX_CLASS (code) != RTX_COMM_ARITH
 193       && GET_RTX_CLASS (code) != RTX_BIN_ARITH
 194       && GET_RTX_CLASS (code) != RTX_COMM_COMPARE
 195       && GET_RTX_CLASS (code) != RTX_COMPARE
 196       && GET_RTX_CLASS (code) != RTX_UNARY)
 197     return 1;
 198
 199   if (GET_CODE (target) == ZERO_EXTRACT)
 200     return 1;
 201
 202   for (last_insn = insns;
 203        NEXT_INSN (last_insn) != NULL_RTX;
 204        last_insn = NEXT_INSN (last_insn))
 205     ;
 206
 207   /* If TARGET is in OP0 or OP1, punt.  We'd end up with a note referencing
 208      a value changing in the insn, so the note would be invalid for CSE.  */
 209   if (reg_overlap_mentioned_p (target, op0)
 210       || (op1 && reg_overlap_mentioned_p (target, op1)))
 211     {
 212       if (MEM_P (target)
 213           && (rtx_equal_p (target, op0)
 214               || (op1 && rtx_equal_p (target, op1))))
 215         {
 216           /* For MEM target, with MEM = MEM op X, prefer no REG_EQUAL note
 217              over expanding it as temp = MEM op X, MEM = temp.  If the target
 218              supports MEM = MEM op X instructions, it is sometimes too hard
 219              to reconstruct that form later, especially if X is also a memory,
 220              and due to multiple occurrences of addresses the address might
 221              be forced into register unnecessarily.
 222              Note that not emitting the REG_EQUIV note might inhibit
 223              CSE in some cases.  */
 224           set = single_set (last_insn);
 225           if (set
 226               && GET_CODE (SET_SRC (set)) == code
 227               && MEM_P (SET_DEST (set))
 228               && (rtx_equal_p (SET_DEST (set), XEXP (SET_SRC (set), 0))
 229                   || (op1 && rtx_equal_p (SET_DEST (set),
 230                                           XEXP (SET_SRC (set), 1)))))
 231             return 1;
 232         }
 233       return 0;
 234     }
 235
 236   set = set_for_reg_notes (last_insn);
 237   if (set == NULL_RTX)
 238     return 1;
 239
 240   if (! rtx_equal_p (SET_DEST (set), target)
 241       /* For a STRICT_LOW_PART, the REG_NOTE applies to what is inside it.  */
 242       && (GET_CODE (SET_DEST (set)) != STRICT_LOW_PART
 243           || ! rtx_equal_p (XEXP (SET_DEST (set), 0), target)))
 244     return 1;
 245
 246   if (GET_RTX_CLASS (code) == RTX_UNARY)
 247     switch (code)
 248       {
 249       case FFS:
 250       case CLZ:
 251       case CTZ:
 252       case CLRSB:
 253       case POPCOUNT:
 254       case PARITY:
 255       case BSWAP:
 256         if (GET_MODE (op0) != VOIDmode && GET_MODE (target) != GET_MODE (op0))
 257           {
 258             note = gen_rtx_fmt_e (code, GET_MODE (op0), copy_rtx (op0));
 259             if (GET_MODE_SIZE (GET_MODE (op0))
 260                 > GET_MODE_SIZE (GET_MODE (target)))
 261               note = simplify_gen_unary (TRUNCATE, GET_MODE (target),
 262                                          note, GET_MODE (op0));
 263             else
 264               note = simplify_gen_unary (ZERO_EXTEND, GET_MODE (target),
 265                                          note, GET_MODE (op0));
 266             break;
 267           }
 268         /* FALLTHRU */
 269       default:
 270         note = gen_rtx_fmt_e (code, GET_MODE (target), copy_rtx (op0));
 271         break;
 272       }
 273   else
 274     note = gen_rtx_fmt_ee (code, GET_MODE (target), copy_rtx (op0), copy_rtx (op1));
 275
 276   set_unique_reg_note (last_insn, REG_EQUAL, note);
 277
 278   return 1;
 279 }
 280 \f
 281 /* Given two input operands, OP0 and OP1, determine what the correct from_mode
 282    for a widening operation would be.  In most cases this would be OP0, but if
 283    that's a constant it'll be VOIDmode, which isn't useful.  */
 284
 285 static machine_mode
 286 widened_mode (machine_mode to_mode, rtx op0, rtx op1)
 287 {
 288   machine_mode m0 = GET_MODE (op0);
 289   machine_mode m1 = GET_MODE (op1);
 290   machine_mode result;
 291
 292   if (m0 == VOIDmode && m1 == VOIDmode)
 293     return to_mode;
 294   else if (m0 == VOIDmode || GET_MODE_SIZE (m0) < GET_MODE_SIZE (m1))
 295     result = m1;
 296   else
 297     result = m0;
 298
 299   if (GET_MODE_SIZE (result) > GET_MODE_SIZE (to_mode))
 300     return to_mode;
 301
 302   return result;
 303 }
 304 \f
 305 /* Like optab_handler, but for widening_operations that have a
 306    TO_MODE and a FROM_MODE.  */
 307
 308 enum insn_code
 309 widening_optab_handler (optab op, machine_mode to_mode,
 310                         machine_mode from_mode)
 311 {
 312   unsigned scode = (op << 16) | to_mode;
 313   if (to_mode != from_mode && from_mode != VOIDmode)
 314     {
 315       /* ??? Why does find_widening_optab_handler_and_mode attempt to
 316          widen things that can't be widened?  E.g. add_optab... */
 317       if (op > LAST_CONV_OPTAB)
 318         return CODE_FOR_nothing;
 319       scode |= from_mode << 8;
 320     }
 321   return raw_optab_handler (scode);
 322 }
 323
 324 /* Find a widening optab even if it doesn't widen as much as we want.
 325    E.g. if from_mode is HImode, and to_mode is DImode, and there is no
 326    direct HI->SI insn, then return SI->DI, if that exists.
 327    If PERMIT_NON_WIDENING is non-zero then this can be used with
 328    non-widening optabs also.  */
 329
 330 enum insn_code
 331 find_widening_optab_handler_and_mode (optab op, machine_mode to_mode,
 332                                       machine_mode from_mode,
 333                                       int permit_non_widening,
 334                                       machine_mode *found_mode)
 335 {
 336   for (; (permit_non_widening || from_mode != to_mode)
 337          && GET_MODE_SIZE (from_mode) <= GET_MODE_SIZE (to_mode)
 338          && from_mode != VOIDmode;
 339        from_mode = GET_MODE_WIDER_MODE (from_mode))
 340     {
 341       enum insn_code handler = widening_optab_handler (op, to_mode,
 342                                                        from_mode);
 343
 344       if (handler != CODE_FOR_nothing)
 345         {
 346           if (found_mode)
 347             *found_mode = from_mode;
 348           return handler;
 349         }
 350     }
 351
 352   return CODE_FOR_nothing;
 353 }
 354 \f
 355 /* Widen OP to MODE and return the rtx for the widened operand.  UNSIGNEDP
 356    says whether OP is signed or unsigned.  NO_EXTEND is nonzero if we need
 357    not actually do a sign-extend or zero-extend, but can leave the
 358    higher-order bits of the result rtx undefined, for example, in the case
 359    of logical operations, but not right shifts.  */
 360
 361 static rtx
 362 widen_operand (rtx op, machine_mode mode, machine_mode oldmode,
 363                int unsignedp, int no_extend)
 364 {
 365   rtx result;
 366
 367   /* If we don't have to extend and this is a constant, return it.  */
 368   if (no_extend && GET_MODE (op) == VOIDmode)
 369     return op;
 370
 371   /* If we must extend do so.  If OP is a SUBREG for a promoted object, also
 372      extend since it will be more efficient to do so unless the signedness of
 373      a promoted object differs from our extension.  */
 374   if (! no_extend
 375       || (GET_CODE (op) == SUBREG && SUBREG_PROMOTED_VAR_P (op)
 376           && SUBREG_CHECK_PROMOTED_SIGN (op, unsignedp)))
 377     return convert_modes (mode, oldmode, op, unsignedp);
 378
 379   /* If MODE is no wider than a single word, we return a lowpart or paradoxical
 380      SUBREG.  */
 381   if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
 382     return gen_lowpart (mode, force_reg (GET_MODE (op), op));
 383
 384   /* Otherwise, get an object of MODE, clobber it, and set the low-order
 385      part to OP.  */
 386
 387   result = gen_reg_rtx (mode);
 388   emit_clobber (result);
 389   emit_move_insn (gen_lowpart (GET_MODE (op), result), op);
 390   return result;
 391 }
 392 \f
 393 /* Return the optab used for computing the operation given by the tree code,
 394    CODE and the tree EXP.  This function is not always usable (for example, it
 395    cannot give complete results for multiplication or division) but probably
 396    ought to be relied on more widely throughout the expander.  */
 397 optab
 398 optab_for_tree_code (enum tree_code code, const_tree type,
 399                      enum optab_subtype subtype)
 400 {
 401   bool trapv;
 402   switch (code)
 403     {
 404     case BIT_AND_EXPR:
 405       return and_optab;
 406
 407     case BIT_IOR_EXPR:
 408       return ior_optab;
 409
 410     case BIT_NOT_EXPR:
 411       return one_cmpl_optab;
 412
 413     case BIT_XOR_EXPR:
 414       return xor_optab;
 415
 416     case MULT_HIGHPART_EXPR:
 417       return TYPE_UNSIGNED (type) ? umul_highpart_optab : smul_highpart_optab;
 418
 419     case TRUNC_MOD_EXPR:
 420     case CEIL_MOD_EXPR:
 421     case FLOOR_MOD_EXPR:
 422     case ROUND_MOD_EXPR:
 423       return TYPE_UNSIGNED (type) ? umod_optab : smod_optab;
 424
 425     case RDIV_EXPR:
 426     case TRUNC_DIV_EXPR:
 427     case CEIL_DIV_EXPR:
 428     case FLOOR_DIV_EXPR:
 429     case ROUND_DIV_EXPR:
 430     case EXACT_DIV_EXPR:
 431       if (TYPE_SATURATING (type))
 432         return TYPE_UNSIGNED (type) ? usdiv_optab : ssdiv_optab;
 433       return TYPE_UNSIGNED (type) ? udiv_optab : sdiv_optab;
 434
 435     case LSHIFT_EXPR:
 436       if (TREE_CODE (type) == VECTOR_TYPE)
 437         {
 438           if (subtype == optab_vector)
 439             return TYPE_SATURATING (type) ? unknown_optab : vashl_optab;
 440
 441           gcc_assert (subtype == optab_scalar);
 442         }
 443       if (TYPE_SATURATING (type))
 444         return TYPE_UNSIGNED (type) ? usashl_optab : ssashl_optab;
 445       return ashl_optab;
 446
 447     case RSHIFT_EXPR:
 448       if (TREE_CODE (type) == VECTOR_TYPE)
 449         {
 450           if (subtype == optab_vector)
 451             return TYPE_UNSIGNED (type) ? vlshr_optab : vashr_optab;
 452
 453           gcc_assert (subtype == optab_scalar);
 454         }
 455       return TYPE_UNSIGNED (type) ? lshr_optab : ashr_optab;
 456
 457     case LROTATE_EXPR:
 458       if (TREE_CODE (type) == VECTOR_TYPE)
 459         {
 460           if (subtype == optab_vector)
 461             return vrotl_optab;
 462
 463           gcc_assert (subtype == optab_scalar);
 464         }
 465       return rotl_optab;
 466
 467     case RROTATE_EXPR:
 468       if (TREE_CODE (type) == VECTOR_TYPE)
 469         {
 470           if (subtype == optab_vector)
 471             return vrotr_optab;
 472
 473           gcc_assert (subtype == optab_scalar);
 474         }
 475       return rotr_optab;
 476
 477     case MAX_EXPR:
 478       return TYPE_UNSIGNED (type) ? umax_optab : smax_optab;
 479
 480     case MIN_EXPR:
 481       return TYPE_UNSIGNED (type) ? umin_optab : smin_optab;
 482
 483     case REALIGN_LOAD_EXPR:
 484       return vec_realign_load_optab;
 485
 486     case WIDEN_SUM_EXPR:
 487       return TYPE_UNSIGNED (type) ? usum_widen_optab : ssum_widen_optab;
 488
 489     case DOT_PROD_EXPR:
 490       return TYPE_UNSIGNED (type) ? udot_prod_optab : sdot_prod_optab;
 491
 492     case SAD_EXPR:
 493       return TYPE_UNSIGNED (type) ? usad_optab : ssad_optab;
 494
 495     case WIDEN_MULT_PLUS_EXPR:
 496       return (TYPE_UNSIGNED (type)
 497               ? (TYPE_SATURATING (type)
 498                  ? usmadd_widen_optab : umadd_widen_optab)
 499               : (TYPE_SATURATING (type)
 500                  ? ssmadd_widen_optab : smadd_widen_optab));
 501
 502     case WIDEN_MULT_MINUS_EXPR:
 503       return (TYPE_UNSIGNED (type)
 504               ? (TYPE_SATURATING (type)
 505                  ? usmsub_widen_optab : umsub_widen_optab)
 506               : (TYPE_SATURATING (type)
 507                  ? ssmsub_widen_optab : smsub_widen_optab));
 508
 509     case FMA_EXPR:
 510       return fma_optab;
 511
 512     case REDUC_MAX_EXPR:
 513       return TYPE_UNSIGNED (type)
 514              ? reduc_umax_scal_optab : reduc_smax_scal_optab;
 515
 516     case REDUC_MIN_EXPR:
 517       return TYPE_UNSIGNED (type)
 518              ? reduc_umin_scal_optab : reduc_smin_scal_optab;
 519
 520     case REDUC_PLUS_EXPR:
 521       return reduc_plus_scal_optab;
 522
 523     case VEC_RSHIFT_EXPR:
 524       return vec_shr_optab;
 525
 526     case VEC_WIDEN_MULT_HI_EXPR:
 527       return TYPE_UNSIGNED (type) ?
 528         vec_widen_umult_hi_optab : vec_widen_smult_hi_optab;
 529
 530     case VEC_WIDEN_MULT_LO_EXPR:
 531       return TYPE_UNSIGNED (type) ?
 532         vec_widen_umult_lo_optab : vec_widen_smult_lo_optab;
 533
 534     case VEC_WIDEN_MULT_EVEN_EXPR:
 535       return TYPE_UNSIGNED (type) ?
 536         vec_widen_umult_even_optab : vec_widen_smult_even_optab;
 537
 538     case VEC_WIDEN_MULT_ODD_EXPR:
 539       return TYPE_UNSIGNED (type) ?
 540         vec_widen_umult_odd_optab : vec_widen_smult_odd_optab;
 541
 542     case VEC_WIDEN_LSHIFT_HI_EXPR:
 543       return TYPE_UNSIGNED (type) ?
 544         vec_widen_ushiftl_hi_optab : vec_widen_sshiftl_hi_optab;
 545
 546     case VEC_WIDEN_LSHIFT_LO_EXPR:
 547       return TYPE_UNSIGNED (type) ?
 548         vec_widen_ushiftl_lo_optab : vec_widen_sshiftl_lo_optab;
 549
 550     case VEC_UNPACK_HI_EXPR:
 551       return TYPE_UNSIGNED (type) ?
 552         vec_unpacku_hi_optab : vec_unpacks_hi_optab;
 553
 554     case VEC_UNPACK_LO_EXPR:
 555       return TYPE_UNSIGNED (type) ?
 556         vec_unpacku_lo_optab : vec_unpacks_lo_optab;
 557
 558     case VEC_UNPACK_FLOAT_HI_EXPR:
 559       /* The signedness is determined from input operand.  */
 560       return TYPE_UNSIGNED (type) ?
 561         vec_unpacku_float_hi_optab : vec_unpacks_float_hi_optab;
 562
 563     case VEC_UNPACK_FLOAT_LO_EXPR:
 564       /* The signedness is determined from input operand.  */
 565       return TYPE_UNSIGNED (type) ?
 566         vec_unpacku_float_lo_optab : vec_unpacks_float_lo_optab;
 567
 568     case VEC_PACK_TRUNC_EXPR:
 569       return vec_pack_trunc_optab;
 570
 571     case VEC_PACK_SAT_EXPR:
 572       return TYPE_UNSIGNED (type) ? vec_pack_usat_optab : vec_pack_ssat_optab;
 573
 574     case VEC_PACK_FIX_TRUNC_EXPR:
 575       /* The signedness is determined from output operand.  */
 576       return TYPE_UNSIGNED (type) ?
 577         vec_pack_ufix_trunc_optab : vec_pack_sfix_trunc_optab;
 578
 579     default:
 580       break;
 581     }
 582
 583   trapv = INTEGRAL_TYPE_P (type) && TYPE_OVERFLOW_TRAPS (type);
 584   switch (code)
 585     {
 586     case POINTER_PLUS_EXPR:
 587     case PLUS_EXPR:
 588       if (TYPE_SATURATING (type))
 589         return TYPE_UNSIGNED (type) ? usadd_optab : ssadd_optab;
 590       return trapv ? addv_optab : add_optab;
 591
 592     case MINUS_EXPR:
 593       if (TYPE_SATURATING (type))
 594         return TYPE_UNSIGNED (type) ? ussub_optab : sssub_optab;
 595       return trapv ? subv_optab : sub_optab;
 596
 597     case MULT_EXPR:
 598       if (TYPE_SATURATING (type))
 599         return TYPE_UNSIGNED (type) ? usmul_optab : ssmul_optab;
 600       return trapv ? smulv_optab : smul_optab;
 601
 602     case NEGATE_EXPR:
 603       if (TYPE_SATURATING (type))
 604         return TYPE_UNSIGNED (type) ? usneg_optab : ssneg_optab;
 605       return trapv ? negv_optab : neg_optab;
 606
 607     case ABS_EXPR:
 608       return trapv ? absv_optab : abs_optab;
 609
 610     default:
 611       return unknown_optab;
 612     }
 613 }
 614
 615 /* Given optab UNOPTAB that reduces a vector to a scalar, find instead the old
 616    optab that produces a vector with the reduction result in one element,
 617    for a tree with type TYPE.  */
 618
 619 optab
 620 scalar_reduc_to_vector (optab unoptab, const_tree type)
 621 {
 622   switch (unoptab)
 623     {
 624     case reduc_plus_scal_optab:
 625       return TYPE_UNSIGNED (type) ? reduc_uplus_optab : reduc_splus_optab;
 626
 627     case reduc_smin_scal_optab: return reduc_smin_optab;
 628     case reduc_umin_scal_optab: return reduc_umin_optab;
 629     case reduc_smax_scal_optab: return reduc_smax_optab;
 630     case reduc_umax_scal_optab: return reduc_umax_optab;
 631     default: return unknown_optab;
 632     }
 633 }
 634
 635 /* Expand vector widening operations.
 636
 637    There are two different classes of operations handled here:
 638    1) Operations whose result is wider than all the arguments to the operation.
 639       Examples: VEC_UNPACK_HI/LO_EXPR, VEC_WIDEN_MULT_HI/LO_EXPR
 640       In this case OP0 and optionally OP1 would be initialized,
 641       but WIDE_OP wouldn't (not relevant for this case).
 642    2) Operations whose result is of the same size as the last argument to the
 643       operation, but wider than all the other arguments to the operation.
 644       Examples: WIDEN_SUM_EXPR, VEC_DOT_PROD_EXPR.
 645       In the case WIDE_OP, OP0 and optionally OP1 would be initialized.
 646
 647    E.g, when called to expand the following operations, this is how
 648    the arguments will be initialized:
 649                                 nops    OP0     OP1     WIDE_OP
 650    widening-sum                 2       oprnd0  -       oprnd1
 651    widening-dot-product         3       oprnd0  oprnd1  oprnd2
 652    widening-mult                2       oprnd0  oprnd1  -
 653    type-promotion (vec-unpack)  1       oprnd0  -       -  */
 654
 655 rtx
 656 expand_widen_pattern_expr (sepops ops, rtx op0, rtx op1, rtx wide_op,
 657                            rtx target, int unsignedp)
 658 {
 659   struct expand_operand eops[4];
 660   tree oprnd0, oprnd1, oprnd2;
 661   machine_mode wmode = VOIDmode, tmode0, tmode1 = VOIDmode;
 662   optab widen_pattern_optab;
 663   enum insn_code icode;
 664   int nops = TREE_CODE_LENGTH (ops->code);
 665   int op;
 666
 667   oprnd0 = ops->op0;
 668   tmode0 = TYPE_MODE (TREE_TYPE (oprnd0));
 669   widen_pattern_optab =
 670     optab_for_tree_code (ops->code, TREE_TYPE (oprnd0), optab_default);
 671   if (ops->code == WIDEN_MULT_PLUS_EXPR
 672       || ops->code == WIDEN_MULT_MINUS_EXPR)
 673     icode = find_widening_optab_handler (widen_pattern_optab,
 674                                          TYPE_MODE (TREE_TYPE (ops->op2)),
 675                                          tmode0, 0);
 676   else
 677     icode = optab_handler (widen_pattern_optab, tmode0);
 678   gcc_assert (icode != CODE_FOR_nothing);
 679
 680   if (nops >= 2)
 681     {
 682       oprnd1 = ops->op1;
 683       tmode1 = TYPE_MODE (TREE_TYPE (oprnd1));
 684     }
 685
 686   /* The last operand is of a wider mode than the rest of the operands.  */
 687   if (nops == 2)
 688     wmode = tmode1;
 689   else if (nops == 3)
 690     {
 691       gcc_assert (tmode1 == tmode0);
 692       gcc_assert (op1);
 693       oprnd2 = ops->op2;
 694       wmode = TYPE_MODE (TREE_TYPE (oprnd2));
 695     }
 696
 697   op = 0;
 698   create_output_operand (&eops[op++], target, TYPE_MODE (ops->type));
 699   create_convert_operand_from (&eops[op++], op0, tmode0, unsignedp);
 700   if (op1)
 701     create_convert_operand_from (&eops[op++], op1, tmode1, unsignedp);
 702   if (wide_op)
 703     create_convert_operand_from (&eops[op++], wide_op, wmode, unsignedp);
 704   expand_insn (icode, op, eops);
 705   return eops[0].value;
 706 }
 707
 708 /* Generate code to perform an operation specified by TERNARY_OPTAB
 709    on operands OP0, OP1 and OP2, with result having machine-mode MODE.
 710
 711    UNSIGNEDP is for the case where we have to widen the operands
 712    to perform the operation.  It says to use zero-extension.
 713
 714    If TARGET is nonzero, the value
 715    is generated there, if it is convenient to do so.
 716    In all cases an rtx is returned for the locus of the value;
 717    this may or may not be TARGET.  */
 718
 719 rtx
 720 expand_ternary_op (machine_mode mode, optab ternary_optab, rtx op0,
 721                    rtx op1, rtx op2, rtx target, int unsignedp)
 722 {
 723   struct expand_operand ops[4];
 724   enum insn_code icode = optab_handler (ternary_optab, mode);
 725
 726   gcc_assert (optab_handler (ternary_optab, mode) != CODE_FOR_nothing);
 727
 728   create_output_operand (&ops[0], target, mode);
 729   create_convert_operand_from (&ops[1], op0, mode, unsignedp);
 730   create_convert_operand_from (&ops[2], op1, mode, unsignedp);
 731   create_convert_operand_from (&ops[3], op2, mode, unsignedp);
 732   expand_insn (icode, 4, ops);
 733   return ops[0].value;
 734 }
 735
 736
 737 /* Like expand_binop, but return a constant rtx if the result can be
 738    calculated at compile time.  The arguments and return value are
 739    otherwise the same as for expand_binop.  */
 740
 741 rtx
 742 simplify_expand_binop (machine_mode mode, optab binoptab,
 743                        rtx op0, rtx op1, rtx target, int unsignedp,
 744                        enum optab_methods methods)
 745 {
 746   if (CONSTANT_P (op0) && CONSTANT_P (op1))
 747     {
 748       rtx x = simplify_binary_operation (optab_to_code (binoptab),
 749                                          mode, op0, op1);
 750       if (x)
 751         return x;
 752     }
 753
 754   return expand_binop (mode, binoptab, op0, op1, target, unsignedp, methods);
 755 }
 756
 757 /* Like simplify_expand_binop, but always put the result in TARGET.
 758    Return true if the expansion succeeded.  */
 759
 760 bool
 761 force_expand_binop (machine_mode mode, optab binoptab,
 762                     rtx op0, rtx op1, rtx target, int unsignedp,
 763                     enum optab_methods methods)
 764 {
 765   rtx x = simplify_expand_binop (mode, binoptab, op0, op1,
 766                                  target, unsignedp, methods);
 767   if (x == 0)
 768     return false;
 769   if (x != target)
 770     emit_move_insn (target, x);
 771   return true;
 772 }
 773
 774 /* Generate insns for VEC_RSHIFT_EXPR.  */
 775
 776 rtx
 777 expand_vec_shift_expr (sepops ops, rtx target)
 778 {
 779   struct expand_operand eops[3];
 780   enum insn_code icode;
 781   rtx rtx_op1, rtx_op2;
 782   machine_mode mode = TYPE_MODE (ops->type);
 783   tree vec_oprnd = ops->op0;
 784   tree shift_oprnd = ops->op1;
 785
 786   gcc_assert (ops->code == VEC_RSHIFT_EXPR);
 787
 788   icode = optab_handler (vec_shr_optab, mode);
 789   gcc_assert (icode != CODE_FOR_nothing);
 790
 791   rtx_op1 = expand_normal (vec_oprnd);
 792   rtx_op2 = expand_normal (shift_oprnd);
 793
 794   create_output_operand (&eops[0], target, mode);
 795   create_input_operand (&eops[1], rtx_op1, GET_MODE (rtx_op1));
 796   create_convert_operand_from_type (&eops[2], rtx_op2, TREE_TYPE (shift_oprnd));
 797   expand_insn (icode, 3, eops);
 798
 799   return eops[0].value;
 800 }
 801
 802 /* Create a new vector value in VMODE with all elements set to OP.  The
 803    mode of OP must be the element mode of VMODE.  If OP is a constant,
 804    then the return value will be a constant.  */
 805
 806 static rtx
 807 expand_vector_broadcast (machine_mode vmode, rtx op)
 808 {
 809   enum insn_code icode;
 810   rtvec vec;
 811   rtx ret;
 812   int i, n;
 813
 814   gcc_checking_assert (VECTOR_MODE_P (vmode));
 815
 816   n = GET_MODE_NUNITS (vmode);
 817   vec = rtvec_alloc (n);
 818   for (i = 0; i < n; ++i)
 819     RTVEC_ELT (vec, i) = op;
 820
 821   if (CONSTANT_P (op))
 822     return gen_rtx_CONST_VECTOR (vmode, vec);
 823
 824   /* ??? If the target doesn't have a vec_init, then we have no easy way
 825      of performing this operation.  Most of this sort of generic support
 826      is hidden away in the vector lowering support in gimple.  */
 827   icode = optab_handler (vec_init_optab, vmode);
 828   if (icode == CODE_FOR_nothing)
 829     return NULL;
 830
 831   ret = gen_reg_rtx (vmode);
 832   emit_insn (GEN_FCN (icode) (ret, gen_rtx_PARALLEL (vmode, vec)));
 833
 834   return ret;
 835 }
 836
 837 /* This subroutine of expand_doubleword_shift handles the cases in which
 838    the effective shift value is >= BITS_PER_WORD.  The arguments and return
 839    value are the same as for the parent routine, except that SUPERWORD_OP1
 840    is the shift count to use when shifting OUTOF_INPUT into INTO_TARGET.
 841    INTO_TARGET may be null if the caller has decided to calculate it.  */
 842
 843 static bool
 844 expand_superword_shift (optab binoptab, rtx outof_input, rtx superword_op1,
 845                         rtx outof_target, rtx into_target,
 846                         int unsignedp, enum optab_methods methods)
 847 {
 848   if (into_target != 0)
 849     if (!force_expand_binop (word_mode, binoptab, outof_input, superword_op1,
 850                              into_target, unsignedp, methods))
 851       return false;
 852
 853   if (outof_target != 0)
 854     {
 855       /* For a signed right shift, we must fill OUTOF_TARGET with copies
 856          of the sign bit, otherwise we must fill it with zeros.  */
 857       if (binoptab != ashr_optab)
 858         emit_move_insn (outof_target, CONST0_RTX (word_mode));
 859       else
 860         if (!force_expand_binop (word_mode, binoptab,
 861                                  outof_input, GEN_INT (BITS_PER_WORD - 1),
 862                                  outof_target, unsignedp, methods))
 863           return false;
 864     }
 865   return true;
 866 }
 867
 868 /* This subroutine of expand_doubleword_shift handles the cases in which
 869    the effective shift value is < BITS_PER_WORD.  The arguments and return
 870    value are the same as for the parent routine.

        INTO_TARGET is set to INTO_INPUT shifted logically by OP1, ORed with
        the bits of OUTOF_INPUT that cross the word boundary.  If OUTOF_TARGET
        is nonnull, it is set to OUTOF_INPUT shifted by OP1 using BINOPTAB.
        Return false as soon as one of the word-mode operations cannot be
        expanded.  */
 871
 872 static bool
 873 expand_subword_shift (machine_mode op1_mode, optab binoptab,
 874                       rtx outof_input, rtx into_input, rtx op1,
 875                       rtx outof_target, rtx into_target,
 876                       int unsignedp, enum optab_methods methods,
 877                       unsigned HOST_WIDE_INT shift_mask)
 878 {
 879   optab reverse_unsigned_shift, unsigned_shift;
 880   rtx tmp, carries;
 881
       /* REVERSE_UNSIGNED_SHIFT is the logical shift in the opposite direction
          to BINOPTAB; UNSIGNED_SHIFT is the logical shift in the same direction
          (lshr_optab for any BINOPTAB other than ashl_optab).  */
 882   reverse_unsigned_shift = (binoptab == ashl_optab ? lshr_optab : ashl_optab);
 883   unsigned_shift = (binoptab == ashl_optab ? ashl_optab : lshr_optab);
 884
 885   /* The low OP1 bits of INTO_TARGET come from the high bits of OUTOF_INPUT.
 886      We therefore need to shift OUTOF_INPUT by (BITS_PER_WORD - OP1) bits in
 887      the opposite direction to BINOPTAB.  */
 888   if (CONSTANT_P (op1) || shift_mask >= BITS_PER_WORD)
 889     {
           /* A single shift by BITS_PER_WORD - OP1 is used on this path, so
              OUTOF_INPUT is taken as is and TMP becomes that count.  */
 890       carries = outof_input;
 891       tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD,
 892                                             op1_mode), op1_mode);
 893       tmp = simplify_expand_binop (op1_mode, sub_optab, tmp, op1,
 894                                    0, true, methods);
 895     }
 896   else
 897     {
 898       /* We must avoid shifting by BITS_PER_WORD bits since that is either
 899          the same as a zero shift (if shift_mask == BITS_PER_WORD - 1) or
 900          has unknown behavior.  Do a single shift first, then shift by the
 901          remainder.  It's OK to use ~OP1 as the remainder if shift counts
 902          are truncated to the mode size.  */
 903       carries = expand_binop (word_mode, reverse_unsigned_shift,
 904                               outof_input, const1_rtx, 0, unsignedp, methods);
 905       if (shift_mask == BITS_PER_WORD - 1)
 906         {
               /* TMP = OP1 ^ -1, i.e. ~OP1.  */
 907           tmp = immed_wide_int_const
 908             (wi::minus_one (GET_MODE_PRECISION (op1_mode)), op1_mode);
 909           tmp = simplify_expand_binop (op1_mode, xor_optab, op1, tmp,
 910                                        0, true, methods);
 911         }
 912       else
 913         {
               /* TMP = (BITS_PER_WORD - 1) - OP1.  */
 914           tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD - 1,
 915                                                 op1_mode), op1_mode);
 916           tmp = simplify_expand_binop (op1_mode, sub_optab, tmp, op1,
 917                                        0, true, methods);
 918         }
 919     }
       /* Give up if the count or the preliminary one-bit shift could not be
          expanded.  */
 920   if (tmp == 0 || carries == 0)
 921     return false;
       /* CARRIES now becomes the bits of OUTOF_INPUT destined for INTO_TARGET.  */
 922   carries = expand_binop (word_mode, reverse_unsigned_shift,
 923                           carries, tmp, 0, unsignedp, methods);
 924   if (carries == 0)
 925     return false;
 926
 927   /* Shift INTO_INPUT logically by OP1.  This is the last use of INTO_INPUT
 928      so the result can go directly into INTO_TARGET if convenient.  */
 929   tmp = expand_binop (word_mode, unsigned_shift, into_input, op1,
 930                       into_target, unsignedp, methods);
 931   if (tmp == 0)
 932     return false;
 933
 934   /* Now OR in the bits carried over from OUTOF_INPUT.  */
 935   if (!force_expand_binop (word_mode, ior_optab, tmp, carries,
 936                            into_target, unsignedp, methods))
 937     return false;
 938
 939   /* Use a standard word_mode shift for the out-of half.  */
 940   if (outof_target != 0)
 941     if (!force_expand_binop (word_mode, binoptab, outof_input, op1,
 942                              outof_target, unsignedp, methods))
 943       return false;
 944
 945   return true;
 946 }
 947
 948
 949 #ifdef HAVE_conditional_move
 950 /* Try implementing expand_doubleword_shift using conditional moves.
 951    The shift is by < BITS_PER_WORD if (CMP_CODE CMP1 CMP2) is true,
 952    otherwise it is by >= BITS_PER_WORD.  SUBWORD_OP1 and SUPERWORD_OP1
 953    are the shift counts to use in the former and latter case.  All other
 954    arguments are the same as the parent routine.

        Code for both cases is emitted unconditionally: the superword results
        go to OUTOF_SUPERWORD and INTO_SUPERWORD, the subword results go
        straight to OUTOF_TARGET and INTO_TARGET, and conditional moves then
        select between them.  Return false if any step cannot be expanded;
        insns emitted up to that point are left for the caller to delete.  */
 955
 956 static bool
 957 expand_doubleword_shift_condmove (machine_mode op1_mode, optab binoptab,
 958                                   enum rtx_code cmp_code, rtx cmp1, rtx cmp2,
 959                                   rtx outof_input, rtx into_input,
 960                                   rtx subword_op1, rtx superword_op1,
 961                                   rtx outof_target, rtx into_target,
 962                                   int unsignedp, enum optab_methods methods,
 963                                   unsigned HOST_WIDE_INT shift_mask)
 964 {
 965   rtx outof_superword, into_superword;
 966
 967   /* Put the superword version of the output into OUTOF_SUPERWORD and
 968      INTO_SUPERWORD.  */
 969   outof_superword = outof_target != 0 ? gen_reg_rtx (word_mode) : 0;
 970   if (outof_target != 0 && subword_op1 == superword_op1)
 971     {
 972       /* The value OUTOF_INPUT shifted by SUBWORD_OP1, which we later store
 973          in OUTOF_TARGET, is the same as the value of INTO_SUPERWORD.  */
 974       into_superword = outof_target;
           /* Hence only OUTOF_SUPERWORD is computed here (null INTO_TARGET).  */
 975       if (!expand_superword_shift (binoptab, outof_input, superword_op1,
 976                                    outof_superword, 0, unsignedp, methods))
 977         return false;
 978     }
 979   else
 980     {
 981       into_superword = gen_reg_rtx (word_mode);
 982       if (!expand_superword_shift (binoptab, outof_input, superword_op1,
 983                                    outof_superword, into_superword,
 984                                    unsignedp, methods))
 985         return false;
 986     }
 987
 988   /* Put the subword version directly in OUTOF_TARGET and INTO_TARGET.  */
 989   if (!expand_subword_shift (op1_mode, binoptab,
 990                              outof_input, into_input, subword_op1,
 991                              outof_target, into_target,
 992                              unsignedp, methods, shift_mask))
 993     return false;
 994
 995   /* Select between them.  Do the INTO half first because INTO_SUPERWORD
 996      might be the current value of OUTOF_TARGET.  */
 997   if (!emit_conditional_move (into_target, cmp_code, cmp1, cmp2, op1_mode,
 998                               into_target, into_superword, word_mode, false))
 999     return false;
1000
1001   if (outof_target != 0)
1002     if (!emit_conditional_move (outof_target, cmp_code, cmp1, cmp2, op1_mode,
1003                                 outof_target, outof_superword,
1004                                 word_mode, false))
1005       return false;
1006
1007   return true;
1008 }
1009 #endif
1010
1011 /* Expand a doubleword shift (ashl, ashr or lshr) using word-mode shifts.
1012    OUTOF_INPUT and INTO_INPUT are the two word-sized halves of the first
1013    input operand; the shift moves bits in the direction OUTOF_INPUT->
1014    INTO_TARGET.  OUTOF_TARGET and INTO_TARGET are the equivalent words
1015    of the target.  OP1 is the shift count and OP1_MODE is its mode.
1016    If OP1 is constant, it will have been truncated as appropriate
1017    and is known to be nonzero.
1018
1019    If SHIFT_MASK is zero, the result of word shifts is undefined when the
1020    shift count is outside the range [0, BITS_PER_WORD).  This routine must
1021    avoid generating such shifts for OP1s in the range [0, BITS_PER_WORD * 2).
1022
1023    If SHIFT_MASK is nonzero, all word-mode shift counts are effectively
1024    masked by it and shifts in the range [BITS_PER_WORD, SHIFT_MASK) will
1025    fill with zeros or sign bits as appropriate.
1026
1027    If SHIFT_MASK is BITS_PER_WORD - 1, this routine will synthesize
1028    a doubleword shift whose equivalent mask is BITS_PER_WORD * 2 - 1.
1029    Doing this preserves semantics required by SHIFT_COUNT_TRUNCATED.
1030    In all other cases, shifts by values outside [0, BITS_PER_WORD * 2)
1031    are undefined.
1032
1033    BINOPTAB, UNSIGNEDP and METHODS are as for expand_binop.  This function
1034    may not use INTO_INPUT after modifying INTO_TARGET, and similarly for
1035    OUTOF_INPUT and OUTOF_TARGET.  OUTOF_TARGET can be null if the parent
1036    function wants to calculate it itself.
1037
1038    Return true if the shift could be successfully synthesized.  When false
        is returned, some insns may already have been emitted.  */
1039
1040 static bool
1041 expand_doubleword_shift (machine_mode op1_mode, optab binoptab,
1042                          rtx outof_input, rtx into_input, rtx op1,
1043                          rtx outof_target, rtx into_target,
1044                          int unsignedp, enum optab_methods methods,
1045                          unsigned HOST_WIDE_INT shift_mask)
1046 {
1047   rtx superword_op1, tmp, cmp1, cmp2;
1048   enum rtx_code cmp_code;
1049
1050   /* See if word-mode shifts by BITS_PER_WORD...BITS_PER_WORD * 2 - 1 will
1051      fill the result with sign or zero bits as appropriate.  If so, the value
1052      of OUTOF_TARGET will always be (SHIFT OUTOF_INPUT OP1).   Recursively call
1053      this routine to calculate INTO_TARGET (which depends on both OUTOF_INPUT
1054      and INTO_INPUT), then emit code to set up OUTOF_TARGET.
1055
1056      This isn't worthwhile for constant shifts since the optimizers will
1057      cope better with in-range shift counts.  */
1058   if (shift_mask >= BITS_PER_WORD
1059       && outof_target != 0
1060       && !CONSTANT_P (op1))
1061     {
           /* The null OUTOF_TARGET keeps the recursive call out of this
              branch, so the recursion is only one level deep.  */
1062       if (!expand_doubleword_shift (op1_mode, binoptab,
1063                                     outof_input, into_input, op1,
1064                                     0, into_target,
1065                                     unsignedp, methods, shift_mask))
1066         return false;
1067       if (!force_expand_binop (word_mode, binoptab, outof_input, op1,
1068                                outof_target, unsignedp, methods))
1069         return false;
1070       return true;
1071     }
1072
1073   /* Set CMP_CODE, CMP1 and CMP2 so that the rtx (CMP_CODE CMP1 CMP2)
1074      is true when the effective shift value is less than BITS_PER_WORD.
1075      Set SUPERWORD_OP1 to the shift count that should be used to shift
1076      OUTOF_INPUT into INTO_TARGET when the condition is false.  */
1077   tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD, op1_mode), op1_mode);
1078   if (!CONSTANT_P (op1) && shift_mask == BITS_PER_WORD - 1)
1079     {
1080       /* Set CMP1 to OP1 & BITS_PER_WORD.  The result is zero iff OP1
1081          is a subword shift count.  */
1082       cmp1 = simplify_expand_binop (op1_mode, and_optab, op1, tmp,
1083                                     0, true, methods);
1084       cmp2 = CONST0_RTX (op1_mode);
1085       cmp_code = EQ;
1086       superword_op1 = op1;
1087     }
1088   else
1089     {
1090       /* Set CMP1 to OP1 - BITS_PER_WORD.  It is tested for being negative
              and is also used as the superword shift count.  */
1091       cmp1 = simplify_expand_binop (op1_mode, sub_optab, op1, tmp,
1092                                     0, true, methods);
1093       cmp2 = CONST0_RTX (op1_mode);
1094       cmp_code = LT;
1095       superword_op1 = cmp1;
1096     }
       /* The AND or subtraction above could not be expanded.  */
1097   if (cmp1 == 0)
1098     return false;
1099
1100   /* If we can compute the condition at compile time, pick the
1101      appropriate subroutine.  */
1102   tmp = simplify_relational_operation (cmp_code, SImode, op1_mode, cmp1, cmp2);
1103   if (tmp != 0 && CONST_INT_P (tmp))
1104     {
           /* A constant-false condition means a superword shift.  */
1105       if (tmp == const0_rtx)
1106         return expand_superword_shift (binoptab, outof_input, superword_op1,
1107                                        outof_target, into_target,
1108                                        unsignedp, methods);
1109       else
1110         return expand_subword_shift (op1_mode, binoptab,
1111                                      outof_input, into_input, op1,
1112                                      outof_target, into_target,
1113                                      unsignedp, methods, shift_mask);
1114     }
1115
1116 #ifdef HAVE_conditional_move
1117   /* Try using conditional moves to generate straight-line code.  */
1118   {
         /* Remember where we started so a failed attempt can be discarded.  */
1119     rtx_insn *start = get_last_insn ();
1120     if (expand_doubleword_shift_condmove (op1_mode, binoptab,
1121                                           cmp_code, cmp1, cmp2,
1122                                           outof_input, into_input,
1123                                           op1, superword_op1,
1124                                           outof_target, into_target,
1125                                           unsignedp, methods, shift_mask))
1126       return true;
1127     delete_insns_since (start);
1128   }
1129 #endif
1130
1131   /* As a last resort, use branches to select the correct alternative.  */
1132   rtx_code_label *subword_label = gen_label_rtx ();
1133   rtx_code_label *done_label = gen_label_rtx ();
1134
       /* The superword code follows the comparison directly; the subword code
          is placed after SUBWORD_LABEL.  */
1135   NO_DEFER_POP;
1136   do_compare_rtx_and_jump (cmp1, cmp2, cmp_code, false, op1_mode,
1137                            0, 0, subword_label, -1);
1138   OK_DEFER_POP;
1139
1140   if (!expand_superword_shift (binoptab, outof_input, superword_op1,
1141                                outof_target, into_target,
1142                                unsignedp, methods))
1143     return false;
1144
       /* Skip over the subword code once the superword code has run.  */
1145   emit_jump_insn (gen_jump (done_label));
1146   emit_barrier ();
1147   emit_label (subword_label);
1148
1149   if (!expand_subword_shift (op1_mode, binoptab,
1150                              outof_input, into_input, op1,
1151                              outof_target, into_target,
1152                              unsignedp, methods, shift_mask))
1153     return false;
1154
1155   emit_label (done_label);
1156   return true;
1157 }
1158 \f
1159 /* Subroutine of expand_binop.  Perform a double word multiplication of
1160    operands OP0 and OP1 both of mode MODE, which is exactly twice as wide
1161    as the target's word_mode.  This function returns NULL_RTX if anything
1162    goes wrong, in which case it may have already emitted instructions
1163    which need to be deleted.
1164
        UMULP is true if partial product (1) below is to be computed with
        umul_widen_optab, and false if smul_widen_optab is to be used together
        with the sign adjustment described below.  METHODS is passed to the
        shift expansions used for that adjustment.  If TARGET is a register,
        it is offered as the destination of the widening multiply.

1165    If we want to multiply two two-word values and have normal and widening
1166    multiplies of single-word values, we can do this with three smaller
1167    multiplications.
1168
1169    The multiplication proceeds as follows:
1170                                  _______________________
1171                                 [__op0_high_|__op0_low__]
1172                                  _______________________
1173         *                       [__op1_high_|__op1_low__]
1174         _______________________________________________
1175                                  _______________________
1176     (1)                         [__op0_low__*__op1_low__]
1177                      _______________________
1178     (2a)            [__op0_low__*__op1_high_]
1179                      _______________________
1180     (2b)            [__op0_high_*__op1_low__]
1181          _______________________
1182     (3) [__op0_high_*__op1_high_]
1183
1184
1185   This gives a 4-word result.  Since we are only interested in the
1186   lower 2 words, partial result (3) and the upper words of (2a) and
1187   (2b) don't need to be calculated.  Hence (2a) and (2b) can be
1188   calculated using non-widening multiplication.
1189
1190   (1), however, needs to be calculated with an unsigned widening
1191   multiplication.  If this operation is not directly supported we
1192   try using a signed widening multiplication and adjust the result.
1193   This adjustment works as follows:
1194
1195       If both operands are positive then no adjustment is needed.
1196
1197       If the operands have different signs, for example op0_low < 0 and
1198       op1_low >= 0, the instruction treats the most significant bit of
1199       op0_low as a sign bit instead of a bit with significance
1200       2**(BITS_PER_WORD-1), i.e. the instruction multiplies op1_low
1201       with 2**BITS_PER_WORD - op0_low, and two's complements the
1202       result.  Conclusion: We need to add op1_low * 2**BITS_PER_WORD to
1203       the result.
1204
1205       Similarly, if both operands are negative, we need to add
1206       (op0_low + op1_low) * 2**BITS_PER_WORD.
1207
1208       We use a trick to adjust quickly.  We logically shift op0_low right
1209       (op1_low) BITS_PER_WORD-1 steps to get 0 or 1, and add this to
1210       op0_high (op1_high) before it is used to calculate 2b (2a).  If no
1211       logical shift exists, we do an arithmetic right shift and subtract
1212       the 0 or -1.  */
1213
1214 static rtx
1215 expand_doubleword_mult (machine_mode mode, rtx op0, rtx op1, rtx target,
1216                        bool umulp, enum optab_methods methods)
1217 {
       /* Subword indices of the low and high words of a MODE value.  */
1218   int low = (WORDS_BIG_ENDIAN ? 1 : 0);
1219   int high = (WORDS_BIG_ENDIAN ? 0 : 1);
       /* Shift count that isolates the top bit of a word; only needed when
          the signed widening multiply is used.  */
1220   rtx wordm1 = umulp ? NULL_RTX : GEN_INT (BITS_PER_WORD - 1);
1221   rtx product, adjust, product_high, temp;
1222
1223   rtx op0_high = operand_subword_force (op0, high, mode);
1224   rtx op0_low = operand_subword_force (op0, low, mode);
1225   rtx op1_high = operand_subword_force (op1, high, mode);
1226   rtx op1_low = operand_subword_force (op1, low, mode);
1227
1228   /* If we're using an unsigned multiply to directly compute the product
1229      of the low-order words of the operands and perform any required
1230      adjustments of the operands, we begin by trying two more multiplications
1231      and then computing the appropriate sum.
1232
1233      We have checked above that the required addition is provided.
1234      Full-word addition will normally always succeed, especially if
1235      it is provided at all, so we don't worry about its failure.  The
1236      multiplication may well fail, however, so we do handle that.  */
1237
1238   if (!umulp)
1239     {
           /* Fold the top bit of OP0_LOW into OP0_HIGH: add the 0 or 1 from
              a logical shift, or else subtract the 0 or -1 from an arithmetic
              shift.  */
1240       /* ??? This could be done with emit_store_flag where available.  */
1241       temp = expand_binop (word_mode, lshr_optab, op0_low, wordm1,
1242                            NULL_RTX, 1, methods);
1243       if (temp)
1244         op0_high = expand_binop (word_mode, add_optab, op0_high, temp,
1245                                  NULL_RTX, 0, OPTAB_DIRECT);
1246       else
1247         {
1248           temp = expand_binop (word_mode, ashr_optab, op0_low, wordm1,
1249                                NULL_RTX, 0, methods);
1250           if (!temp)
1251             return NULL_RTX;
1252           op0_high = expand_binop (word_mode, sub_optab, op0_high, temp,
1253                                    NULL_RTX, 0, OPTAB_DIRECT);
1254         }
1255
1256       if (!op0_high)
1257         return NULL_RTX;
1258     }
1259
       /* Partial product (2b): (possibly adjusted) OP0_HIGH times OP1_LOW.  */
1260   adjust = expand_binop (word_mode, smul_optab, op0_high, op1_low,
1261                          NULL_RTX, 0, OPTAB_DIRECT);
1262   if (!adjust)
1263     return NULL_RTX;
1264
1265   /* OP0_HIGH should now be dead.  */
1266
1267   if (!umulp)
1268     {
           /* Same adjustment as above, with the roles of OP0 and OP1 swapped.  */
1269       /* ??? This could be done with emit_store_flag where available.  */
1270       temp = expand_binop (word_mode, lshr_optab, op1_low, wordm1,
1271                            NULL_RTX, 1, methods);
1272       if (temp)
1273         op1_high = expand_binop (word_mode, add_optab, op1_high, temp,
1274                                  NULL_RTX, 0, OPTAB_DIRECT);
1275       else
1276         {
1277           temp = expand_binop (word_mode, ashr_optab, op1_low, wordm1,
1278                                NULL_RTX, 0, methods);
1279           if (!temp)
1280             return NULL_RTX;
1281           op1_high = expand_binop (word_mode, sub_optab, op1_high, temp,
1282                                    NULL_RTX, 0, OPTAB_DIRECT);
1283         }
1284
1285       if (!op1_high)
1286         return NULL_RTX;
1287     }
1288
       /* Partial product (2a): (possibly adjusted) OP1_HIGH times OP0_LOW.  */
1289   temp = expand_binop (word_mode, smul_optab, op1_high, op0_low,
1290                        NULL_RTX, 0, OPTAB_DIRECT);
1291   if (!temp)
1292     return NULL_RTX;
1293
1294   /* OP1_HIGH should now be dead.  */
1295
       /* Sum of the two cross products.  As explained above, the result of
          this addition is not checked for failure.  */
1296   adjust = expand_binop (word_mode, add_optab, adjust, temp,
1297                          NULL_RTX, 0, OPTAB_DIRECT);
1298
       /* Only offer TARGET to the widening multiply if it is a register.  */
1299   if (target && !REG_P (target))
1300     target = NULL_RTX;
1301
       /* Partial product (1): the full doubleword product of the low words.  */
1302   if (umulp)
1303     product = expand_binop (mode, umul_widen_optab, op0_low, op1_low,
1304                             target, 1, OPTAB_DIRECT);
1305   else
1306     product = expand_binop (mode, smul_widen_optab, op0_low, op1_low,
1307                             target, 1, OPTAB_DIRECT);
1308
1309   if (!product)
1310     return NULL_RTX;
1311
       /* Add the cross products into the high word of PRODUCT in place.  */
1312   product_high = operand_subword (product, high, 1, mode);
1313   adjust = expand_binop (word_mode, add_optab, product_high, adjust,
1314                          NULL_RTX, 0, OPTAB_DIRECT);
1315   emit_move_insn (product_high, adjust);
1316   return product;
1317 }
1318 \f
1319 /* Convenience entry point for expand_binop: the operation is named by
1320    the rtx code CODE rather than by an optab.  CODE must have an optab
1321    (this is asserted); the remaining arguments are passed through.  */
1322 rtx
1323 expand_simple_binop (machine_mode mode, enum rtx_code code, rtx op0,
1324                      rtx op1, rtx target, int unsignedp,
1325                      enum optab_methods methods)
1326 {
1327   optab op = code_to_optab (code);
1328
1329   gcc_assert (op);
1330   return expand_binop (mode, op, op0, op1, target, unsignedp, methods);
1331 }
1332
1333 /* Decide whether the operands OP0 and OP1 of a commutative binop should
1334    trade places.  commutative_operand_precedence ranks them first; ties
1335    are broken in favor of having TARGET, or else a register, come first.  */
1336 static bool
1337 swap_commutative_operands_with_target (rtx target, rtx op0, rtx op1)
1338 {
1339   int prec0 = commutative_operand_precedence (op0);
1340   int prec1 = commutative_operand_precedence (op1);
1341
1342   /* Distinct precedences settle it: swap iff OP1 ranks above OP0.  */
1343   if (prec0 != prec1)
1344     return prec0 < prec1;
1345
1346   /* Equal precedence and a TARGET that is neither null nor a REG:
1347      swap only when rtx_equal_p says OP1 matches TARGET.  */
1348   if (target != 0 && !REG_P (target))
1349     return rtx_equal_p (op1, target);
1350
1351   /* Otherwise swap when OP1 is TARGET itself, or when doing so moves a
1352      register in front of a non-register.  */
1353   return target == op1 || (REG_P (op1) && !REG_P (op0));
1354 }
1355
1356 /* Return true if BINOPTAB implements a shift operation, i.e. if its
1357    rtx code is one of the shift or rotate codes tested below.  */
1358
1359 static bool
1360 shift_optab_p (optab binoptab)
1361 {
1362   const enum rtx_code code = optab_to_code (binoptab);
1363
1364   /* Left-shift codes.  */
1365   if (code == ASHIFT || code == SS_ASHIFT || code == US_ASHIFT)
1366     return true;
1367
1368   /* Right-shift codes.  */
1369   if (code == ASHIFTRT || code == LSHIFTRT)
1370     return true;
1371
1372   /* Rotates are treated as shifts as well; anything else is not one.  */
1373   return (code == ROTATE
1374           || code == ROTATERT);
1375 }
1376
1377 /* Return true if BINOPTAB implements a commutative binary operation:
1378    an RTX_COMM_ARITH code, or a widening or highpart multiply.  */
1379 static bool
1380 commutative_optab_p (optab binoptab)
1381 {
1382   if (GET_RTX_CLASS (optab_to_code (binoptab)) == RTX_COMM_ARITH)
1383     return true;
1384   return (binoptab == smul_widen_optab || binoptab == umul_widen_optab
1385           || binoptab == smul_highpart_optab
1386           || binoptab == umul_highpart_optab);
1387 }
1388
1389 /* X is about to become operand OPN of BINOPTAB in mode MODE.  When
1390    optimizing, if X is a constant whose rtx_cost in that position exceeds
1391    its set_src_cost, return a register of mode MODE holding it instead.
1392    In every other case return X unchanged.  UNSIGNEDP says whether X is
1393    unsigned, and is used when a non-CONST_INT constant is converted.  */
1394 static rtx
1395 avoid_expensive_constant (machine_mode mode, optab binoptab,
1396                           int opn, rtx x, bool unsignedp)
1397 {
1398   bool speed = optimize_insn_for_speed_p ();
1399
1400   /* Nothing to do unless we are optimizing and X is a constant with a mode.  */
1401   if (mode == VOIDmode || !optimize || !CONSTANT_P (x))
1402     return x;
1403   /* Cheap enough to stay where it is.  */
1404   if (rtx_cost (x, optab_to_code (binoptab), opn, speed)
1405       <= set_src_cost (x, speed))
1406     return x;
1407   /* Bring the constant into MODE before loading it into a register.  */
1408   if (!CONST_INT_P (x))
1409     x = convert_modes (mode, VOIDmode, x, unsignedp);
1410   else
1411     {
1412       HOST_WIDE_INT truncated = trunc_int_for_mode (INTVAL (x), mode);
1413       if (truncated != INTVAL (x))
1414         x = GEN_INT (truncated);
1415     }
1416   return force_reg (mode, x);
1417 }
1418
1419 /* Helper function for expand_binop: handle the case where there
1420    is an insn that directly implements the indicated operation.
1421    Returns null if this is not possible.

        MODE, BINOPTAB, OP0, OP1, TARGET, UNSIGNEDP and METHODS are as for
        expand_binop.  LAST is the insn to delete back to when the attempt
        fails: everything emitted after it is removed before null is
        returned.  */
1422 static rtx
1423 expand_binop_directly (machine_mode mode, optab binoptab,
1424                        rtx op0, rtx op1,
1425                        rtx target, int unsignedp, enum optab_methods methods,
1426                        rtx_insn *last)
1427 {
1428   machine_mode from_mode = widened_mode (mode, op0, op1);
1429   enum insn_code icode = find_widening_optab_handler (binoptab, mode,
1430                                                       from_mode, 1);
       /* Modes the insn pattern wants for its two input operands.  */
1431   machine_mode xmode0 = insn_data[(int) icode].operand[1].mode;
1432   machine_mode xmode1 = insn_data[(int) icode].operand[2].mode;
1433   machine_mode mode0, mode1, tmp_mode;
1434   struct expand_operand ops[3];
1435   bool commutative_p;
1436   rtx pat;
1437   rtx xop0 = op0, xop1 = op1;
1438   rtx swap;
1439
1440   /* If it is a commutative operator and the modes would match
1441      if we would swap the operands, we can save the conversions.
          That is the case when neither operand has the mode its own slot
          wants but each has the mode the other slot wants.  */
1442   commutative_p = commutative_optab_p (binoptab);
1443   if (commutative_p
1444       && GET_MODE (xop0) != xmode0 && GET_MODE (xop1) != xmode1
1445       && GET_MODE (xop0) == xmode1 && GET_MODE (xop1) == xmode0)
1446     {
1447       swap = xop0;
1448       xop0 = xop1;
1449       xop1 = swap;
1450     }
1451
1452   /* If we are optimizing, force expensive constants into a register.  */
1453   xop0 = avoid_expensive_constant (xmode0, binoptab, 0, xop0, unsignedp);
1454   if (!shift_optab_p (binoptab))
1455     xop1 = avoid_expensive_constant (xmode1, binoptab, 1, xop1, unsignedp);
1456
1457   /* In case the insn wants input operands in modes different from
1458      those of the actual operands, convert the operands.  It would
1459      seem that we don't need to convert CONST_INTs, but we do, so
1460      that they're properly zero-extended, sign-extended or truncated
1461      for their mode.  */
1462
1463   mode0 = GET_MODE (xop0) != VOIDmode ? GET_MODE (xop0) : mode;
1464   if (xmode0 != VOIDmode && xmode0 != mode0)
1465     {
1466       xop0 = convert_modes (xmode0, mode0, xop0, unsignedp);
1467       mode0 = xmode0;
1468     }
1469
1470   mode1 = GET_MODE (xop1) != VOIDmode ? GET_MODE (xop1) : mode;
1471   if (xmode1 != VOIDmode && xmode1 != mode1)
1472     {
1473       xop1 = convert_modes (xmode1, mode1, xop1, unsignedp);
1474       mode1 = xmode1;
1475     }
1476
1477   /* If operation is commutative,
1478      try to make the first operand a register.
1479      Even better, try to make it the same as the target.
1480      Also try to make the last operand a constant.  */
1481   if (commutative_p
1482       && swap_commutative_operands_with_target (target, xop0, xop1))
1483     {
1484       swap = xop1;
1485       xop1 = xop0;
1486       xop0 = swap;
1487     }
1488
1489   /* Now, if insn's predicates don't allow our operands, put them into
1490      pseudo regs.  */
1491
1492   if (binoptab == vec_pack_trunc_optab
1493       || binoptab == vec_pack_usat_optab
1494       || binoptab == vec_pack_ssat_optab
1495       || binoptab == vec_pack_ufix_trunc_optab
1496       || binoptab == vec_pack_sfix_trunc_optab)
1497     {
1498       /* The mode of the result is different than the mode of the
1499          arguments.  Give up unless the result has exactly twice as many
              units as MODE.  */
1500       tmp_mode = insn_data[(int) icode].operand[0].mode;
1501       if (GET_MODE_NUNITS (tmp_mode) != 2 * GET_MODE_NUNITS (mode))
1502         {
1503           delete_insns_since (last);
1504           return NULL_RTX;
1505         }
1506     }
1507   else
1508     tmp_mode = mode;
1509
1510   create_output_operand (&ops[0], target, tmp_mode);
1511   create_input_operand (&ops[1], xop0, mode0);
1512   create_input_operand (&ops[2], xop1, mode1);
1513   pat = maybe_gen_insn (icode, 3, ops);
1514   if (pat)
1515     {
1516       /* If PAT is composed of more than one insn, try to add an appropriate
1517          REG_EQUAL note to it.  If we can't because the output operand
1518          conflicts with an operand, call expand_binop again, this time
              without a target.  */
1519       if (INSN_P (pat) && NEXT_INSN (as_a <rtx_insn *> (pat)) != NULL_RTX
1520           && ! add_equal_note (as_a <rtx_insn *> (pat), ops[0].value,
1521                                optab_to_code (binoptab),
1522                                ops[1].value, ops[2].value))
1523         {
1524           delete_insns_since (last);
1525           return expand_binop (mode, binoptab, op0, op1, NULL_RTX,
1526                                unsignedp, methods);
1527         }
1528
1529       emit_insn (pat);
1530       return ops[0].value;
1531     }
       /* No insn could be generated: discard anything emitted since LAST.  */
1532   delete_insns_since (last);
1533   return NULL_RTX;
1534 }
1535
1536 /* Generate code to perform an operation specified by BINOPTAB
1537    on operands OP0 and OP1, with result having machine-mode MODE.
1538
1539    UNSIGNEDP is for the case where we have to widen the operands
1540    to perform the operation.  It says to use zero-extension.
1541
1542    If TARGET is nonzero, the value
1543    is generated there, if it is convenient to do so.
1544    In all cases an rtx is returned for the locus of the value;
1545    this may or may not be TARGET.  */
1546
1547 rtx
1548 expand_binop (machine_mode mode, optab binoptab, rtx op0, rtx op1,
1549               rtx target, int unsignedp, enum optab_methods methods)
1550 {
1551   enum optab_methods next_methods
1552     = (methods == OPTAB_LIB || methods == OPTAB_LIB_WIDEN
1553        ? OPTAB_WIDEN : methods);
1554   enum mode_class mclass;
1555   machine_mode wider_mode;
1556   rtx libfunc;
1557   rtx temp;
1558   rtx_insn *entry_last = get_last_insn ();
1559   rtx_insn *last;
1560
1561   mclass = GET_MODE_CLASS (mode);
1562
1563   /* If subtracting an integer constant, convert this into an addition of
1564      the negated constant.  */
1565
1566   if (binoptab == sub_optab && CONST_INT_P (op1))
1567     {
1568       op1 = negate_rtx (mode, op1);
1569       binoptab = add_optab;
1570     }
1571
1572   /* Record where to delete back to if we backtrack.  */
1573   last = get_last_insn ();
1574
1575   /* If we can do it with a three-operand insn, do so.  */
1576
1577   if (methods != OPTAB_MUST_WIDEN
1578       && find_widening_optab_handler (binoptab, mode,
1579                                       widened_mode (mode, op0, op1), 1)
1580             != CODE_FOR_nothing)
1581     {
1582       temp = expand_binop_directly (mode, binoptab, op0, op1, target,
1583                                     unsignedp, methods, last);
1584       if (temp)
1585         return temp;
1586     }
1587
1588   /* If we were trying to rotate, and that didn't work, try rotating
1589      the other direction before falling back to shifts and bitwise-or.  */
1590   if (((binoptab == rotl_optab
1591         && optab_handler (rotr_optab, mode) != CODE_FOR_nothing)
1592        || (binoptab == rotr_optab
1593            && optab_handler (rotl_optab, mode) != CODE_FOR_nothing))
1594       && mclass == MODE_INT)
1595     {
1596       optab otheroptab = (binoptab == rotl_optab ? rotr_optab : rotl_optab);
1597       rtx newop1;
1598       unsigned int bits = GET_MODE_PRECISION (mode);
1599
1600       if (CONST_INT_P (op1))
1601         newop1 = GEN_INT (bits - INTVAL (op1));
1602       else if (targetm.shift_truncation_mask (mode) == bits - 1)
1603         newop1 = negate_rtx (GET_MODE (op1), op1);
1604       else
1605         newop1 = expand_binop (GET_MODE (op1), sub_optab,
1606                                gen_int_mode (bits, GET_MODE (op1)), op1,
1607                                NULL_RTX, unsignedp, OPTAB_DIRECT);
1608
1609       temp = expand_binop_directly (mode, otheroptab, op0, newop1,
1610                                     target, unsignedp, methods, last);
1611       if (temp)
1612         return temp;
1613     }
1614
1615   /* If this is a multiply, see if we can do a widening operation that
1616      takes operands of this mode and makes a wider mode.  */
1617
1618   if (binoptab == smul_optab
1619       && GET_MODE_2XWIDER_MODE (mode) != VOIDmode
1620       && (widening_optab_handler ((unsignedp ? umul_widen_optab
1621                                              : smul_widen_optab),
1622                                   GET_MODE_2XWIDER_MODE (mode), mode)
1623           != CODE_FOR_nothing))
1624     {
1625       temp = expand_binop (GET_MODE_2XWIDER_MODE (mode),
1626                            unsignedp ? umul_widen_optab : smul_widen_optab,
1627                            op0, op1, NULL_RTX, unsignedp, OPTAB_DIRECT);
1628
1629       if (temp != 0)
1630         {
1631           if (GET_MODE_CLASS (mode) == MODE_INT
1632               && TRULY_NOOP_TRUNCATION_MODES_P (mode, GET_MODE (temp)))
1633             return gen_lowpart (mode, temp);
1634           else
1635             return convert_to_mode (mode, temp, unsignedp);
1636         }
1637     }
1638
1639   /* If this is a vector shift by a scalar, see if we can do a vector
1640      shift by a vector.  If so, broadcast the scalar into a vector.  */
1641   if (mclass == MODE_VECTOR_INT)
1642     {
1643       optab otheroptab = unknown_optab;
1644
1645       if (binoptab == ashl_optab)
1646         otheroptab = vashl_optab;
1647       else if (binoptab == ashr_optab)
1648         otheroptab = vashr_optab;
1649       else if (binoptab == lshr_optab)
1650         otheroptab = vlshr_optab;
1651       else if (binoptab == rotl_optab)
1652         otheroptab = vrotl_optab;
1653       else if (binoptab == rotr_optab)
1654         otheroptab = vrotr_optab;
1655
1656       if (otheroptab && optab_handler (otheroptab, mode) != CODE_FOR_nothing)
1657         {
1658           rtx vop1 = expand_vector_broadcast (mode, op1);
1659           if (vop1)
1660             {
1661               temp = expand_binop_directly (mode, otheroptab, op0, vop1,
1662                                             target, unsignedp, methods, last);
1663               if (temp)
1664                 return temp;
1665             }
1666         }
1667     }
1668
1669   /* Look for a wider mode of the same class for which we think we
1670      can open-code the operation.  Check for a widening multiply at the
1671      wider mode as well.  */
1672
1673   if (CLASS_HAS_WIDER_MODES_P (mclass)
1674       && methods != OPTAB_DIRECT && methods != OPTAB_LIB)
1675     for (wider_mode = GET_MODE_WIDER_MODE (mode);
1676          wider_mode != VOIDmode;
1677          wider_mode = GET_MODE_WIDER_MODE (wider_mode))
1678       {
1679         if (optab_handler (binoptab, wider_mode) != CODE_FOR_nothing
1680             || (binoptab == smul_optab
1681                 && GET_MODE_WIDER_MODE (wider_mode) != VOIDmode
1682                 && (find_widening_optab_handler ((unsignedp
1683                                                   ? umul_widen_optab
1684                                                   : smul_widen_optab),
1685                                                  GET_MODE_WIDER_MODE (wider_mode),
1686                                                  mode, 0)
1687                     != CODE_FOR_nothing)))
1688           {
1689             rtx xop0 = op0, xop1 = op1;
1690             int no_extend = 0;
1691
1692             /* For certain integer operations, we need not actually extend
1693                the narrow operands, as long as we will truncate
1694                the results to the same narrowness.  */
1695
1696             if ((binoptab == ior_optab || binoptab == and_optab
1697                  || binoptab == xor_optab
1698                  || binoptab == add_optab || binoptab == sub_optab
1699                  || binoptab == smul_optab || binoptab == ashl_optab)
1700                 && mclass == MODE_INT)
1701               {
1702                 no_extend = 1;
1703                 xop0 = avoid_expensive_constant (mode, binoptab, 0,
1704                                                  xop0, unsignedp);
1705                 if (binoptab != ashl_optab)
1706                   xop1 = avoid_expensive_constant (mode, binoptab, 1,
1707                                                    xop1, unsignedp);
1708               }
1709
1710             xop0 = widen_operand (xop0, wider_mode, mode, unsignedp, no_extend);
1711
1712             /* The second operand of a shift must always be extended.  */
1713             xop1 = widen_operand (xop1, wider_mode, mode, unsignedp,
1714                                   no_extend && binoptab != ashl_optab);
1715
1716             temp = expand_binop (wider_mode, binoptab, xop0, xop1, NULL_RTX,
1717                                  unsignedp, OPTAB_DIRECT);
1718             if (temp)
1719               {
1720                 if (mclass != MODE_INT
1721                     || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
1722                   {
1723                     if (target == 0)
1724                       target = gen_reg_rtx (mode);
1725                     convert_move (target, temp, 0);
1726                     return target;
1727                   }
1728                 else
1729                   return gen_lowpart (mode, temp);
1730               }
1731             else
1732               delete_insns_since (last);
1733           }
1734       }
1735
1736   /* If operation is commutative,
1737      try to make the first operand a register.
1738      Even better, try to make it the same as the target.
1739      Also try to make the last operand a constant.  */
1740   if (commutative_optab_p (binoptab)
1741       && swap_commutative_operands_with_target (target, op0, op1))
1742     {
1743       temp = op1;
1744       op1 = op0;
1745       op0 = temp;
1746     }
1747
1748   /* These can be done a word at a time.  */
1749   if ((binoptab == and_optab || binoptab == ior_optab || binoptab == xor_optab)
1750       && mclass == MODE_INT
1751       && GET_MODE_SIZE (mode) > UNITS_PER_WORD
1752       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing)
1753     {
1754       int i;
1755       rtx_insn *insns;
1756
1757       /* If TARGET is the same as one of the operands, the REG_EQUAL note
1758          won't be accurate, so use a new target.  */
1759       if (target == 0
1760           || target == op0
1761           || target == op1
1762           || !valid_multiword_target_p (target))
1763         target = gen_reg_rtx (mode);
1764
1765       start_sequence ();
1766
1767       /* Do the actual arithmetic.  */
1768       for (i = 0; i < GET_MODE_BITSIZE (mode) / BITS_PER_WORD; i++)
1769         {
1770           rtx target_piece = operand_subword (target, i, 1, mode);
1771           rtx x = expand_binop (word_mode, binoptab,
1772                                 operand_subword_force (op0, i, mode),
1773                                 operand_subword_force (op1, i, mode),
1774                                 target_piece, unsignedp, next_methods);
1775
1776           if (x == 0)
1777             break;
1778
1779           if (target_piece != x)
1780             emit_move_insn (target_piece, x);
1781         }
1782
1783       insns = get_insns ();
1784       end_sequence ();
1785
1786       if (i == GET_MODE_BITSIZE (mode) / BITS_PER_WORD)
1787         {
1788           emit_insn (insns);
1789           return target;
1790         }
1791     }
1792
1793   /* Synthesize double word shifts from single word shifts.  */
1794   if ((binoptab == lshr_optab || binoptab == ashl_optab
1795        || binoptab == ashr_optab)
1796       && mclass == MODE_INT
1797       && (CONST_INT_P (op1) || optimize_insn_for_speed_p ())
1798       && GET_MODE_SIZE (mode) == 2 * UNITS_PER_WORD
1799       && GET_MODE_PRECISION (mode) == GET_MODE_BITSIZE (mode)
1800       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing
1801       && optab_handler (ashl_optab, word_mode) != CODE_FOR_nothing
1802       && optab_handler (lshr_optab, word_mode) != CODE_FOR_nothing)
1803     {
1804       unsigned HOST_WIDE_INT shift_mask, double_shift_mask;
1805       machine_mode op1_mode;
1806
1807       double_shift_mask = targetm.shift_truncation_mask (mode);
1808       shift_mask = targetm.shift_truncation_mask (word_mode);
1809       op1_mode = GET_MODE (op1) != VOIDmode ? GET_MODE (op1) : word_mode;
1810
1811       /* Apply the truncation to constant shifts.  */
1812       if (double_shift_mask > 0 && CONST_INT_P (op1))
1813         op1 = GEN_INT (INTVAL (op1) & double_shift_mask);
1814
1815       if (op1 == CONST0_RTX (op1_mode))
1816         return op0;
1817
1818       /* Make sure that this is a combination that expand_doubleword_shift
1819          can handle.  See the comments there for details.  */
1820       if (double_shift_mask == 0
1821           || (shift_mask == BITS_PER_WORD - 1
1822               && double_shift_mask == BITS_PER_WORD * 2 - 1))
1823         {
1824           rtx_insn *insns;
1825           rtx into_target, outof_target;
1826           rtx into_input, outof_input;
1827           int left_shift, outof_word;
1828
1829           /* If TARGET is the same as one of the operands, the REG_EQUAL note
1830              won't be accurate, so use a new target.  */
1831           if (target == 0
1832               || target == op0
1833               || target == op1
1834               || !valid_multiword_target_p (target))
1835             target = gen_reg_rtx (mode);
1836
1837           start_sequence ();
1838
1839           /* OUTOF_* is the word we are shifting bits away from, and
1840              INTO_* is the word that we are shifting bits towards, thus
1841              they differ depending on the direction of the shift and
1842              WORDS_BIG_ENDIAN.  */
1843
1844           left_shift = binoptab == ashl_optab;
1845           outof_word = left_shift ^ ! WORDS_BIG_ENDIAN;
1846
1847           outof_target = operand_subword (target, outof_word, 1, mode);
1848           into_target = operand_subword (target, 1 - outof_word, 1, mode);
1849
1850           outof_input = operand_subword_force (op0, outof_word, mode);
1851           into_input = operand_subword_force (op0, 1 - outof_word, mode);
1852
1853           if (expand_doubleword_shift (op1_mode, binoptab,
1854                                        outof_input, into_input, op1,
1855                                        outof_target, into_target,
1856                                        unsignedp, next_methods, shift_mask))
1857             {
1858               insns = get_insns ();
1859               end_sequence ();
1860
1861               emit_insn (insns);
1862               return target;
1863             }
1864           end_sequence ();
1865         }
1866     }
1867
1868   /* Synthesize double word rotates from single word shifts.  */
1869   if ((binoptab == rotl_optab || binoptab == rotr_optab)
1870       && mclass == MODE_INT
1871       && CONST_INT_P (op1)
1872       && GET_MODE_PRECISION (mode) == 2 * BITS_PER_WORD
1873       && optab_handler (ashl_optab, word_mode) != CODE_FOR_nothing
1874       && optab_handler (lshr_optab, word_mode) != CODE_FOR_nothing)
1875     {
1876       rtx_insn *insns;
1877       rtx into_target, outof_target;
1878       rtx into_input, outof_input;
1879       rtx inter;
1880       int shift_count, left_shift, outof_word;
1881
1882       /* If TARGET is the same as one of the operands, the REG_EQUAL note
1883          won't be accurate, so use a new target. Do this also if target is not
1884          a REG, first because having a register instead may open optimization
1885          opportunities, and second because if target and op0 happen to be MEMs
1886          designating the same location, we would risk clobbering it too early
1887          in the code sequence we generate below.  */
1888       if (target == 0
1889           || target == op0
1890           || target == op1
1891           || !REG_P (target)
1892           || !valid_multiword_target_p (target))
1893         target = gen_reg_rtx (mode);
1894
1895       start_sequence ();
1896
1897       shift_count = INTVAL (op1);
1898
1899       /* OUTOF_* is the word we are shifting bits away from, and
1900          INTO_* is the word that we are shifting bits towards, thus
1901          they differ depending on the direction of the shift and
1902          WORDS_BIG_ENDIAN.  */
1903
1904       left_shift = (binoptab == rotl_optab);
1905       outof_word = left_shift ^ ! WORDS_BIG_ENDIAN;
1906
1907       outof_target = operand_subword (target, outof_word, 1, mode);
1908       into_target = operand_subword (target, 1 - outof_word, 1, mode);
1909
1910       outof_input = operand_subword_force (op0, outof_word, mode);
1911       into_input = operand_subword_force (op0, 1 - outof_word, mode);
1912
1913       if (shift_count == BITS_PER_WORD)
1914         {
1915           /* This is just a word swap.  */
1916           emit_move_insn (outof_target, into_input);
1917           emit_move_insn (into_target, outof_input);
1918           inter = const0_rtx;
1919         }
1920       else
1921         {
1922           rtx into_temp1, into_temp2, outof_temp1, outof_temp2;
1923           rtx first_shift_count, second_shift_count;
1924           optab reverse_unsigned_shift, unsigned_shift;
1925
1926           reverse_unsigned_shift = (left_shift ^ (shift_count < BITS_PER_WORD)
1927                                     ? lshr_optab : ashl_optab);
1928
1929           unsigned_shift = (left_shift ^ (shift_count < BITS_PER_WORD)
1930                             ? ashl_optab : lshr_optab);
1931
1932           if (shift_count > BITS_PER_WORD)
1933             {
1934               first_shift_count = GEN_INT (shift_count - BITS_PER_WORD);
1935               second_shift_count = GEN_INT (2 * BITS_PER_WORD - shift_count);
1936             }
1937           else
1938             {
1939               first_shift_count = GEN_INT (BITS_PER_WORD - shift_count);
1940               second_shift_count = GEN_INT (shift_count);
1941             }
1942
1943           into_temp1 = expand_binop (word_mode, unsigned_shift,
1944                                      outof_input, first_shift_count,
1945                                      NULL_RTX, unsignedp, next_methods);
1946           into_temp2 = expand_binop (word_mode, reverse_unsigned_shift,
1947                                      into_input, second_shift_count,
1948                                      NULL_RTX, unsignedp, next_methods);
1949
1950           if (into_temp1 != 0 && into_temp2 != 0)
1951             inter = expand_binop (word_mode, ior_optab, into_temp1, into_temp2,
1952                                   into_target, unsignedp, next_methods);
1953           else
1954             inter = 0;
1955
1956           if (inter != 0 && inter != into_target)
1957             emit_move_insn (into_target, inter);
1958
1959           outof_temp1 = expand_binop (word_mode, unsigned_shift,
1960                                       into_input, first_shift_count,
1961                                       NULL_RTX, unsignedp, next_methods);
1962           outof_temp2 = expand_binop (word_mode, reverse_unsigned_shift,
1963                                       outof_input, second_shift_count,
1964                                       NULL_RTX, unsignedp, next_methods);
1965
1966           if (inter != 0 && outof_temp1 != 0 && outof_temp2 != 0)
1967             inter = expand_binop (word_mode, ior_optab,
1968                                   outof_temp1, outof_temp2,
1969                                   outof_target, unsignedp, next_methods);
1970
1971           if (inter != 0 && inter != outof_target)
1972             emit_move_insn (outof_target, inter);
1973         }
1974
1975       insns = get_insns ();
1976       end_sequence ();
1977
1978       if (inter != 0)
1979         {
1980           emit_insn (insns);
1981           return target;
1982         }
1983     }
1984
1985   /* These can be done a word at a time by propagating carries.  */
1986   if ((binoptab == add_optab || binoptab == sub_optab)
1987       && mclass == MODE_INT
1988       && GET_MODE_SIZE (mode) >= 2 * UNITS_PER_WORD
1989       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing)
1990     {
1991       unsigned int i;
1992       optab otheroptab = binoptab == add_optab ? sub_optab : add_optab;
1993       const unsigned int nwords = GET_MODE_BITSIZE (mode) / BITS_PER_WORD;
1994       rtx carry_in = NULL_RTX, carry_out = NULL_RTX;
1995       rtx xop0, xop1, xtarget;
1996
1997       /* We can handle either a 1 or -1 value for the carry.  If STORE_FLAG
1998          value is one of those, use it.  Otherwise, use 1 since it is the
1999          one easiest to get.  */
2000 #if STORE_FLAG_VALUE == 1 || STORE_FLAG_VALUE == -1
2001       int normalizep = STORE_FLAG_VALUE;
2002 #else
2003       int normalizep = 1;
2004 #endif
2005
2006       /* Prepare the operands.  */
2007       xop0 = force_reg (mode, op0);
2008       xop1 = force_reg (mode, op1);
2009
2010       xtarget = gen_reg_rtx (mode);
2011
2012       if (target == 0 || !REG_P (target) || !valid_multiword_target_p (target))
2013         target = xtarget;
2014
2015       /* Indicate for flow that the entire target reg is being set.  */
2016       if (REG_P (target))
2017         emit_clobber (xtarget);
2018
2019       /* Do the actual arithmetic.  */
2020       for (i = 0; i < nwords; i++)
2021         {
2022           int index = (WORDS_BIG_ENDIAN ? nwords - i - 1 : i);
2023           rtx target_piece = operand_subword (xtarget, index, 1, mode);
2024           rtx op0_piece = operand_subword_force (xop0, index, mode);
2025           rtx op1_piece = operand_subword_force (xop1, index, mode);
2026           rtx x;
2027
2028           /* Main add/subtract of the input operands.  */
2029           x = expand_binop (word_mode, binoptab,
2030                             op0_piece, op1_piece,
2031                             target_piece, unsignedp, next_methods);
2032           if (x == 0)
2033             break;
2034
2035           if (i + 1 < nwords)
2036             {
2037               /* Store carry from main add/subtract.  */
2038               carry_out = gen_reg_rtx (word_mode);
2039               carry_out = emit_store_flag_force (carry_out,
2040                                                  (binoptab == add_optab
2041                                                   ? LT : GT),
2042                                                  x, op0_piece,
2043                                                  word_mode, 1, normalizep);
2044             }
2045
2046           if (i > 0)
2047             {
2048               rtx newx;
2049
2050               /* Add/subtract previous carry to main result.  */
2051               newx = expand_binop (word_mode,
2052                                    normalizep == 1 ? binoptab : otheroptab,
2053                                    x, carry_in,
2054                                    NULL_RTX, 1, next_methods);
2055
2056               if (i + 1 < nwords)
2057                 {
2058                   /* Get out carry from adding/subtracting carry in.  */
2059                   rtx carry_tmp = gen_reg_rtx (word_mode);
2060                   carry_tmp = emit_store_flag_force (carry_tmp,
2061                                                      (binoptab == add_optab
2062                                                       ? LT : GT),
2063                                                      newx, x,
2064                                                      word_mode, 1, normalizep);
2065
2066                   /* Logical-ior the two poss. carry together.  */
2067                   carry_out = expand_binop (word_mode, ior_optab,
2068                                             carry_out, carry_tmp,
2069                                             carry_out, 0, next_methods);
2070                   if (carry_out == 0)
2071                     break;
2072                 }
2073               emit_move_insn (target_piece, newx);
2074             }
2075           else
2076             {
2077               if (x != target_piece)
2078                 emit_move_insn (target_piece, x);
2079             }
2080
2081           carry_in = carry_out;
2082         }
2083
2084       if (i == GET_MODE_BITSIZE (mode) / (unsigned) BITS_PER_WORD)
2085         {
2086           if (optab_handler (mov_optab, mode) != CODE_FOR_nothing
2087               || ! rtx_equal_p (target, xtarget))
2088             {
2089               rtx temp = emit_move_insn (target, xtarget);
2090
2091               set_dst_reg_note (temp, REG_EQUAL,
2092                                 gen_rtx_fmt_ee (optab_to_code (binoptab),
2093                                                 mode, copy_rtx (xop0),
2094                                                 copy_rtx (xop1)),
2095                                 target);
2096             }
2097           else
2098             target = xtarget;
2099
2100           return target;
2101         }
2102
2103       else
2104         delete_insns_since (last);
2105     }
2106
2107   /* Attempt to synthesize double word multiplies using a sequence of word
2108      mode multiplications.  We first attempt to generate a sequence using a
2109      more efficient unsigned widening multiply, and if that fails we then
2110      try using a signed widening multiply.  */
2111
2112   if (binoptab == smul_optab
2113       && mclass == MODE_INT
2114       && GET_MODE_SIZE (mode) == 2 * UNITS_PER_WORD
2115       && optab_handler (smul_optab, word_mode) != CODE_FOR_nothing
2116       && optab_handler (add_optab, word_mode) != CODE_FOR_nothing)
2117     {
2118       rtx product = NULL_RTX;
2119       if (widening_optab_handler (umul_widen_optab, mode, word_mode)
2120             != CODE_FOR_nothing)
2121         {
2122           product = expand_doubleword_mult (mode, op0, op1, target,
2123                                             true, methods);
2124           if (!product)
2125             delete_insns_since (last);
2126         }
2127
2128       if (product == NULL_RTX
2129           && widening_optab_handler (smul_widen_optab, mode, word_mode)
2130                 != CODE_FOR_nothing)
2131         {
2132           product = expand_doubleword_mult (mode, op0, op1, target,
2133                                             false, methods);
2134           if (!product)
2135             delete_insns_since (last);
2136         }
2137
2138       if (product != NULL_RTX)
2139         {
2140           if (optab_handler (mov_optab, mode) != CODE_FOR_nothing)
2141             {
2142               temp = emit_move_insn (target ? target : product, product);
2143               set_dst_reg_note (temp,
2144                                 REG_EQUAL,
2145                                 gen_rtx_fmt_ee (MULT, mode,
2146                                                 copy_rtx (op0),
2147                                                 copy_rtx (op1)),
2148                                 target ? target : product);
2149             }
2150           return product;
2151         }
2152     }
2153
2154   /* It can't be open-coded in this mode.
2155      Use a library call if one is available and caller says that's ok.  */
2156
2157   libfunc = optab_libfunc (binoptab, mode);
2158   if (libfunc
2159       && (methods == OPTAB_LIB || methods == OPTAB_LIB_WIDEN))
2160     {
2161       rtx_insn *insns;
2162       rtx op1x = op1;
2163       machine_mode op1_mode = mode;
2164       rtx value;
2165
2166       start_sequence ();
2167
2168       if (shift_optab_p (binoptab))
2169         {
2170           op1_mode = targetm.libgcc_shift_count_mode ();
2171           /* Specify unsigned here,
2172              since negative shift counts are meaningless.  */
2173           op1x = convert_to_mode (op1_mode, op1, 1);
2174         }
2175
2176       if (GET_MODE (op0) != VOIDmode
2177           && GET_MODE (op0) != mode)
2178         op0 = convert_to_mode (mode, op0, unsignedp);
2179
2180       /* Pass 1 for NO_QUEUE so we don't lose any increments
2181          if the libcall is cse'd or moved.  */
2182       value = emit_library_call_value (libfunc,
2183                                        NULL_RTX, LCT_CONST, mode, 2,
2184                                        op0, mode, op1x, op1_mode);
2185
2186       insns = get_insns ();
2187       end_sequence ();
2188
2189       target = gen_reg_rtx (mode);
2190       emit_libcall_block_1 (insns, target, value,
2191                             gen_rtx_fmt_ee (optab_to_code (binoptab),
2192                                             mode, op0, op1),
2193                             trapv_binoptab_p (binoptab));
2194
2195       return target;
2196     }
2197
2198   delete_insns_since (last);
2199
2200   /* It can't be done in this mode.  Can we do it in a wider mode?  */
2201
2202   if (! (methods == OPTAB_WIDEN || methods == OPTAB_LIB_WIDEN
2203          || methods == OPTAB_MUST_WIDEN))
2204     {
2205       /* Caller says, don't even try.  */
2206       delete_insns_since (entry_last);
2207       return 0;
2208     }
2209
2210   /* Compute the value of METHODS to pass to recursive calls.
2211      Don't allow widening to be tried recursively.  */
2212
2213   methods = (methods == OPTAB_LIB_WIDEN ? OPTAB_LIB : OPTAB_DIRECT);
2214
2215   /* Look for a wider mode of the same class for which it appears we can do
2216      the operation.  */
2217
2218   if (CLASS_HAS_WIDER_MODES_P (mclass))
2219     {
2220       for (wider_mode = GET_MODE_WIDER_MODE (mode);
2221            wider_mode != VOIDmode;
2222            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2223         {
2224           if (find_widening_optab_handler (binoptab, wider_mode, mode, 1)
2225                   != CODE_FOR_nothing
2226               || (methods == OPTAB_LIB
2227                   && optab_libfunc (binoptab, wider_mode)))
2228             {
2229               rtx xop0 = op0, xop1 = op1;
2230               int no_extend = 0;
2231
2232               /* For certain integer operations, we need not actually extend
2233                  the narrow operands, as long as we will truncate
2234                  the results to the same narrowness.  */
2235
2236               if ((binoptab == ior_optab || binoptab == and_optab
2237                    || binoptab == xor_optab
2238                    || binoptab == add_optab || binoptab == sub_optab
2239                    || binoptab == smul_optab || binoptab == ashl_optab)
2240                   && mclass == MODE_INT)
2241                 no_extend = 1;
2242
2243               xop0 = widen_operand (xop0, wider_mode, mode,
2244                                     unsignedp, no_extend);
2245
2246               /* The second operand of a shift must always be extended.  */
2247               xop1 = widen_operand (xop1, wider_mode, mode, unsignedp,
2248                                     no_extend && binoptab != ashl_optab);
2249
2250               temp = expand_binop (wider_mode, binoptab, xop0, xop1, NULL_RTX,
2251                                    unsignedp, methods);
2252               if (temp)
2253                 {
2254                   if (mclass != MODE_INT
2255                       || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
2256                     {
2257                       if (target == 0)
2258                         target = gen_reg_rtx (mode);
2259                       convert_move (target, temp, 0);
2260                       return target;
2261                     }
2262                   else
2263                     return gen_lowpart (mode, temp);
2264                 }
2265               else
2266                 delete_insns_since (last);
2267             }
2268         }
2269     }
2270
2271   delete_insns_since (entry_last);
2272   return 0;
2273 }
2274 \f
2275 /* Expand a binary operator which has both signed and unsigned forms.
2276    UOPTAB is the optab for unsigned operations, and SOPTAB is for
2277    signed operations.
2278
2279    If we widen unsigned operands, we may use a signed wider operation instead
2280    of an unsigned wider operation, since the result would be the same.  */
2281
2282 rtx
2283 sign_expand_binop (machine_mode mode, optab uoptab, optab soptab,
2284                    rtx op0, rtx op1, rtx target, int unsignedp,
2285                    enum optab_methods methods)
2286 {
2287   rtx temp;
2288   optab direct_optab = unsignedp ? uoptab : soptab;
2289   bool save_enable;
2290
2291   /* Do it without widening, if possible.  */
2292   temp = expand_binop (mode, direct_optab, op0, op1, target,
2293                        unsignedp, OPTAB_DIRECT);
2294   if (temp || methods == OPTAB_DIRECT)
2295     return temp;
2296
2297   /* Try widening to a signed int.  Disable any direct use of any
2298      signed insn in the current mode.  */
2299   save_enable = swap_optab_enable (soptab, mode, false);
2300
2301   temp = expand_binop (mode, soptab, op0, op1, target,
2302                        unsignedp, OPTAB_WIDEN);
2303
2304   /* For unsigned operands, try widening to an unsigned int.  */
2305   if (!temp && unsignedp)
2306     temp = expand_binop (mode, uoptab, op0, op1, target,
2307                          unsignedp, OPTAB_WIDEN);
2308   if (temp || methods == OPTAB_WIDEN)
2309     goto egress;
2310
2311   /* Use the right width libcall if that exists.  */
2312   temp = expand_binop (mode, direct_optab, op0, op1, target,
2313                        unsignedp, OPTAB_LIB);
2314   if (temp || methods == OPTAB_LIB)
2315     goto egress;
2316
2317   /* Must widen and use a libcall, use either signed or unsigned.  */
2318   temp = expand_binop (mode, soptab, op0, op1, target,
2319                        unsignedp, methods);
2320   if (!temp && unsignedp)
2321     temp = expand_binop (mode, uoptab, op0, op1, target,
2322                          unsignedp, methods);
2323
2324  egress:
2325   /* Undo the fiddling above.  */
2326   if (save_enable)
2327     swap_optab_enable (soptab, mode, true);
2328   return temp;
2329 }
2330 \f
2331 /* Generate code to perform an operation specified by UNOPPTAB
2332    on operand OP0, with two results to TARG0 and TARG1.
2333    We assume that the order of the operands for the instruction
2334    is TARG0, TARG1, OP0.
2335
2336    Either TARG0 or TARG1 may be zero, but what that means is that
2337    the result is not actually wanted.  We will generate it into
2338    a dummy pseudo-reg and discard it.  They may not both be zero.
2339
2340    Returns 1 if this operation can be performed; 0 if not.  */
2341
2342 int
2343 expand_twoval_unop (optab unoptab, rtx op0, rtx targ0, rtx targ1,
2344                     int unsignedp)
2345 {
2346   machine_mode mode = GET_MODE (targ0 ? targ0 : targ1);
2347   enum mode_class mclass;
2348   machine_mode wider_mode;
2349   rtx_insn *entry_last = get_last_insn ();
2350   rtx_insn *last;
2351
2352   mclass = GET_MODE_CLASS (mode);
2353
2354   if (!targ0)
2355     targ0 = gen_reg_rtx (mode);
2356   if (!targ1)
2357     targ1 = gen_reg_rtx (mode);
2358
2359   /* Record where to go back to if we fail.  */
2360   last = get_last_insn ();
2361
2362   if (optab_handler (unoptab, mode) != CODE_FOR_nothing)
2363     {
2364       struct expand_operand ops[3];
2365       enum insn_code icode = optab_handler (unoptab, mode);
2366
2367       create_fixed_operand (&ops[0], targ0);
2368       create_fixed_operand (&ops[1], targ1);
2369       create_convert_operand_from (&ops[2], op0, mode, unsignedp);
2370       if (maybe_expand_insn (icode, 3, ops))
2371         return 1;
2372     }
2373
2374   /* It can't be done in this mode.  Can we do it in a wider mode?  */
2375
2376   if (CLASS_HAS_WIDER_MODES_P (mclass))
2377     {
2378       for (wider_mode = GET_MODE_WIDER_MODE (mode);
2379            wider_mode != VOIDmode;
2380            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2381         {
2382           if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
2383             {
2384               rtx t0 = gen_reg_rtx (wider_mode);
2385               rtx t1 = gen_reg_rtx (wider_mode);
2386               rtx cop0 = convert_modes (wider_mode, mode, op0, unsignedp);
2387
2388               if (expand_twoval_unop (unoptab, cop0, t0, t1, unsignedp))
2389                 {
2390                   convert_move (targ0, t0, unsignedp);
2391                   convert_move (targ1, t1, unsignedp);
2392                   return 1;
2393                 }
2394               else
2395                 delete_insns_since (last);
2396             }
2397         }
2398     }
2399
2400   delete_insns_since (entry_last);
2401   return 0;
2402 }
2403 \f
2404 /* Generate code to perform an operation specified by BINOPTAB
2405    on operands OP0 and OP1, with two results to TARG1 and TARG2.
2406    We assume that the order of the operands for the instruction
2407    is TARG0, OP0, OP1, TARG1, which would fit a pattern like
2408    [(set TARG0 (operate OP0 OP1)) (set TARG1 (operate ...))].
2409
2410    Either TARG0 or TARG1 may be zero, but what that means is that
2411    the result is not actually wanted.  We will generate it into
2412    a dummy pseudo-reg and discard it.  They may not both be zero.
2413
2414    Returns 1 if this operation can be performed; 0 if not.  */
2415
2416 int
2417 expand_twoval_binop (optab binoptab, rtx op0, rtx op1, rtx targ0, rtx targ1,
2418                      int unsignedp)
2419 {
2420   machine_mode mode = GET_MODE (targ0 ? targ0 : targ1);
2421   enum mode_class mclass;
2422   machine_mode wider_mode;
2423   rtx_insn *entry_last = get_last_insn ();
2424   rtx_insn *last;
2425
2426   mclass = GET_MODE_CLASS (mode);
2427
2428   if (!targ0)
2429     targ0 = gen_reg_rtx (mode);
2430   if (!targ1)
2431     targ1 = gen_reg_rtx (mode);
2432
2433   /* Record where to go back to if we fail.  */
2434   last = get_last_insn ();
2435
2436   if (optab_handler (binoptab, mode) != CODE_FOR_nothing)
2437     {
2438       struct expand_operand ops[4];
2439       enum insn_code icode = optab_handler (binoptab, mode);
2440       machine_mode mode0 = insn_data[icode].operand[1].mode;
2441       machine_mode mode1 = insn_data[icode].operand[2].mode;
2442       rtx xop0 = op0, xop1 = op1;
2443
2444       /* If we are optimizing, force expensive constants into a register.  */
2445       xop0 = avoid_expensive_constant (mode0, binoptab, 0, xop0, unsignedp);
2446       xop1 = avoid_expensive_constant (mode1, binoptab, 1, xop1, unsignedp);
2447
2448       create_fixed_operand (&ops[0], targ0);
2449       create_convert_operand_from (&ops[1], op0, mode, unsignedp);
2450       create_convert_operand_from (&ops[2], op1, mode, unsignedp);
2451       create_fixed_operand (&ops[3], targ1);
2452       if (maybe_expand_insn (icode, 4, ops))
2453         return 1;
2454       delete_insns_since (last);
2455     }
2456
2457   /* It can't be done in this mode.  Can we do it in a wider mode?  */
2458
2459   if (CLASS_HAS_WIDER_MODES_P (mclass))
2460     {
2461       for (wider_mode = GET_MODE_WIDER_MODE (mode);
2462            wider_mode != VOIDmode;
2463            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2464         {
2465           if (optab_handler (binoptab, wider_mode) != CODE_FOR_nothing)
2466             {
2467               rtx t0 = gen_reg_rtx (wider_mode);
2468               rtx t1 = gen_reg_rtx (wider_mode);
2469               rtx cop0 = convert_modes (wider_mode, mode, op0, unsignedp);
2470               rtx cop1 = convert_modes (wider_mode, mode, op1, unsignedp);
2471
2472               if (expand_twoval_binop (binoptab, cop0, cop1,
2473                                        t0, t1, unsignedp))
2474                 {
2475                   convert_move (targ0, t0, unsignedp);
2476                   convert_move (targ1, t1, unsignedp);
2477                   return 1;
2478                 }
2479               else
2480                 delete_insns_since (last);
2481             }
2482         }
2483     }
2484
2485   delete_insns_since (entry_last);
2486   return 0;
2487 }
2488
2489 /* Expand the two-valued library call indicated by BINOPTAB, but
2490    preserve only one of the values.  If TARG0 is non-NULL, the first
2491    value is placed into TARG0; otherwise the second value is placed
2492    into TARG1.  Exactly one of TARG0 and TARG1 must be non-NULL.  The
2493    value stored into TARG0 or TARG1 is equivalent to (CODE OP0 OP1).
2494    This routine assumes that the value returned by the library call is
2495    as if the return value was of an integral mode twice as wide as the
2496    mode of OP0.  Returns 1 if the call was successful.  */
2497
2498 bool
2499 expand_twoval_binop_libfunc (optab binoptab, rtx op0, rtx op1,
2500                              rtx targ0, rtx targ1, enum rtx_code code)
2501 {
2502   machine_mode mode;
2503   machine_mode libval_mode;
2504   rtx libval;
2505   rtx_insn *insns;
2506   rtx libfunc;
2507
2508   /* Exactly one of TARG0 or TARG1 should be non-NULL.  */
2509   gcc_assert (!targ0 != !targ1);
2510
2511   mode = GET_MODE (op0);
2512   libfunc = optab_libfunc (binoptab, mode);
2513   if (!libfunc)
2514     return false;
2515
2516   /* The value returned by the library function will have twice as
2517      many bits as the nominal MODE.  */
2518   libval_mode = smallest_mode_for_size (2 * GET_MODE_BITSIZE (mode),
2519                                         MODE_INT);
2520   start_sequence ();
2521   libval = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
2522                                     libval_mode, 2,
2523                                     op0, mode,
2524                                     op1, mode);
2525   /* Get the part of VAL containing the value that we want.  */
2526   libval = simplify_gen_subreg (mode, libval, libval_mode,
2527                                 targ0 ? 0 : GET_MODE_SIZE (mode));
2528   insns = get_insns ();
2529   end_sequence ();
2530   /* Move the into the desired location.  */
2531   emit_libcall_block (insns, targ0 ? targ0 : targ1, libval,
2532                       gen_rtx_fmt_ee (code, mode, op0, op1));
2533
2534   return true;
2535 }
2536
2537 \f
2538 /* Wrapper around expand_unop which takes an rtx code to specify
2539    the operation to perform, not an optab pointer.  All other
2540    arguments are the same.  */
2541 rtx
2542 expand_simple_unop (machine_mode mode, enum rtx_code code, rtx op0,
2543                     rtx target, int unsignedp)
2544 {
2545   optab unop = code_to_optab (code);
2546   gcc_assert (unop);
2547
2548   return expand_unop (mode, unop, op0, target, unsignedp);
2549 }
2550
2551 /* Try calculating
2552         (clz:narrow x)
2553    as
2554         (clz:wide (zero_extend:wide x)) - ((width wide) - (width narrow)).
2555
2556    A similar operation can be used for clrsb.  UNOPTAB says which operation
2557    we are trying to expand.  */
2558 static rtx
2559 widen_leading (machine_mode mode, rtx op0, rtx target, optab unoptab)
2560 {
2561   enum mode_class mclass = GET_MODE_CLASS (mode);
2562   if (CLASS_HAS_WIDER_MODES_P (mclass))
2563     {
2564       machine_mode wider_mode;
2565       for (wider_mode = GET_MODE_WIDER_MODE (mode);
2566            wider_mode != VOIDmode;
2567            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2568         {
2569           if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
2570             {
2571               rtx xop0, temp;
2572               rtx_insn *last;
2573
2574               last = get_last_insn ();
2575
2576               if (target == 0)
2577                 target = gen_reg_rtx (mode);
2578               xop0 = widen_operand (op0, wider_mode, mode,
2579                                     unoptab != clrsb_optab, false);
2580               temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
2581                                   unoptab != clrsb_optab);
2582               if (temp != 0)
2583                 temp = expand_binop
2584                   (wider_mode, sub_optab, temp,
2585                    gen_int_mode (GET_MODE_PRECISION (wider_mode)
2586                                  - GET_MODE_PRECISION (mode),
2587                                  wider_mode),
2588                    target, true, OPTAB_DIRECT);
2589               if (temp == 0)
2590                 delete_insns_since (last);
2591
2592               return temp;
2593             }
2594         }
2595     }
2596   return 0;
2597 }
2598
2599 /* Try calculating clz of a double-word quantity as two clz's of word-sized
2600    quantities, choosing which based on whether the high word is nonzero.  */
2601 static rtx
2602 expand_doubleword_clz (machine_mode mode, rtx op0, rtx target)
2603 {
2604   rtx xop0 = force_reg (mode, op0);
2605   rtx subhi = gen_highpart (word_mode, xop0);
2606   rtx sublo = gen_lowpart (word_mode, xop0);
2607   rtx_code_label *hi0_label = gen_label_rtx ();
2608   rtx_code_label *after_label = gen_label_rtx ();
2609   rtx_insn *seq;
2610   rtx temp, result;
2611
2612   /* If we were not given a target, use a word_mode register, not a
2613      'mode' register.  The result will fit, and nobody is expecting
2614      anything bigger (the return type of __builtin_clz* is int).  */
2615   if (!target)
2616     target = gen_reg_rtx (word_mode);
2617
2618   /* In any case, write to a word_mode scratch in both branches of the
2619      conditional, so we can ensure there is a single move insn setting
2620      'target' to tag a REG_EQUAL note on.  */
2621   result = gen_reg_rtx (word_mode);
2622
2623   start_sequence ();
2624
2625   /* If the high word is not equal to zero,
2626      then clz of the full value is clz of the high word.  */
2627   emit_cmp_and_jump_insns (subhi, CONST0_RTX (word_mode), EQ, 0,
2628                            word_mode, true, hi0_label);
2629
2630   temp = expand_unop_direct (word_mode, clz_optab, subhi, result, true);
2631   if (!temp)
2632     goto fail;
2633
2634   if (temp != result)
2635     convert_move (result, temp, true);
2636
2637   emit_jump_insn (gen_jump (after_label));
2638   emit_barrier ();
2639
2640   /* Else clz of the full value is clz of the low word plus the number
2641      of bits in the high word.  */
2642   emit_label (hi0_label);
2643
2644   temp = expand_unop_direct (word_mode, clz_optab, sublo, 0, true);
2645   if (!temp)
2646     goto fail;
2647   temp = expand_binop (word_mode, add_optab, temp,
2648                        gen_int_mode (GET_MODE_BITSIZE (word_mode), word_mode),
2649                        result, true, OPTAB_DIRECT);
2650   if (!temp)
2651     goto fail;
2652   if (temp != result)
2653     convert_move (result, temp, true);
2654
2655   emit_label (after_label);
2656   convert_move (target, result, true);
2657
2658   seq = get_insns ();
2659   end_sequence ();
2660
2661   add_equal_note (seq, target, CLZ, xop0, 0);
2662   emit_insn (seq);
2663   return target;
2664
2665  fail:
2666   end_sequence ();
2667   return 0;
2668 }
2669
2670 /* Try calculating
2671         (bswap:narrow x)
2672    as
2673         (lshiftrt:wide (bswap:wide x) ((width wide) - (width narrow))).  */
2674 static rtx
2675 widen_bswap (machine_mode mode, rtx op0, rtx target)
2676 {
2677   enum mode_class mclass = GET_MODE_CLASS (mode);
2678   machine_mode wider_mode;
2679   rtx x;
2680   rtx_insn *last;
2681
2682   if (!CLASS_HAS_WIDER_MODES_P (mclass))
2683     return NULL_RTX;
2684
2685   for (wider_mode = GET_MODE_WIDER_MODE (mode);
2686        wider_mode != VOIDmode;
2687        wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2688     if (optab_handler (bswap_optab, wider_mode) != CODE_FOR_nothing)
2689       goto found;
2690   return NULL_RTX;
2691
2692  found:
2693   last = get_last_insn ();
2694
2695   x = widen_operand (op0, wider_mode, mode, true, true);
2696   x = expand_unop (wider_mode, bswap_optab, x, NULL_RTX, true);
2697
2698   gcc_assert (GET_MODE_PRECISION (wider_mode) == GET_MODE_BITSIZE (wider_mode)
2699               && GET_MODE_PRECISION (mode) == GET_MODE_BITSIZE (mode));
2700   if (x != 0)
2701     x = expand_shift (RSHIFT_EXPR, wider_mode, x,
2702                       GET_MODE_BITSIZE (wider_mode)
2703                       - GET_MODE_BITSIZE (mode),
2704                       NULL_RTX, true);
2705
2706   if (x != 0)
2707     {
2708       if (target == 0)
2709         target = gen_reg_rtx (mode);
2710       emit_move_insn (target, gen_lowpart (mode, x));
2711     }
2712   else
2713     delete_insns_since (last);
2714
2715   return target;
2716 }
2717
2718 /* Try calculating bswap as two bswaps of two word-sized operands.  */
2719
2720 static rtx
2721 expand_doubleword_bswap (machine_mode mode, rtx op, rtx target)
2722 {
2723   rtx t0, t1;
2724
2725   t1 = expand_unop (word_mode, bswap_optab,
2726                     operand_subword_force (op, 0, mode), NULL_RTX, true);
2727   t0 = expand_unop (word_mode, bswap_optab,
2728                     operand_subword_force (op, 1, mode), NULL_RTX, true);
2729
2730   if (target == 0 || !valid_multiword_target_p (target))
2731     target = gen_reg_rtx (mode);
2732   if (REG_P (target))
2733     emit_clobber (target);
2734   emit_move_insn (operand_subword (target, 0, 1, mode), t0);
2735   emit_move_insn (operand_subword (target, 1, 1, mode), t1);
2736
2737   return target;
2738 }
2739
2740 /* Try calculating (parity x) as (and (popcount x) 1), where
2741    popcount can also be done in a wider mode.  */
2742 static rtx
2743 expand_parity (machine_mode mode, rtx op0, rtx target)
2744 {
2745   enum mode_class mclass = GET_MODE_CLASS (mode);
2746   if (CLASS_HAS_WIDER_MODES_P (mclass))
2747     {
2748       machine_mode wider_mode;
2749       for (wider_mode = mode; wider_mode != VOIDmode;
2750            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2751         {
2752           if (optab_handler (popcount_optab, wider_mode) != CODE_FOR_nothing)
2753             {
2754               rtx xop0, temp;
2755               rtx_insn *last;
2756
2757               last = get_last_insn ();
2758
2759               if (target == 0)
2760                 target = gen_reg_rtx (mode);
2761               xop0 = widen_operand (op0, wider_mode, mode, true, false);
2762               temp = expand_unop (wider_mode, popcount_optab, xop0, NULL_RTX,
2763                                   true);
2764               if (temp != 0)
2765                 temp = expand_binop (wider_mode, and_optab, temp, const1_rtx,
2766                                      target, true, OPTAB_DIRECT);
2767               if (temp == 0)
2768                 delete_insns_since (last);
2769
2770               return temp;
2771             }
2772         }
2773     }
2774   return 0;
2775 }
2776
2777 /* Try calculating ctz(x) as K - clz(x & -x) ,
2778    where K is GET_MODE_PRECISION(mode) - 1.
2779
2780    Both __builtin_ctz and __builtin_clz are undefined at zero, so we
2781    don't have to worry about what the hardware does in that case.  (If
2782    the clz instruction produces the usual value at 0, which is K, the
2783    result of this code sequence will be -1; expand_ffs, below, relies
2784    on this.  It might be nice to have it be K instead, for consistency
2785    with the (very few) processors that provide a ctz with a defined
2786    value, but that would take one more instruction, and it would be
2787    less convenient for expand_ffs anyway.  */
2788
2789 static rtx
2790 expand_ctz (machine_mode mode, rtx op0, rtx target)
2791 {
2792   rtx_insn *seq;
2793   rtx temp;
2794
2795   if (optab_handler (clz_optab, mode) == CODE_FOR_nothing)
2796     return 0;
2797
2798   start_sequence ();
2799
2800   temp = expand_unop_direct (mode, neg_optab, op0, NULL_RTX, true);
2801   if (temp)
2802     temp = expand_binop (mode, and_optab, op0, temp, NULL_RTX,
2803                          true, OPTAB_DIRECT);
2804   if (temp)
2805     temp = expand_unop_direct (mode, clz_optab, temp, NULL_RTX, true);
2806   if (temp)
2807     temp = expand_binop (mode, sub_optab,
2808                          gen_int_mode (GET_MODE_PRECISION (mode) - 1, mode),
2809                          temp, target,
2810                          true, OPTAB_DIRECT);
2811   if (temp == 0)
2812     {
2813       end_sequence ();
2814       return 0;
2815     }
2816
2817   seq = get_insns ();
2818   end_sequence ();
2819
2820   add_equal_note (seq, temp, CTZ, op0, 0);
2821   emit_insn (seq);
2822   return temp;
2823 }
2824
2825
2826 /* Try calculating ffs(x) using ctz(x) if we have that instruction, or
2827    else with the sequence used by expand_clz.
2828
2829    The ffs builtin promises to return zero for a zero value and ctz/clz
2830    may have an undefined value in that case.  If they do not give us a
2831    convenient value, we have to generate a test and branch.  */
2832 static rtx
2833 expand_ffs (machine_mode mode, rtx op0, rtx target)
2834 {
2835   HOST_WIDE_INT val = 0;
2836   bool defined_at_zero = false;
2837   rtx temp;
2838   rtx_insn *seq;
2839
2840   if (optab_handler (ctz_optab, mode) != CODE_FOR_nothing)
2841     {
2842       start_sequence ();
2843
2844       temp = expand_unop_direct (mode, ctz_optab, op0, 0, true);
2845       if (!temp)
2846         goto fail;
2847
2848       defined_at_zero = (CTZ_DEFINED_VALUE_AT_ZERO (mode, val) == 2);
2849     }
2850   else if (optab_handler (clz_optab, mode) != CODE_FOR_nothing)
2851     {
2852       start_sequence ();
2853       temp = expand_ctz (mode, op0, 0);
2854       if (!temp)
2855         goto fail;
2856
2857       if (CLZ_DEFINED_VALUE_AT_ZERO (mode, val) == 2)
2858         {
2859           defined_at_zero = true;
2860           val = (GET_MODE_PRECISION (mode) - 1) - val;
2861         }
2862     }
2863   else
2864     return 0;
2865
2866   if (defined_at_zero && val == -1)
2867     /* No correction needed at zero.  */;
2868   else
2869     {
2870       /* We don't try to do anything clever with the situation found
2871          on some processors (eg Alpha) where ctz(0:mode) ==
2872          bitsize(mode).  If someone can think of a way to send N to -1
2873          and leave alone all values in the range 0..N-1 (where N is a
2874          power of two), cheaper than this test-and-branch, please add it.
2875
2876          The test-and-branch is done after the operation itself, in case
2877          the operation sets condition codes that can be recycled for this.
2878          (This is true on i386, for instance.)  */
2879
2880       rtx_code_label *nonzero_label = gen_label_rtx ();
2881       emit_cmp_and_jump_insns (op0, CONST0_RTX (mode), NE, 0,
2882                                mode, true, nonzero_label);
2883
2884       convert_move (temp, GEN_INT (-1), false);
2885       emit_label (nonzero_label);
2886     }
2887
2888   /* temp now has a value in the range -1..bitsize-1.  ffs is supposed
2889      to produce a value in the range 0..bitsize.  */
2890   temp = expand_binop (mode, add_optab, temp, gen_int_mode (1, mode),
2891                        target, false, OPTAB_DIRECT);
2892   if (!temp)
2893     goto fail;
2894
2895   seq = get_insns ();
2896   end_sequence ();
2897
2898   add_equal_note (seq, temp, FFS, op0, 0);
2899   emit_insn (seq);
2900   return temp;
2901
2902  fail:
2903   end_sequence ();
2904   return 0;
2905 }
2906
2907 /* Extract the OMODE lowpart from VAL, which has IMODE.  Under certain
2908    conditions, VAL may already be a SUBREG against which we cannot generate
2909    a further SUBREG.  In this case, we expect forcing the value into a
2910    register will work around the situation.  */
2911
2912 static rtx
2913 lowpart_subreg_maybe_copy (machine_mode omode, rtx val,
2914                            machine_mode imode)
2915 {
2916   rtx ret;
2917   ret = lowpart_subreg (omode, val, imode);
2918   if (ret == NULL)
2919     {
2920       val = force_reg (imode, val);
2921       ret = lowpart_subreg (omode, val, imode);
2922       gcc_assert (ret != NULL);
2923     }
2924   return ret;
2925 }
2926
2927 /* Expand a floating point absolute value or negation operation via a
2928    logical operation on the sign bit.  */
2929
2930 static rtx
2931 expand_absneg_bit (enum rtx_code code, machine_mode mode,
2932                    rtx op0, rtx target)
2933 {
2934   const struct real_format *fmt;
2935   int bitpos, word, nwords, i;
2936   machine_mode imode;
2937   rtx temp;
2938   rtx_insn *insns;
2939
2940   /* The format has to have a simple sign bit.  */
2941   fmt = REAL_MODE_FORMAT (mode);
2942   if (fmt == NULL)
2943     return NULL_RTX;
2944
2945   bitpos = fmt->signbit_rw;
2946   if (bitpos < 0)
2947     return NULL_RTX;
2948
2949   /* Don't create negative zeros if the format doesn't support them.  */
2950   if (code == NEG && !fmt->has_signed_zero)
2951     return NULL_RTX;
2952
2953   if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
2954     {
2955       imode = int_mode_for_mode (mode);
2956       if (imode == BLKmode)
2957         return NULL_RTX;
2958       word = 0;
2959       nwords = 1;
2960     }
2961   else
2962     {
2963       imode = word_mode;
2964
2965       if (FLOAT_WORDS_BIG_ENDIAN)
2966         word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
2967       else
2968         word = bitpos / BITS_PER_WORD;
2969       bitpos = bitpos % BITS_PER_WORD;
2970       nwords = (GET_MODE_BITSIZE (mode) + BITS_PER_WORD - 1) / BITS_PER_WORD;
2971     }
2972
2973   wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
2974   if (code == ABS)
2975     mask = ~mask;
2976
2977   if (target == 0
2978       || target == op0
2979       || (nwords > 1 && !valid_multiword_target_p (target)))
2980     target = gen_reg_rtx (mode);
2981
2982   if (nwords > 1)
2983     {
2984       start_sequence ();
2985
2986       for (i = 0; i < nwords; ++i)
2987         {
2988           rtx targ_piece = operand_subword (target, i, 1, mode);
2989           rtx op0_piece = operand_subword_force (op0, i, mode);
2990
2991           if (i == word)
2992             {
2993               temp = expand_binop (imode, code == ABS ? and_optab : xor_optab,
2994                                    op0_piece,
2995                                    immed_wide_int_const (mask, imode),
2996                                    targ_piece, 1, OPTAB_LIB_WIDEN);
2997               if (temp != targ_piece)
2998                 emit_move_insn (targ_piece, temp);
2999             }
3000           else
3001             emit_move_insn (targ_piece, op0_piece);
3002         }
3003
3004       insns = get_insns ();
3005       end_sequence ();
3006
3007       emit_insn (insns);
3008     }
3009   else
3010     {
3011       temp = expand_binop (imode, code == ABS ? and_optab : xor_optab,
3012                            gen_lowpart (imode, op0),
3013                            immed_wide_int_const (mask, imode),
3014                            gen_lowpart (imode, target), 1, OPTAB_LIB_WIDEN);
3015       target = lowpart_subreg_maybe_copy (mode, temp, imode);
3016
3017       set_dst_reg_note (get_last_insn (), REG_EQUAL,
3018                         gen_rtx_fmt_e (code, mode, copy_rtx (op0)),
3019                         target);
3020     }
3021
3022   return target;
3023 }
3024
3025 /* As expand_unop, but will fail rather than attempt the operation in a
3026    different mode or with a libcall.  */
3027 static rtx
3028 expand_unop_direct (machine_mode mode, optab unoptab, rtx op0, rtx target,
3029              int unsignedp)
3030 {
3031   if (optab_handler (unoptab, mode) != CODE_FOR_nothing)
3032     {
3033       struct expand_operand ops[2];
3034       enum insn_code icode = optab_handler (unoptab, mode);
3035       rtx_insn *last = get_last_insn ();
3036       rtx pat;
3037
3038       create_output_operand (&ops[0], target, mode);
3039       create_convert_operand_from (&ops[1], op0, mode, unsignedp);
3040       pat = maybe_gen_insn (icode, 2, ops);
3041       if (pat)
3042         {
3043           if (INSN_P (pat) && NEXT_INSN (as_a <rtx_insn *> (pat)) != NULL_RTX
3044               && ! add_equal_note (as_a <rtx_insn *> (pat), ops[0].value,
3045                                    optab_to_code (unoptab),
3046                                    ops[1].value, NULL_RTX))
3047             {
3048               delete_insns_since (last);
3049               return expand_unop (mode, unoptab, op0, NULL_RTX, unsignedp);
3050             }
3051
3052           emit_insn (pat);
3053
3054           return ops[0].value;
3055         }
3056     }
3057   return 0;
3058 }
3059
3060 /* Generate code to perform an operation specified by UNOPTAB
3061    on operand OP0, with result having machine-mode MODE.
3062
3063    UNSIGNEDP is for the case where we have to widen the operands
3064    to perform the operation.  It says to use zero-extension.
3065
3066    If TARGET is nonzero, the value
3067    is generated there, if it is convenient to do so.
3068    In all cases an rtx is returned for the locus of the value;
3069    this may or may not be TARGET.  */
3070
3071 rtx
3072 expand_unop (machine_mode mode, optab unoptab, rtx op0, rtx target,
3073              int unsignedp)
3074 {
3075   enum mode_class mclass = GET_MODE_CLASS (mode);
3076   machine_mode wider_mode;
3077   rtx temp;
3078   rtx libfunc;
3079
3080   temp = expand_unop_direct (mode, unoptab, op0, target, unsignedp);
3081   if (temp)
3082     return temp;
3083
3084   /* It can't be done in this mode.  Can we open-code it in a wider mode?  */
3085
3086   /* Widening (or narrowing) clz needs special treatment.  */
3087   if (unoptab == clz_optab)
3088     {
3089       temp = widen_leading (mode, op0, target, unoptab);
3090       if (temp)
3091         return temp;
3092
3093       if (GET_MODE_SIZE (mode) == 2 * UNITS_PER_WORD
3094           && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
3095         {
3096           temp = expand_doubleword_clz (mode, op0, target);
3097           if (temp)
3098             return temp;
3099         }
3100
3101       goto try_libcall;
3102     }
3103
3104   if (unoptab == clrsb_optab)
3105     {
3106       temp = widen_leading (mode, op0, target, unoptab);
3107       if (temp)
3108         return temp;
3109       goto try_libcall;
3110     }
3111
3112   /* Widening (or narrowing) bswap needs special treatment.  */
3113   if (unoptab == bswap_optab)
3114     {
3115       /* HImode is special because in this mode BSWAP is equivalent to ROTATE
3116          or ROTATERT.  First try these directly; if this fails, then try the
3117          obvious pair of shifts with allowed widening, as this will probably
3118          be always more efficient than the other fallback methods.  */
3119       if (mode == HImode)
3120         {
3121           rtx_insn *last;
3122           rtx temp1, temp2;
3123
3124           if (optab_handler (rotl_optab, mode) != CODE_FOR_nothing)
3125             {
3126               temp = expand_binop (mode, rotl_optab, op0, GEN_INT (8), target,
3127                                    unsignedp, OPTAB_DIRECT);
3128               if (temp)
3129                 return temp;
3130              }
3131
3132           if (optab_handler (rotr_optab, mode) != CODE_FOR_nothing)
3133             {
3134               temp = expand_binop (mode, rotr_optab, op0, GEN_INT (8), target,
3135                                    unsignedp, OPTAB_DIRECT);
3136               if (temp)
3137                 return temp;
3138             }
3139
3140           last = get_last_insn ();
3141
3142           temp1 = expand_binop (mode, ashl_optab, op0, GEN_INT (8), NULL_RTX,
3143                                 unsignedp, OPTAB_WIDEN);
3144           temp2 = expand_binop (mode, lshr_optab, op0, GEN_INT (8), NULL_RTX,
3145                                 unsignedp, OPTAB_WIDEN);
3146           if (temp1 && temp2)
3147             {
3148               temp = expand_binop (mode, ior_optab, temp1, temp2, target,
3149                                    unsignedp, OPTAB_WIDEN);
3150               if (temp)
3151                 return temp;
3152             }
3153
3154           delete_insns_since (last);
3155         }
3156
3157       temp = widen_bswap (mode, op0, target);
3158       if (temp)
3159         return temp;
3160
3161       if (GET_MODE_SIZE (mode) == 2 * UNITS_PER_WORD
3162           && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
3163         {
3164           temp = expand_doubleword_bswap (mode, op0, target);
3165           if (temp)
3166             return temp;
3167         }
3168
3169       goto try_libcall;
3170     }
3171
3172   if (CLASS_HAS_WIDER_MODES_P (mclass))
3173     for (wider_mode = GET_MODE_WIDER_MODE (mode);
3174          wider_mode != VOIDmode;
3175          wider_mode = GET_MODE_WIDER_MODE (wider_mode))
3176       {
3177         if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
3178           {
3179             rtx xop0 = op0;
3180             rtx_insn *last = get_last_insn ();
3181
3182             /* For certain operations, we need not actually extend
3183                the narrow operand, as long as we will truncate the
3184                results to the same narrowness.  */
3185
3186             xop0 = widen_operand (xop0, wider_mode, mode, unsignedp,
3187                                   (unoptab == neg_optab
3188                                    || unoptab == one_cmpl_optab)
3189                                   && mclass == MODE_INT);
3190
3191             temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
3192                                 unsignedp);
3193
3194             if (temp)
3195               {
3196                 if (mclass != MODE_INT
3197                     || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
3198                   {
3199                     if (target == 0)
3200                       target = gen_reg_rtx (mode);
3201                     convert_move (target, temp, 0);
3202                     return target;
3203                   }
3204                 else
3205                   return gen_lowpart (mode, temp);
3206               }
3207             else
3208               delete_insns_since (last);
3209           }
3210       }
3211
3212   /* These can be done a word at a time.  */
3213   if (unoptab == one_cmpl_optab
3214       && mclass == MODE_INT
3215       && GET_MODE_SIZE (mode) > UNITS_PER_WORD
3216       && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
3217     {
3218       int i;
3219       rtx_insn *insns;
3220
3221       if (target == 0 || target == op0 || !valid_multiword_target_p (target))
3222         target = gen_reg_rtx (mode);
3223
3224       start_sequence ();
3225
3226       /* Do the actual arithmetic.  */
3227       for (i = 0; i < GET_MODE_BITSIZE (mode) / BITS_PER_WORD; i++)
3228         {
3229           rtx target_piece = operand_subword (target, i, 1, mode);
3230           rtx x = expand_unop (word_mode, unoptab,
3231                                operand_subword_force (op0, i, mode),
3232                                target_piece, unsignedp);
3233
3234           if (target_piece != x)
3235             emit_move_insn (target_piece, x);
3236         }
3237
3238       insns = get_insns ();
3239       end_sequence ();
3240
3241       emit_insn (insns);
3242       return target;
3243     }
3244
3245   if (optab_to_code (unoptab) == NEG)
3246     {
3247       /* Try negating floating point values by flipping the sign bit.  */
3248       if (SCALAR_FLOAT_MODE_P (mode))
3249         {
3250           temp = expand_absneg_bit (NEG, mode, op0, target);
3251           if (temp)
3252             return temp;
3253         }
3254
3255       /* If there is no negation pattern, and we have no negative zero,
3256          try subtracting from zero.  */
3257       if (!HONOR_SIGNED_ZEROS (mode))
3258         {
3259           temp = expand_binop (mode, (unoptab == negv_optab
3260                                       ? subv_optab : sub_optab),
3261                                CONST0_RTX (mode), op0, target,
3262                                unsignedp, OPTAB_DIRECT);
3263           if (temp)
3264             return temp;
3265         }
3266     }
3267
3268   /* Try calculating parity (x) as popcount (x) % 2.  */
3269   if (unoptab == parity_optab)
3270     {
3271       temp = expand_parity (mode, op0, target);
3272       if (temp)
3273         return temp;
3274     }
3275
3276   /* Try implementing ffs (x) in terms of clz (x).  */
3277   if (unoptab == ffs_optab)
3278     {
3279       temp = expand_ffs (mode, op0, target);
3280       if (temp)
3281         return temp;
3282     }
3283
3284   /* Try implementing ctz (x) in terms of clz (x).  */
3285   if (unoptab == ctz_optab)
3286     {
3287       temp = expand_ctz (mode, op0, target);
3288       if (temp)
3289         return temp;
3290     }
3291
3292  try_libcall:
3293   /* Now try a library call in this mode.  */
3294   libfunc = optab_libfunc (unoptab, mode);
3295   if (libfunc)
3296     {
3297       rtx_insn *insns;
3298       rtx value;
3299       rtx eq_value;
3300       machine_mode outmode = mode;
3301
3302       /* All of these functions return small values.  Thus we choose to
3303          have them return something that isn't a double-word.  */
3304       if (unoptab == ffs_optab || unoptab == clz_optab || unoptab == ctz_optab
3305           || unoptab == clrsb_optab || unoptab == popcount_optab
3306           || unoptab == parity_optab)
3307         outmode
3308           = GET_MODE (hard_libcall_value (TYPE_MODE (integer_type_node),
3309                                           optab_libfunc (unoptab, mode)));
3310
3311       start_sequence ();
3312
3313       /* Pass 1 for NO_QUEUE so we don't lose any increments
3314          if the libcall is cse'd or moved.  */
3315       value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST, outmode,
3316                                        1, op0, mode);
3317       insns = get_insns ();
3318       end_sequence ();
3319
3320       target = gen_reg_rtx (outmode);
3321       eq_value = gen_rtx_fmt_e (optab_to_code (unoptab), mode, op0);
3322       if (GET_MODE_SIZE (outmode) < GET_MODE_SIZE (mode))
3323         eq_value = simplify_gen_unary (TRUNCATE, outmode, eq_value, mode);
3324       else if (GET_MODE_SIZE (outmode) > GET_MODE_SIZE (mode))
3325         eq_value = simplify_gen_unary (ZERO_EXTEND, outmode, eq_value, mode);
3326       emit_libcall_block_1 (insns, target, value, eq_value,
3327                             trapv_unoptab_p (unoptab));
3328
3329       return target;
3330     }
3331
3332   /* It can't be done in this mode.  Can we do it in a wider mode?  */
3333
3334   if (CLASS_HAS_WIDER_MODES_P (mclass))
3335     {
3336       for (wider_mode = GET_MODE_WIDER_MODE (mode);
3337            wider_mode != VOIDmode;
3338            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
3339         {
3340           if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing
3341               || optab_libfunc (unoptab, wider_mode))
3342             {
3343               rtx xop0 = op0;
3344               rtx_insn *last = get_last_insn ();
3345
3346               /* For certain operations, we need not actually extend
3347                  the narrow operand, as long as we will truncate the
3348                  results to the same narrowness.  */
3349               xop0 = widen_operand (xop0, wider_mode, mode, unsignedp,
3350                                     (unoptab == neg_optab
3351                                      || unoptab == one_cmpl_optab
3352                                      || unoptab == bswap_optab)
3353                                     && mclass == MODE_INT);
3354
3355               temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
3356                                   unsignedp);
3357
3358               /* If we are generating clz using wider mode, adjust the
3359                  result.  Similarly for clrsb.  */
3360               if ((unoptab == clz_optab || unoptab == clrsb_optab)
3361                   && temp != 0)
3362                 temp = expand_binop
3363                   (wider_mode, sub_optab, temp,
3364                    gen_int_mode (GET_MODE_PRECISION (wider_mode)
3365                                  - GET_MODE_PRECISION (mode),
3366                                  wider_mode),
3367                    target, true, OPTAB_DIRECT);
3368
3369               /* Likewise for bswap.  */
3370               if (unoptab == bswap_optab && temp != 0)
3371                 {
3372                   gcc_assert (GET_MODE_PRECISION (wider_mode)
3373                               == GET_MODE_BITSIZE (wider_mode)
3374                               && GET_MODE_PRECISION (mode)
3375                                  == GET_MODE_BITSIZE (mode));
3376
3377                   temp = expand_shift (RSHIFT_EXPR, wider_mode, temp,
3378                                        GET_MODE_BITSIZE (wider_mode)
3379                                        - GET_MODE_BITSIZE (mode),
3380                                        NULL_RTX, true);
3381                 }
3382
3383               if (temp)
3384                 {
3385                   if (mclass != MODE_INT)
3386                     {
3387                       if (target == 0)
3388                         target = gen_reg_rtx (mode);
3389                       convert_move (target, temp, 0);
3390                       return target;
3391                     }
3392                   else
3393                     return gen_lowpart (mode, temp);
3394                 }
3395               else
3396                 delete_insns_since (last);
3397             }
3398         }
3399     }
3400
3401   /* One final attempt at implementing negation via subtraction,
3402      this time allowing widening of the operand.  */
3403   if (optab_to_code (unoptab) == NEG && !HONOR_SIGNED_ZEROS (mode))
3404     {
3405       rtx temp;
3406       temp = expand_binop (mode,
3407                            unoptab == negv_optab ? subv_optab : sub_optab,
3408                            CONST0_RTX (mode), op0,
3409                            target, unsignedp, OPTAB_LIB_WIDEN);
3410       if (temp)
3411         return temp;
3412     }
3413
3414   return 0;
3415 }
3416 \f
3417 /* Emit code to compute the absolute value of OP0, with result to
3418    TARGET if convenient.  (TARGET may be 0.)  The return value says
3419    where the result actually is to be found.
3420
3421    MODE is the mode of the operand; the mode of the result is
3422    different but can be deduced from MODE.
3423
3424  */
3425
3426 rtx
3427 expand_abs_nojump (machine_mode mode, rtx op0, rtx target,
3428                    int result_unsignedp)
3429 {
3430   rtx temp;
3431
3432   if (GET_MODE_CLASS (mode) != MODE_INT
3433       || ! flag_trapv)
3434     result_unsignedp = 1;
3435
3436   /* First try to do it with a special abs instruction.  */
3437   temp = expand_unop (mode, result_unsignedp ? abs_optab : absv_optab,
3438                       op0, target, 0);
3439   if (temp != 0)
3440     return temp;
3441
3442   /* For floating point modes, try clearing the sign bit.  */
3443   if (SCALAR_FLOAT_MODE_P (mode))
3444     {
3445       temp = expand_absneg_bit (ABS, mode, op0, target);
3446       if (temp)
3447         return temp;
3448     }
3449
3450   /* If we have a MAX insn, we can do this as MAX (x, -x).  */
3451   if (optab_handler (smax_optab, mode) != CODE_FOR_nothing
3452       && !HONOR_SIGNED_ZEROS (mode))
3453     {
3454       rtx_insn *last = get_last_insn ();
3455
3456       temp = expand_unop (mode, result_unsignedp ? neg_optab : negv_optab,
3457                           op0, NULL_RTX, 0);
3458       if (temp != 0)
3459         temp = expand_binop (mode, smax_optab, op0, temp, target, 0,
3460                              OPTAB_WIDEN);
3461
3462       if (temp != 0)
3463         return temp;
3464
3465       delete_insns_since (last);
3466     }
3467
3468   /* If this machine has expensive jumps, we can do integer absolute
3469      value of X as (((signed) x >> (W-1)) ^ x) - ((signed) x >> (W-1)),
3470      where W is the width of MODE.  */
3471
3472   if (GET_MODE_CLASS (mode) == MODE_INT
3473       && BRANCH_COST (optimize_insn_for_speed_p (),
3474                       false) >= 2)
3475     {
3476       rtx extended = expand_shift (RSHIFT_EXPR, mode, op0,
3477                                    GET_MODE_PRECISION (mode) - 1,
3478                                    NULL_RTX, 0);
3479
3480       temp = expand_binop (mode, xor_optab, extended, op0, target, 0,
3481                            OPTAB_LIB_WIDEN);
3482       if (temp != 0)
3483         temp = expand_binop (mode, result_unsignedp ? sub_optab : subv_optab,
3484                              temp, extended, target, 0, OPTAB_LIB_WIDEN);
3485
3486       if (temp != 0)
3487         return temp;
3488     }
3489
3490   return NULL_RTX;
3491 }
3492
3493 rtx
3494 expand_abs (machine_mode mode, rtx op0, rtx target,
3495             int result_unsignedp, int safe)
3496 {
3497   rtx temp;
3498   rtx_code_label *op1;
3499
3500   if (GET_MODE_CLASS (mode) != MODE_INT
3501       || ! flag_trapv)
3502     result_unsignedp = 1;
3503
3504   temp = expand_abs_nojump (mode, op0, target, result_unsignedp);
3505   if (temp != 0)
3506     return temp;
3507
3508   /* If that does not win, use conditional jump and negate.  */
3509
3510   /* It is safe to use the target if it is the same
3511      as the source if this is also a pseudo register */
3512   if (op0 == target && REG_P (op0)
3513       && REGNO (op0) >= FIRST_PSEUDO_REGISTER)
3514     safe = 1;
3515
3516   op1 = gen_label_rtx ();
3517   if (target == 0 || ! safe
3518       || GET_MODE (target) != mode
3519       || (MEM_P (target) && MEM_VOLATILE_P (target))
3520       || (REG_P (target)
3521           && REGNO (target) < FIRST_PSEUDO_REGISTER))
3522     target = gen_reg_rtx (mode);
3523
3524   emit_move_insn (target, op0);
3525   NO_DEFER_POP;
3526
3527   do_compare_rtx_and_jump (target, CONST0_RTX (mode), GE, 0, mode,
3528                            NULL_RTX, NULL_RTX, op1, -1);
3529
3530   op0 = expand_unop (mode, result_unsignedp ? neg_optab : negv_optab,
3531                      target, target, 0);
3532   if (op0 != target)
3533     emit_move_insn (target, op0);
3534   emit_label (op1);
3535   OK_DEFER_POP;
3536   return target;
3537 }
3538
3539 /* Emit code to compute the one's complement absolute value of OP0
3540    (if (OP0 < 0) OP0 = ~OP0), with result to TARGET if convenient.
3541    (TARGET may be NULL_RTX.)  The return value says where the result
3542    actually is to be found.
3543
3544    MODE is the mode of the operand; the mode of the result is
3545    different but can be deduced from MODE.  */
3546
3547 rtx
3548 expand_one_cmpl_abs_nojump (machine_mode mode, rtx op0, rtx target)
3549 {
3550   rtx temp;
3551
3552   /* Not applicable for floating point modes.  */
3553   if (FLOAT_MODE_P (mode))
3554     return NULL_RTX;
3555
3556   /* If we have a MAX insn, we can do this as MAX (x, ~x).  */
3557   if (optab_handler (smax_optab, mode) != CODE_FOR_nothing)
3558     {
3559       rtx_insn *last = get_last_insn ();
3560
3561       temp = expand_unop (mode, one_cmpl_optab, op0, NULL_RTX, 0);
3562       if (temp != 0)
3563         temp = expand_binop (mode, smax_optab, op0, temp, target, 0,
3564                              OPTAB_WIDEN);
3565
3566       if (temp != 0)
3567         return temp;
3568
3569       delete_insns_since (last);
3570     }
3571
3572   /* If this machine has expensive jumps, we can do one's complement
3573      absolute value of X as (((signed) x >> (W-1)) ^ x).  */
3574
3575   if (GET_MODE_CLASS (mode) == MODE_INT
3576       && BRANCH_COST (optimize_insn_for_speed_p (),
3577                      false) >= 2)
3578     {
3579       rtx extended = expand_shift (RSHIFT_EXPR, mode, op0,
3580                                    GET_MODE_PRECISION (mode) - 1,
3581                                    NULL_RTX, 0);
3582
3583       temp = expand_binop (mode, xor_optab, extended, op0, target, 0,
3584                            OPTAB_LIB_WIDEN);
3585
3586       if (temp != 0)
3587         return temp;
3588     }
3589
3590   return NULL_RTX;
3591 }
3592
3593 /* A subroutine of expand_copysign, perform the copysign operation using the
3594    abs and neg primitives advertised to exist on the target.  The assumption
3595    is that we have a split register file, and leaving op0 in fp registers,
3596    and not playing with subregs so much, will help the register allocator.  */
3597
3598 static rtx
3599 expand_copysign_absneg (machine_mode mode, rtx op0, rtx op1, rtx target,
3600                         int bitpos, bool op0_is_abs)
3601 {
3602   machine_mode imode;
3603   enum insn_code icode;
3604   rtx sign;
3605   rtx_code_label *label;
3606
3607   if (target == op1)
3608     target = NULL_RTX;
3609
3610   /* Check if the back end provides an insn that handles signbit for the
3611      argument's mode. */
3612   icode = optab_handler (signbit_optab, mode);
3613   if (icode != CODE_FOR_nothing)
3614     {
3615       imode = insn_data[(int) icode].operand[0].mode;
3616       sign = gen_reg_rtx (imode);
3617       emit_unop_insn (icode, sign, op1, UNKNOWN);
3618     }
3619   else
3620     {
3621       if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
3622         {
3623           imode = int_mode_for_mode (mode);
3624           if (imode == BLKmode)
3625             return NULL_RTX;
3626           op1 = gen_lowpart (imode, op1);
3627         }
3628       else
3629         {
3630           int word;
3631
3632           imode = word_mode;
3633           if (FLOAT_WORDS_BIG_ENDIAN)
3634             word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
3635           else
3636             word = bitpos / BITS_PER_WORD;
3637           bitpos = bitpos % BITS_PER_WORD;
3638           op1 = operand_subword_force (op1, word, mode);
3639         }
3640
3641       wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
3642       sign = expand_binop (imode, and_optab, op1,
3643                            immed_wide_int_const (mask, imode),
3644                            NULL_RTX, 1, OPTAB_LIB_WIDEN);
3645     }
3646
3647   if (!op0_is_abs)
3648     {
3649       op0 = expand_unop (mode, abs_optab, op0, target, 0);
3650       if (op0 == NULL)
3651         return NULL_RTX;
3652       target = op0;
3653     }
3654   else
3655     {
3656       if (target == NULL_RTX)
3657         target = copy_to_reg (op0);
3658       else
3659         emit_move_insn (target, op0);
3660     }
3661
3662   label = gen_label_rtx ();
3663   emit_cmp_and_jump_insns (sign, const0_rtx, EQ, NULL_RTX, imode, 1, label);
3664
3665   if (CONST_DOUBLE_AS_FLOAT_P (op0))
3666     op0 = simplify_unary_operation (NEG, mode, op0, mode);
3667   else
3668     op0 = expand_unop (mode, neg_optab, op0, target, 0);
3669   if (op0 != target)
3670     emit_move_insn (target, op0);
3671
3672   emit_label (label);
3673
3674   return target;
3675 }
3676
3677
3678 /* A subroutine of expand_copysign, perform the entire copysign operation
3679    with integer bitmasks.  BITPOS is the position of the sign bit; OP0_IS_ABS
3680    is true if op0 is known to have its sign bit clear.  */
3681
3682 static rtx
3683 expand_copysign_bit (machine_mode mode, rtx op0, rtx op1, rtx target,
3684                      int bitpos, bool op0_is_abs)
3685 {
3686   machine_mode imode;
3687   int word, nwords, i;
3688   rtx temp;
3689   rtx_insn *insns;
3690
3691   if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
3692     {
3693       imode = int_mode_for_mode (mode);
3694       if (imode == BLKmode)
3695         return NULL_RTX;
3696       word = 0;
3697       nwords = 1;
3698     }
3699   else
3700     {
3701       imode = word_mode;
3702
3703       if (FLOAT_WORDS_BIG_ENDIAN)
3704         word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
3705       else
3706         word = bitpos / BITS_PER_WORD;
3707       bitpos = bitpos % BITS_PER_WORD;
3708       nwords = (GET_MODE_BITSIZE (mode) + BITS_PER_WORD - 1) / BITS_PER_WORD;
3709     }
3710
3711   wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
3712
3713   if (target == 0
3714       || target == op0
3715       || target == op1
3716       || (nwords > 1 && !valid_multiword_target_p (target)))
3717     target = gen_reg_rtx (mode);
3718
3719   if (nwords > 1)
3720     {
3721       start_sequence ();
3722
3723       for (i = 0; i < nwords; ++i)
3724         {
3725           rtx targ_piece = operand_subword (target, i, 1, mode);
3726           rtx op0_piece = operand_subword_force (op0, i, mode);
3727
3728           if (i == word)
3729             {
3730               if (!op0_is_abs)
3731                 op0_piece
3732                   = expand_binop (imode, and_optab, op0_piece,
3733                                   immed_wide_int_const (~mask, imode),
3734                                   NULL_RTX, 1, OPTAB_LIB_WIDEN);
3735               op1 = expand_binop (imode, and_optab,
3736                                   operand_subword_force (op1, i, mode),
3737                                   immed_wide_int_const (mask, imode),
3738                                   NULL_RTX, 1, OPTAB_LIB_WIDEN);
3739
3740               temp = expand_binop (imode, ior_optab, op0_piece, op1,
3741                                    targ_piece, 1, OPTAB_LIB_WIDEN);
3742               if (temp != targ_piece)
3743                 emit_move_insn (targ_piece, temp);
3744             }
3745           else
3746             emit_move_insn (targ_piece, op0_piece);
3747         }
3748
3749       insns = get_insns ();
3750       end_sequence ();
3751
3752       emit_insn (insns);
3753     }
3754   else
3755     {
3756       op1 = expand_binop (imode, and_optab, gen_lowpart (imode, op1),
3757                           immed_wide_int_const (mask, imode),
3758                           NULL_RTX, 1, OPTAB_LIB_WIDEN);
3759
3760       op0 = gen_lowpart (imode, op0);
3761       if (!op0_is_abs)
3762         op0 = expand_binop (imode, and_optab, op0,
3763                             immed_wide_int_const (~mask, imode),
3764                             NULL_RTX, 1, OPTAB_LIB_WIDEN);
3765
3766       temp = expand_binop (imode, ior_optab, op0, op1,
3767                            gen_lowpart (imode, target), 1, OPTAB_LIB_WIDEN);
3768       target = lowpart_subreg_maybe_copy (mode, temp, imode);
3769     }
3770
3771   return target;
3772 }
3773
3774 /* Expand the C99 copysign operation.  OP0 and OP1 must be the same
3775    scalar floating point mode.  Return NULL if we do not know how to
3776    expand the operation inline.  */
3777
3778 rtx
3779 expand_copysign (rtx op0, rtx op1, rtx target)
3780 {
3781   machine_mode mode = GET_MODE (op0);
3782   const struct real_format *fmt;
3783   bool op0_is_abs;
3784   rtx temp;
3785
3786   gcc_assert (SCALAR_FLOAT_MODE_P (mode));
3787   gcc_assert (GET_MODE (op1) == mode);
3788
3789   /* First try to do it with a special instruction.  */
3790   temp = expand_binop (mode, copysign_optab, op0, op1,
3791                        target, 0, OPTAB_DIRECT);
3792   if (temp)
3793     return temp;
3794
3795   fmt = REAL_MODE_FORMAT (mode);
3796   if (fmt == NULL || !fmt->has_signed_zero)
3797     return NULL_RTX;
3798
3799   op0_is_abs = false;
3800   if (CONST_DOUBLE_AS_FLOAT_P (op0))
3801     {
3802       if (real_isneg (CONST_DOUBLE_REAL_VALUE (op0)))
3803         op0 = simplify_unary_operation (ABS, mode, op0, mode);
3804       op0_is_abs = true;
3805     }
3806
3807   if (fmt->signbit_ro >= 0
3808       && (CONST_DOUBLE_AS_FLOAT_P (op0)
3809           || (optab_handler (neg_optab, mode) != CODE_FOR_nothing
3810               && optab_handler (abs_optab, mode) != CODE_FOR_nothing)))
3811     {
3812       temp = expand_copysign_absneg (mode, op0, op1, target,
3813                                      fmt->signbit_ro, op0_is_abs);
3814       if (temp)
3815         return temp;
3816     }
3817
3818   if (fmt->signbit_rw < 0)
3819     return NULL_RTX;
3820   return expand_copysign_bit (mode, op0, op1, target,
3821                               fmt->signbit_rw, op0_is_abs);
3822 }
3823 \f
3824 /* Generate an instruction whose insn-code is INSN_CODE,
3825    with two operands: an output TARGET and an input OP0.
3826    TARGET *must* be nonzero, and the output is always stored there.
3827    CODE is an rtx code such that (CODE OP0) is an rtx that describes
3828    the value that is stored into TARGET.
3829
3830    Return false if expansion failed.  */
3831
3832 bool
3833 maybe_emit_unop_insn (enum insn_code icode, rtx target, rtx op0,
3834                       enum rtx_code code)
3835 {
3836   struct expand_operand ops[2];
3837   rtx pat;
3838
3839   create_output_operand (&ops[0], target, GET_MODE (target));
3840   create_input_operand (&ops[1], op0, GET_MODE (op0));
3841   pat = maybe_gen_insn (icode, 2, ops);
3842   if (!pat)
3843     return false;
3844
3845   if (INSN_P (pat) && NEXT_INSN (as_a <rtx_insn *> (pat)) != NULL_RTX
3846       && code != UNKNOWN)
3847     add_equal_note (as_a <rtx_insn *> (pat), ops[0].value, code, ops[1].value,
3848                     NULL_RTX);
3849
3850   emit_insn (pat);
3851
3852   if (ops[0].value != target)
3853     emit_move_insn (target, ops[0].value);
3854   return true;
3855 }
3856 /* Generate an instruction whose insn-code is INSN_CODE,
3857    with two operands: an output TARGET and an input OP0.
3858    TARGET *must* be nonzero, and the output is always stored there.
3859    CODE is an rtx code such that (CODE OP0) is an rtx that describes
3860    the value that is stored into TARGET.  */
3861
3862 void
3863 emit_unop_insn (enum insn_code icode, rtx target, rtx op0, enum rtx_code code)
3864 {
3865   bool ok = maybe_emit_unop_insn (icode, target, op0, code);
3866   gcc_assert (ok);
3867 }
3868 \f
3869 struct no_conflict_data
3870 {
3871   rtx target;
3872   rtx_insn *first, *insn;
3873   bool must_stay;
3874 };
3875
3876 /* Called via note_stores by emit_libcall_block.  Set P->must_stay if
3877    the currently examined clobber / store has to stay in the list of
3878    insns that constitute the actual libcall block.  */
3879 static void
3880 no_conflict_move_test (rtx dest, const_rtx set, void *p0)
3881 {
3882   struct no_conflict_data *p= (struct no_conflict_data *) p0;
3883
3884   /* If this inns directly contributes to setting the target, it must stay.  */
3885   if (reg_overlap_mentioned_p (p->target, dest))
3886     p->must_stay = true;
3887   /* If we haven't committed to keeping any other insns in the list yet,
3888      there is nothing more to check.  */
3889   else if (p->insn == p->first)
3890     return;
3891   /* If this insn sets / clobbers a register that feeds one of the insns
3892      already in the list, this insn has to stay too.  */
3893   else if (reg_overlap_mentioned_p (dest, PATTERN (p->first))
3894            || (CALL_P (p->first) && (find_reg_fusage (p->first, USE, dest)))
3895            || reg_used_between_p (dest, p->first, p->insn)
3896            /* Likewise if this insn depends on a register set by a previous
3897               insn in the list, or if it sets a result (presumably a hard
3898               register) that is set or clobbered by a previous insn.
3899               N.B. the modified_*_p (SET_DEST...) tests applied to a MEM
3900               SET_DEST perform the former check on the address, and the latter
3901               check on the MEM.  */
3902            || (GET_CODE (set) == SET
3903                && (modified_in_p (SET_SRC (set), p->first)
3904                    || modified_in_p (SET_DEST (set), p->first)
3905                    || modified_between_p (SET_SRC (set), p->first, p->insn)
3906                    || modified_between_p (SET_DEST (set), p->first, p->insn))))
3907     p->must_stay = true;
3908 }
3909
3910 \f
3911 /* Emit code to make a call to a constant function or a library call.
3912
3913    INSNS is a list containing all insns emitted in the call.
3914    These insns leave the result in RESULT.  Our block is to copy RESULT
3915    to TARGET, which is logically equivalent to EQUIV.
3916
3917    We first emit any insns that set a pseudo on the assumption that these are
3918    loading constants into registers; doing so allows them to be safely cse'ed
3919    between blocks.  Then we emit all the other insns in the block, followed by
3920    an insn to move RESULT to TARGET.  This last insn will have a REQ_EQUAL
3921    note with an operand of EQUIV.  */
3922
3923 static void
3924 emit_libcall_block_1 (rtx_insn *insns, rtx target, rtx result, rtx equiv,
3925                       bool equiv_may_trap)
3926 {
3927   rtx final_dest = target;
3928   rtx_insn *next, *last, *insn;
3929
3930   /* If this is a reg with REG_USERVAR_P set, then it could possibly turn
3931      into a MEM later.  Protect the libcall block from this change.  */
3932   if (! REG_P (target) || REG_USERVAR_P (target))
3933     target = gen_reg_rtx (GET_MODE (target));
3934
3935   /* If we're using non-call exceptions, a libcall corresponding to an
3936      operation that may trap may also trap.  */
3937   /* ??? See the comment in front of make_reg_eh_region_note.  */
3938   if (cfun->can_throw_non_call_exceptions
3939       && (equiv_may_trap || may_trap_p (equiv)))
3940     {
3941       for (insn = insns; insn; insn = NEXT_INSN (insn))
3942         if (CALL_P (insn))
3943           {
3944             rtx note = find_reg_note (insn, REG_EH_REGION, NULL_RTX);
3945             if (note)
3946               {
3947                 int lp_nr = INTVAL (XEXP (note, 0));
3948                 if (lp_nr == 0 || lp_nr == INT_MIN)
3949                   remove_note (insn, note);
3950               }
3951           }
3952     }
3953   else
3954     {
3955       /* Look for any CALL_INSNs in this sequence, and attach a REG_EH_REGION
3956          reg note to indicate that this call cannot throw or execute a nonlocal
3957          goto (unless there is already a REG_EH_REGION note, in which case
3958          we update it).  */
3959       for (insn = insns; insn; insn = NEXT_INSN (insn))
3960         if (CALL_P (insn))
3961           make_reg_eh_region_note_nothrow_nononlocal (insn);
3962     }
3963
3964   /* First emit all insns that set pseudos.  Remove them from the list as
3965      we go.  Avoid insns that set pseudos which were referenced in previous
3966      insns.  These can be generated by move_by_pieces, for example,
3967      to update an address.  Similarly, avoid insns that reference things
3968      set in previous insns.  */
3969
3970   for (insn = insns; insn; insn = next)
3971     {
3972       rtx set = single_set (insn);
3973
3974       next = NEXT_INSN (insn);
3975
3976       if (set != 0 && REG_P (SET_DEST (set))
3977           && REGNO (SET_DEST (set)) >= FIRST_PSEUDO_REGISTER)
3978         {
3979           struct no_conflict_data data;
3980
3981           data.target = const0_rtx;
3982           data.first = insns;
3983           data.insn = insn;
3984           data.must_stay = 0;
3985           note_stores (PATTERN (insn), no_conflict_move_test, &data);
3986           if (! data.must_stay)
3987             {
3988               if (PREV_INSN (insn))
3989                 SET_NEXT_INSN (PREV_INSN (insn)) = next;
3990               else
3991                 insns = next;
3992
3993               if (next)
3994                 SET_PREV_INSN (next) = PREV_INSN (insn);
3995
3996               add_insn (insn);
3997             }
3998         }
3999
4000       /* Some ports use a loop to copy large arguments onto the stack.
4001          Don't move anything outside such a loop.  */
4002       if (LABEL_P (insn))
4003         break;
4004     }
4005
4006   /* Write the remaining insns followed by the final copy.  */
4007   for (insn = insns; insn; insn = next)
4008     {
4009       next = NEXT_INSN (insn);
4010
4011       add_insn (insn);
4012     }
4013
4014   last = emit_move_insn (target, result);
4015   set_dst_reg_note (last, REG_EQUAL, copy_rtx (equiv), target);
4016
4017   if (final_dest != target)
4018     emit_move_insn (final_dest, target);
4019 }
4020
4021 void
4022 emit_libcall_block (rtx insns, rtx target, rtx result, rtx equiv)
4023 {
4024   emit_libcall_block_1 (safe_as_a <rtx_insn *> (insns),
4025                         target, result, equiv, false);
4026 }
4027 \f
4028 /* Nonzero if we can perform a comparison of mode MODE straightforwardly.
4029    PURPOSE describes how this comparison will be used.  CODE is the rtx
4030    comparison code we will be using.
4031
4032    ??? Actually, CODE is slightly weaker than that.  A target is still
4033    required to implement all of the normal bcc operations, but not
4034    required to implement all (or any) of the unordered bcc operations.  */
4035
4036 int
4037 can_compare_p (enum rtx_code code, machine_mode mode,
4038                enum can_compare_purpose purpose)
4039 {
4040   rtx test;
4041   test = gen_rtx_fmt_ee (code, mode, const0_rtx, const0_rtx);
4042   do
4043     {
4044       enum insn_code icode;
4045
4046       if (purpose == ccp_jump
4047           && (icode = optab_handler (cbranch_optab, mode)) != CODE_FOR_nothing
4048           && insn_operand_matches (icode, 0, test))
4049         return 1;
4050       if (purpose == ccp_store_flag
4051           && (icode = optab_handler (cstore_optab, mode)) != CODE_FOR_nothing
4052           && insn_operand_matches (icode, 1, test))
4053         return 1;
4054       if (purpose == ccp_cmov
4055           && optab_handler (cmov_optab, mode) != CODE_FOR_nothing)
4056         return 1;
4057
4058       mode = GET_MODE_WIDER_MODE (mode);
4059       PUT_MODE (test, mode);
4060     }
4061   while (mode != VOIDmode);
4062
4063   return 0;
4064 }
4065
4066 /* This function is called when we are going to emit a compare instruction that
4067    compares the values found in *PX and *PY, using the rtl operator COMPARISON.
4068
4069    *PMODE is the mode of the inputs (in case they are const_int).
4070    *PUNSIGNEDP nonzero says that the operands are unsigned;
4071    this matters if they need to be widened (as given by METHODS).
4072
4073    If they have mode BLKmode, then SIZE specifies the size of both operands.
4074
4075    This function performs all the setup necessary so that the caller only has
4076    to emit a single comparison insn.  This setup can involve doing a BLKmode
4077    comparison or emitting a library call to perform the comparison if no insn
4078    is available to handle it.
4079    The values which are passed in through pointers can be modified; the caller
4080    should perform the comparison on the modified values.  Constant
4081    comparisons must have already been folded.  */
4082
4083 static void
4084 prepare_cmp_insn (rtx x, rtx y, enum rtx_code comparison, rtx size,
4085                   int unsignedp, enum optab_methods methods,
4086                   rtx *ptest, machine_mode *pmode)
4087 {
4088   machine_mode mode = *pmode;
4089   rtx libfunc, test;
4090   machine_mode cmp_mode;
4091   enum mode_class mclass;
4092
4093   /* The other methods are not needed.  */
4094   gcc_assert (methods == OPTAB_DIRECT || methods == OPTAB_WIDEN
4095               || methods == OPTAB_LIB_WIDEN);
4096
4097   /* If we are optimizing, force expensive constants into a register.  */
4098   if (CONSTANT_P (x) && optimize
4099       && (rtx_cost (x, COMPARE, 0, optimize_insn_for_speed_p ())
4100           > COSTS_N_INSNS (1)))
4101     x = force_reg (mode, x);
4102
4103   if (CONSTANT_P (y) && optimize
4104       && (rtx_cost (y, COMPARE, 1, optimize_insn_for_speed_p ())
4105           > COSTS_N_INSNS (1)))
4106     y = force_reg (mode, y);
4107
4108 #ifdef HAVE_cc0
4109   /* Make sure if we have a canonical comparison.  The RTL
4110      documentation states that canonical comparisons are required only
4111      for targets which have cc0.  */
4112   gcc_assert (!CONSTANT_P (x) || CONSTANT_P (y));
4113 #endif
4114
4115   /* Don't let both operands fail to indicate the mode.  */
4116   if (GET_MODE (x) == VOIDmode && GET_MODE (y) == VOIDmode)
4117     x = force_reg (mode, x);
4118   if (mode == VOIDmode)
4119     mode = GET_MODE (x) != VOIDmode ? GET_MODE (x) : GET_MODE (y);
4120
4121   /* Handle all BLKmode compares.  */
4122
4123   if (mode == BLKmode)
4124     {
4125       machine_mode result_mode;
4126       enum insn_code cmp_code;
4127       tree length_type;
4128       rtx libfunc;
4129       rtx result;
4130       rtx opalign
4131         = GEN_INT (MIN (MEM_ALIGN (x), MEM_ALIGN (y)) / BITS_PER_UNIT);
4132
4133       gcc_assert (size);
4134
4135       /* Try to use a memory block compare insn - either cmpstr
4136          or cmpmem will do.  */
4137       for (cmp_mode = GET_CLASS_NARROWEST_MODE (MODE_INT);
4138            cmp_mode != VOIDmode;
4139            cmp_mode = GET_MODE_WIDER_MODE (cmp_mode))
4140         {
4141           cmp_code = direct_optab_handler (cmpmem_optab, cmp_mode);
4142           if (cmp_code == CODE_FOR_nothing)
4143             cmp_code = direct_optab_handler (cmpstr_optab, cmp_mode);
4144           if (cmp_code == CODE_FOR_nothing)
4145             cmp_code = direct_optab_handler (cmpstrn_optab, cmp_mode);
4146           if (cmp_code == CODE_FOR_nothing)
4147             continue;
4148
4149           /* Must make sure the size fits the insn's mode.  */
4150           if ((CONST_INT_P (size)
4151                && INTVAL (size) >= (1 << GET_MODE_BITSIZE (cmp_mode)))
4152               || (GET_MODE_BITSIZE (GET_MODE (size))
4153                   > GET_MODE_BITSIZE (cmp_mode)))
4154             continue;
4155
4156           result_mode = insn_data[cmp_code].operand[0].mode;
4157           result = gen_reg_rtx (result_mode);
4158           size = convert_to_mode (cmp_mode, size, 1);
4159           emit_insn (GEN_FCN (cmp_code) (result, x, y, size, opalign));
4160
4161           *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, result, const0_rtx);
4162           *pmode = result_mode;
4163           return;
4164         }
4165
4166       if (methods != OPTAB_LIB && methods != OPTAB_LIB_WIDEN)
4167         goto fail;
4168
4169       /* Otherwise call a library function, memcmp.  */
4170       libfunc = memcmp_libfunc;
4171       length_type = sizetype;
4172       result_mode = TYPE_MODE (integer_type_node);
4173       cmp_mode = TYPE_MODE (length_type);
4174       size = convert_to_mode (TYPE_MODE (length_type), size,
4175                               TYPE_UNSIGNED (length_type));
4176
4177       result = emit_library_call_value (libfunc, 0, LCT_PURE,
4178                                         result_mode, 3,
4179                                         XEXP (x, 0), Pmode,
4180                                         XEXP (y, 0), Pmode,
4181                                         size, cmp_mode);
4182       x = result;
4183       y = const0_rtx;
4184       mode = result_mode;
4185       methods = OPTAB_LIB_WIDEN;
4186       unsignedp = false;
4187     }
4188
4189   /* Don't allow operands to the compare to trap, as that can put the
4190      compare and branch in different basic blocks.  */
4191   if (cfun->can_throw_non_call_exceptions)
4192     {
4193       if (may_trap_p (x))
4194         x = force_reg (mode, x);
4195       if (may_trap_p (y))
4196         y = force_reg (mode, y);
4197     }
4198
4199   if (GET_MODE_CLASS (mode) == MODE_CC)
4200     {
4201       gcc_assert (can_compare_p (comparison, CCmode, ccp_jump));
4202       *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, x, y);
4203       return;
4204     }
4205
4206   mclass = GET_MODE_CLASS (mode);
4207   test = gen_rtx_fmt_ee (comparison, VOIDmode, x, y);
4208   cmp_mode = mode;
4209   do
4210    {
4211       enum insn_code icode;
4212       icode = optab_handler (cbranch_optab, cmp_mode);
4213       if (icode != CODE_FOR_nothing
4214           && insn_operand_matches (icode, 0, test))
4215         {
4216           rtx_insn *last = get_last_insn ();
4217           rtx op0 = prepare_operand (icode, x, 1, mode, cmp_mode, unsignedp);
4218           rtx op1 = prepare_operand (icode, y, 2, mode, cmp_mode, unsignedp);
4219           if (op0 && op1
4220               && insn_operand_matches (icode, 1, op0)
4221               && insn_operand_matches (icode, 2, op1))
4222             {
4223               XEXP (test, 0) = op0;
4224               XEXP (test, 1) = op1;
4225               *ptest = test;
4226               *pmode = cmp_mode;
4227               return;
4228             }
4229           delete_insns_since (last);
4230         }
4231
4232       if (methods == OPTAB_DIRECT || !CLASS_HAS_WIDER_MODES_P (mclass))
4233         break;
4234       cmp_mode = GET_MODE_WIDER_MODE (cmp_mode);
4235     }
4236   while (cmp_mode != VOIDmode);
4237
4238   if (methods != OPTAB_LIB_WIDEN)
4239     goto fail;
4240
4241   if (!SCALAR_FLOAT_MODE_P (mode))
4242     {
4243       rtx result;
4244       machine_mode ret_mode;
4245
4246       /* Handle a libcall just for the mode we are using.  */
4247       libfunc = optab_libfunc (cmp_optab, mode);
4248       gcc_assert (libfunc);
4249
4250       /* If we want unsigned, and this mode has a distinct unsigned
4251          comparison routine, use that.  */
4252       if (unsignedp)
4253         {
4254           rtx ulibfunc = optab_libfunc (ucmp_optab, mode);
4255           if (ulibfunc)
4256             libfunc = ulibfunc;
4257         }
4258
4259       ret_mode = targetm.libgcc_cmp_return_mode ();
4260       result = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
4261                                         ret_mode, 2, x, mode, y, mode);
4262
4263       /* There are two kinds of comparison routines. Biased routines
4264          return 0/1/2, and unbiased routines return -1/0/1. Other parts
4265          of gcc expect that the comparison operation is equivalent
4266          to the modified comparison. For signed comparisons compare the
4267          result against 1 in the biased case, and zero in the unbiased
4268          case. For unsigned comparisons always compare against 1 after
4269          biasing the unbiased result by adding 1. This gives us a way to
4270          represent LTU.
4271          The comparisons in the fixed-point helper library are always
4272          biased.  */
4273       x = result;
4274       y = const1_rtx;
4275
4276       if (!TARGET_LIB_INT_CMP_BIASED && !ALL_FIXED_POINT_MODE_P (mode))
4277         {
4278           if (unsignedp)
4279             x = plus_constant (ret_mode, result, 1);
4280           else
4281             y = const0_rtx;
4282         }
4283
4284       *pmode = ret_mode;
4285       prepare_cmp_insn (x, y, comparison, NULL_RTX, unsignedp, methods,
4286                         ptest, pmode);
4287     }
4288   else
4289     prepare_float_lib_cmp (x, y, comparison, ptest, pmode);
4290
4291   return;
4292
4293  fail:
4294   *ptest = NULL_RTX;
4295 }
4296
4297 /* Before emitting an insn with code ICODE, make sure that X, which is going
4298    to be used for operand OPNUM of the insn, is converted from mode MODE to
4299    WIDER_MODE (UNSIGNEDP determines whether it is an unsigned conversion), and
4300    that it is accepted by the operand predicate.  Return the new value.  */
4301
4302 rtx
4303 prepare_operand (enum insn_code icode, rtx x, int opnum, machine_mode mode,
4304                  machine_mode wider_mode, int unsignedp)
4305 {
4306   if (mode != wider_mode)
4307     x = convert_modes (wider_mode, mode, x, unsignedp);
4308
4309   if (!insn_operand_matches (icode, opnum, x))
4310     {
4311       if (reload_completed)
4312         return NULL_RTX;
4313       x = copy_to_mode_reg (insn_data[(int) icode].operand[opnum].mode, x);
4314     }
4315
4316   return x;
4317 }
4318
4319 /* Subroutine of emit_cmp_and_jump_insns; this function is called when we know
4320    we can do the branch.  */
4321
4322 static void
4323 emit_cmp_and_jump_insn_1 (rtx test, machine_mode mode, rtx label, int prob)
4324 {
4325   machine_mode optab_mode;
4326   enum mode_class mclass;
4327   enum insn_code icode;
4328   rtx_insn *insn;
4329
4330   mclass = GET_MODE_CLASS (mode);
4331   optab_mode = (mclass == MODE_CC) ? CCmode : mode;
4332   icode = optab_handler (cbranch_optab, optab_mode);
4333
4334   gcc_assert (icode != CODE_FOR_nothing);
4335   gcc_assert (insn_operand_matches (icode, 0, test));
4336   insn = emit_jump_insn (GEN_FCN (icode) (test, XEXP (test, 0),
4337                                           XEXP (test, 1), label));
4338   if (prob != -1
4339       && profile_status_for_fn (cfun) != PROFILE_ABSENT
4340       && insn
4341       && JUMP_P (insn)
4342       && any_condjump_p (insn)
4343       && !find_reg_note (insn, REG_BR_PROB, 0))
4344     add_int_reg_note (insn, REG_BR_PROB, prob);
4345 }
4346
4347 /* Generate code to compare X with Y so that the condition codes are
4348    set and to jump to LABEL if the condition is true.  If X is a
4349    constant and Y is not a constant, then the comparison is swapped to
4350    ensure that the comparison RTL has the canonical form.
4351
4352    UNSIGNEDP nonzero says that X and Y are unsigned; this matters if they
4353    need to be widened.  UNSIGNEDP is also used to select the proper
4354    branch condition code.
4355
4356    If X and Y have mode BLKmode, then SIZE specifies the size of both X and Y.
4357
4358    MODE is the mode of the inputs (in case they are const_int).
4359
4360    COMPARISON is the rtl operator to compare with (EQ, NE, GT, etc.).
4361    It will be potentially converted into an unsigned variant based on
4362    UNSIGNEDP to select a proper jump instruction.
4363
4364    PROB is the probability of jumping to LABEL.  */
4365
4366 void
4367 emit_cmp_and_jump_insns (rtx x, rtx y, enum rtx_code comparison, rtx size,
4368                          machine_mode mode, int unsignedp, rtx label,
4369                          int prob)
4370 {
4371   rtx op0 = x, op1 = y;
4372   rtx test;
4373
4374   /* Swap operands and condition to ensure canonical RTL.  */
4375   if (swap_commutative_operands_p (x, y)
4376       && can_compare_p (swap_condition (comparison), mode, ccp_jump))
4377     {
4378       op0 = y, op1 = x;
4379       comparison = swap_condition (comparison);
4380     }
4381
4382   /* If OP0 is still a constant, then both X and Y must be constants
4383      or the opposite comparison is not supported.  Force X into a register
4384      to create canonical RTL.  */
4385   if (CONSTANT_P (op0))
4386     op0 = force_reg (mode, op0);
4387
4388   if (unsignedp)
4389     comparison = unsigned_condition (comparison);
4390
4391   prepare_cmp_insn (op0, op1, comparison, size, unsignedp, OPTAB_LIB_WIDEN,
4392                     &test, &mode);
4393   emit_cmp_and_jump_insn_1 (test, mode, label, prob);
4394 }
4395
4396 \f
4397 /* Emit a library call comparison between floating point X and Y.
4398    COMPARISON is the rtl operator to compare with (EQ, NE, GT, etc.).  */
4399
4400 static void
4401 prepare_float_lib_cmp (rtx x, rtx y, enum rtx_code comparison,
4402                        rtx *ptest, machine_mode *pmode)
4403 {
4404   enum rtx_code swapped = swap_condition (comparison);
4405   enum rtx_code reversed = reverse_condition_maybe_unordered (comparison);
4406   machine_mode orig_mode = GET_MODE (x);
4407   machine_mode mode, cmp_mode;
4408   rtx true_rtx, false_rtx;
4409   rtx value, target, equiv;
4410   rtx_insn *insns;
4411   rtx libfunc = 0;
4412   bool reversed_p = false;
4413   cmp_mode = targetm.libgcc_cmp_return_mode ();
4414
4415   for (mode = orig_mode;
4416        mode != VOIDmode;
4417        mode = GET_MODE_WIDER_MODE (mode))
4418     {
4419       if (code_to_optab (comparison)
4420           && (libfunc = optab_libfunc (code_to_optab (comparison), mode)))
4421         break;
4422
4423       if (code_to_optab (swapped)
4424           && (libfunc = optab_libfunc (code_to_optab (swapped), mode)))
4425         {
4426           rtx tmp;
4427           tmp = x; x = y; y = tmp;
4428           comparison = swapped;
4429           break;
4430         }
4431
4432       if (code_to_optab (reversed)
4433           && (libfunc = optab_libfunc (code_to_optab (reversed), mode)))
4434         {
4435           comparison = reversed;
4436           reversed_p = true;
4437           break;
4438         }
4439     }
4440
4441   gcc_assert (mode != VOIDmode);
4442
4443   if (mode != orig_mode)
4444     {
4445       x = convert_to_mode (mode, x, 0);
4446       y = convert_to_mode (mode, y, 0);
4447     }
4448
4449   /* Attach a REG_EQUAL note describing the semantics of the libcall to
4450      the RTL.  The allows the RTL optimizers to delete the libcall if the
4451      condition can be determined at compile-time.  */
4452   if (comparison == UNORDERED
4453       || FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison))
4454     {
4455       true_rtx = const_true_rtx;
4456       false_rtx = const0_rtx;
4457     }
4458   else
4459     {
4460       switch (comparison)
4461         {
4462         case EQ:
4463           true_rtx = const0_rtx;
4464           false_rtx = const_true_rtx;
4465           break;
4466
4467         case NE:
4468           true_rtx = const_true_rtx;
4469           false_rtx = const0_rtx;
4470           break;
4471
4472         case GT:
4473           true_rtx = const1_rtx;
4474           false_rtx = const0_rtx;
4475           break;
4476
4477         case GE:
4478           true_rtx = const0_rtx;
4479           false_rtx = constm1_rtx;
4480           break;
4481
4482         case LT:
4483           true_rtx = constm1_rtx;
4484           false_rtx = const0_rtx;
4485           break;
4486
4487         case LE:
4488           true_rtx = const0_rtx;
4489           false_rtx = const1_rtx;
4490           break;
4491
4492         default:
4493           gcc_unreachable ();
4494         }
4495     }
4496
4497   if (comparison == UNORDERED)
4498     {
4499       rtx temp = simplify_gen_relational (NE, cmp_mode, mode, x, x);
4500       equiv = simplify_gen_relational (NE, cmp_mode, mode, y, y);
4501       equiv = simplify_gen_ternary (IF_THEN_ELSE, cmp_mode, cmp_mode,
4502                                     temp, const_true_rtx, equiv);
4503     }
4504   else
4505     {
4506       equiv = simplify_gen_relational (comparison, cmp_mode, mode, x, y);
4507       if (! FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison))
4508         equiv = simplify_gen_ternary (IF_THEN_ELSE, cmp_mode, cmp_mode,
4509                                       equiv, true_rtx, false_rtx);
4510     }
4511
4512   start_sequence ();
4513   value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
4514                                    cmp_mode, 2, x, mode, y, mode);
4515   insns = get_insns ();
4516   end_sequence ();
4517
4518   target = gen_reg_rtx (cmp_mode);
4519   emit_libcall_block (insns, target, value, equiv);
4520
4521   if (comparison == UNORDERED
4522       || FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison)
4523       || reversed_p)
4524     *ptest = gen_rtx_fmt_ee (reversed_p ? EQ : NE, VOIDmode, target, false_rtx);
4525   else
4526     *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, target, const0_rtx);
4527
4528   *pmode = cmp_mode;
4529 }
4530 \f
4531 /* Generate code to indirectly jump to a location given in the rtx LOC.  */
4532
4533 void
4534 emit_indirect_jump (rtx loc)
4535 {
4536   struct expand_operand ops[1];
4537
4538   create_address_operand (&ops[0], loc);
4539   expand_jump_insn (CODE_FOR_indirect_jump, 1, ops);
4540   emit_barrier ();
4541 }
4542 \f
4543 #ifdef HAVE_conditional_move
4544
4545 /* Emit a conditional move instruction if the machine supports one for that
4546    condition and machine mode.
4547
4548    OP0 and OP1 are the operands that should be compared using CODE.  CMODE is
4549    the mode to use should they be constants.  If it is VOIDmode, they cannot
4550    both be constants.
4551
4552    OP2 should be stored in TARGET if the comparison is true, otherwise OP3
4553    should be stored there.  MODE is the mode to use should they be constants.
4554    If it is VOIDmode, they cannot both be constants.
4555
4556    The result is either TARGET (perhaps modified) or NULL_RTX if the operation
4557    is not supported.  */
4558
4559 rtx
4560 emit_conditional_move (rtx target, enum rtx_code code, rtx op0, rtx op1,
4561                        machine_mode cmode, rtx op2, rtx op3,
4562                        machine_mode mode, int unsignedp)
4563 {
4564   rtx tem, comparison;
4565   rtx_insn *last;
4566   enum insn_code icode;
4567   enum rtx_code reversed;
4568
4569   /* If one operand is constant, make it the second one.  Only do this
4570      if the other operand is not constant as well.  */
4571
4572   if (swap_commutative_operands_p (op0, op1))
4573     {
4574       tem = op0;
4575       op0 = op1;
4576       op1 = tem;
4577       code = swap_condition (code);
4578     }
4579
4580   /* get_condition will prefer to generate LT and GT even if the old
4581      comparison was against zero, so undo that canonicalization here since
4582      comparisons against zero are cheaper.  */
4583   if (code == LT && op1 == const1_rtx)
4584     code = LE, op1 = const0_rtx;
4585   else if (code == GT && op1 == constm1_rtx)
4586     code = GE, op1 = const0_rtx;
4587
4588   if (cmode == VOIDmode)
4589     cmode = GET_MODE (op0);
4590
4591   if (swap_commutative_operands_p (op2, op3)
4592       && ((reversed = reversed_comparison_code_parts (code, op0, op1, NULL))
4593           != UNKNOWN))
4594     {
4595       tem = op2;
4596       op2 = op3;
4597       op3 = tem;
4598       code = reversed;
4599     }
4600
4601   if (mode == VOIDmode)
4602     mode = GET_MODE (op2);
4603
4604   icode = direct_optab_handler (movcc_optab, mode);
4605
4606   if (icode == CODE_FOR_nothing)
4607     return 0;
4608
4609   if (!target)
4610     target = gen_reg_rtx (mode);
4611
4612   code = unsignedp ? unsigned_condition (code) : code;
4613   comparison = simplify_gen_relational (code, VOIDmode, cmode, op0, op1);
4614
4615   /* We can get const0_rtx or const_true_rtx in some circumstances.  Just
4616      return NULL and let the caller figure out how best to deal with this
4617      situation.  */
4618   if (!COMPARISON_P (comparison))
4619     return NULL_RTX;
4620
4621   saved_pending_stack_adjust save;
4622   save_pending_stack_adjust (&save);
4623   last = get_last_insn ();
4624   do_pending_stack_adjust ();
4625   prepare_cmp_insn (XEXP (comparison, 0), XEXP (comparison, 1),
4626                     GET_CODE (comparison), NULL_RTX, unsignedp, OPTAB_WIDEN,
4627                     &comparison, &cmode);
4628   if (comparison)
4629     {
4630       struct expand_operand ops[4];
4631
4632       create_output_operand (&ops[0], target, mode);
4633       create_fixed_operand (&ops[1], comparison);
4634       create_input_operand (&ops[2], op2, mode);
4635       create_input_operand (&ops[3], op3, mode);
4636       if (maybe_expand_insn (icode, 4, ops))
4637         {
4638           if (ops[0].value != target)
4639             convert_move (target, ops[0].value, false);
4640           return target;
4641         }
4642     }
4643   delete_insns_since (last);
4644   restore_pending_stack_adjust (&save);
4645   return NULL_RTX;
4646 }
4647
4648 /* Return nonzero if a conditional move of mode MODE is supported.
4649
4650    This function is for combine so it can tell whether an insn that looks
4651    like a conditional move is actually supported by the hardware.  If we
4652    guess wrong we lose a bit on optimization, but that's it.  */
4653 /* ??? sparc64 supports conditionally moving integers values based on fp
4654    comparisons, and vice versa.  How do we handle them?  */
4655
4656 int
4657 can_conditionally_move_p (machine_mode mode)
4658 {
4659   if (direct_optab_handler (movcc_optab, mode) != CODE_FOR_nothing)
4660     return 1;
4661
4662   return 0;
4663 }
4664
4665 #endif /* HAVE_conditional_move */
4666
4667 /* Emit a conditional addition instruction if the machine supports one for that
4668    condition and machine mode.
4669
4670    OP0 and OP1 are the operands that should be compared using CODE.  CMODE is
4671    the mode to use should they be constants.  If it is VOIDmode, they cannot
4672    both be constants.
4673
4674    OP2 should be stored in TARGET if the comparison is false, otherwise OP2+OP3
4675    should be stored there.  MODE is the mode to use should they be constants.
4676    If it is VOIDmode, they cannot both be constants.
4677
4678    The result is either TARGET (perhaps modified) or NULL_RTX if the operation
4679    is not supported.  */
4680
4681 rtx
4682 emit_conditional_add (rtx target, enum rtx_code code, rtx op0, rtx op1,
4683                       machine_mode cmode, rtx op2, rtx op3,
4684                       machine_mode mode, int unsignedp)
4685 {
4686   rtx tem, comparison;
4687   rtx_insn *last;
4688   enum insn_code icode;
4689
4690   /* If one operand is constant, make it the second one.  Only do this
4691      if the other operand is not constant as well.  */
4692
4693   if (swap_commutative_operands_p (op0, op1))
4694     {
4695       tem = op0;
4696       op0 = op1;
4697       op1 = tem;
4698       code = swap_condition (code);
4699     }
4700
4701   /* get_condition will prefer to generate LT and GT even if the old
4702      comparison was against zero, so undo that canonicalization here since
4703      comparisons against zero are cheaper.  */
4704   if (code == LT && op1 == const1_rtx)
4705     code = LE, op1 = const0_rtx;
4706   else if (code == GT && op1 == constm1_rtx)
4707     code = GE, op1 = const0_rtx;
4708
4709   if (cmode == VOIDmode)
4710     cmode = GET_MODE (op0);
4711
4712   if (mode == VOIDmode)
4713     mode = GET_MODE (op2);
4714
4715   icode = optab_handler (addcc_optab, mode);
4716
4717   if (icode == CODE_FOR_nothing)
4718     return 0;
4719
4720   if (!target)
4721     target = gen_reg_rtx (mode);
4722
4723   code = unsignedp ? unsigned_condition (code) : code;
4724   comparison = simplify_gen_relational (code, VOIDmode, cmode, op0, op1);
4725
4726   /* We can get const0_rtx or const_true_rtx in some circumstances.  Just
4727      return NULL and let the caller figure out how best to deal with this
4728      situation.  */
4729   if (!COMPARISON_P (comparison))
4730     return NULL_RTX;
4731
4732   do_pending_stack_adjust ();
4733   last = get_last_insn ();
4734   prepare_cmp_insn (XEXP (comparison, 0), XEXP (comparison, 1),
4735                     GET_CODE (comparison), NULL_RTX, unsignedp, OPTAB_WIDEN,
4736                     &comparison, &cmode);
4737   if (comparison)
4738     {
4739       struct expand_operand ops[4];
4740
4741       create_output_operand (&ops[0], target, mode);
4742       create_fixed_operand (&ops[1], comparison);
4743       create_input_operand (&ops[2], op2, mode);
4744       create_input_operand (&ops[3], op3, mode);
4745       if (maybe_expand_insn (icode, 4, ops))
4746         {
4747           if (ops[0].value != target)
4748             convert_move (target, ops[0].value, false);
4749           return target;
4750         }
4751     }
4752   delete_insns_since (last);
4753   return NULL_RTX;
4754 }
4755 \f
4756 /* These functions attempt to generate an insn body, rather than
4757    emitting the insn, but if the gen function already emits them, we
4758    make no attempt to turn them back into naked patterns.  */
4759
4760 /* Generate and return an insn body to add Y to X.  */
4761
4762 rtx
4763 gen_add2_insn (rtx x, rtx y)
4764 {
4765   enum insn_code icode = optab_handler (add_optab, GET_MODE (x));
4766
4767   gcc_assert (insn_operand_matches (icode, 0, x));
4768   gcc_assert (insn_operand_matches (icode, 1, x));
4769   gcc_assert (insn_operand_matches (icode, 2, y));
4770
4771   return GEN_FCN (icode) (x, x, y);
4772 }
4773
4774 /* Generate and return an insn body to add r1 and c,
4775    storing the result in r0.  */
4776
4777 rtx
4778 gen_add3_insn (rtx r0, rtx r1, rtx c)
4779 {
4780   enum insn_code icode = optab_handler (add_optab, GET_MODE (r0));
4781
4782   if (icode == CODE_FOR_nothing
4783       || !insn_operand_matches (icode, 0, r0)
4784       || !insn_operand_matches (icode, 1, r1)
4785       || !insn_operand_matches (icode, 2, c))
4786     return NULL_RTX;
4787
4788   return GEN_FCN (icode) (r0, r1, c);
4789 }
4790
4791 int
4792 have_add2_insn (rtx x, rtx y)
4793 {
4794   enum insn_code icode;
4795
4796   gcc_assert (GET_MODE (x) != VOIDmode);
4797
4798   icode = optab_handler (add_optab, GET_MODE (x));
4799
4800   if (icode == CODE_FOR_nothing)
4801     return 0;
4802
4803   if (!insn_operand_matches (icode, 0, x)
4804       || !insn_operand_matches (icode, 1, x)
4805       || !insn_operand_matches (icode, 2, y))
4806     return 0;
4807
4808   return 1;
4809 }
4810
4811 /* Generate and return an insn body to add Y to X.  */
4812
4813 rtx
4814 gen_addptr3_insn (rtx x, rtx y, rtx z)
4815 {
4816   enum insn_code icode = optab_handler (addptr3_optab, GET_MODE (x));
4817
4818   gcc_assert (insn_operand_matches (icode, 0, x));
4819   gcc_assert (insn_operand_matches (icode, 1, y));
4820   gcc_assert (insn_operand_matches (icode, 2, z));
4821
4822   return GEN_FCN (icode) (x, y, z);
4823 }
4824
4825 /* Return true if the target implements an addptr pattern and X, Y,
4826    and Z are valid for the pattern predicates.  */
4827
4828 int
4829 have_addptr3_insn (rtx x, rtx y, rtx z)
4830 {
4831   enum insn_code icode;
4832
4833   gcc_assert (GET_MODE (x) != VOIDmode);
4834
4835   icode = optab_handler (addptr3_optab, GET_MODE (x));
4836
4837   if (icode == CODE_FOR_nothing)
4838     return 0;
4839
4840   if (!insn_operand_matches (icode, 0, x)
4841       || !insn_operand_matches (icode, 1, y)
4842       || !insn_operand_matches (icode, 2, z))
4843     return 0;
4844
4845   return 1;
4846 }
4847
4848 /* Generate and return an insn body to subtract Y from X.  */
4849
4850 rtx
4851 gen_sub2_insn (rtx x, rtx y)
4852 {
4853   enum insn_code icode = optab_handler (sub_optab, GET_MODE (x));
4854
4855   gcc_assert (insn_operand_matches (icode, 0, x));
4856   gcc_assert (insn_operand_matches (icode, 1, x));
4857   gcc_assert (insn_operand_matches (icode, 2, y));
4858
4859   return GEN_FCN (icode) (x, x, y);
4860 }
4861
4862 /* Generate and return an insn body to subtract r1 and c,
4863    storing the result in r0.  */
4864
4865 rtx
4866 gen_sub3_insn (rtx r0, rtx r1, rtx c)
4867 {
4868   enum insn_code icode = optab_handler (sub_optab, GET_MODE (r0));
4869
4870   if (icode == CODE_FOR_nothing
4871       || !insn_operand_matches (icode, 0, r0)
4872       || !insn_operand_matches (icode, 1, r1)
4873       || !insn_operand_matches (icode, 2, c))
4874     return NULL_RTX;
4875
4876   return GEN_FCN (icode) (r0, r1, c);
4877 }
4878
4879 int
4880 have_sub2_insn (rtx x, rtx y)
4881 {
4882   enum insn_code icode;
4883
4884   gcc_assert (GET_MODE (x) != VOIDmode);
4885
4886   icode = optab_handler (sub_optab, GET_MODE (x));
4887
4888   if (icode == CODE_FOR_nothing)
4889     return 0;
4890
4891   if (!insn_operand_matches (icode, 0, x)
4892       || !insn_operand_matches (icode, 1, x)
4893       || !insn_operand_matches (icode, 2, y))
4894     return 0;
4895
4896   return 1;
4897 }
4898 \f
4899 /* Return the insn code used to extend FROM_MODE to TO_MODE.
4900    UNSIGNEDP specifies zero-extension instead of sign-extension.  If
4901    no such operation exists, CODE_FOR_nothing will be returned.  */
4902
4903 enum insn_code
4904 can_extend_p (machine_mode to_mode, machine_mode from_mode,
4905               int unsignedp)
4906 {
4907   convert_optab tab;
4908 #ifdef HAVE_ptr_extend
4909   if (unsignedp < 0)
4910     return CODE_FOR_ptr_extend;
4911 #endif
4912
4913   tab = unsignedp ? zext_optab : sext_optab;
4914   return convert_optab_handler (tab, to_mode, from_mode);
4915 }
4916
4917 /* Generate the body of an insn to extend Y (with mode MFROM)
4918    into X (with mode MTO).  Do zero-extension if UNSIGNEDP is nonzero.  */
4919
4920 rtx
4921 gen_extend_insn (rtx x, rtx y, machine_mode mto,
4922                  machine_mode mfrom, int unsignedp)
4923 {
4924   enum insn_code icode = can_extend_p (mto, mfrom, unsignedp);
4925   return GEN_FCN (icode) (x, y);
4926 }
4927 \f
4928 /* can_fix_p and can_float_p say whether the target machine
4929    can directly convert a given fixed point type to
4930    a given floating point type, or vice versa.
4931    The returned value is the CODE_FOR_... value to use,
4932    or CODE_FOR_nothing if these modes cannot be directly converted.
4933
4934    *TRUNCP_PTR is set to 1 if it is necessary to output
4935    an explicit FTRUNC insn before the fix insn; otherwise 0.  */
4936
4937 static enum insn_code
4938 can_fix_p (machine_mode fixmode, machine_mode fltmode,
4939            int unsignedp, int *truncp_ptr)
4940 {
4941   convert_optab tab;
4942   enum insn_code icode;
4943
4944   tab = unsignedp ? ufixtrunc_optab : sfixtrunc_optab;
4945   icode = convert_optab_handler (tab, fixmode, fltmode);
4946   if (icode != CODE_FOR_nothing)
4947     {
4948       *truncp_ptr = 0;
4949       return icode;
4950     }
4951
4952   /* FIXME: This requires a port to define both FIX and FTRUNC pattern
4953      for this to work. We need to rework the fix* and ftrunc* patterns
4954      and documentation.  */
4955   tab = unsignedp ? ufix_optab : sfix_optab;
4956   icode = convert_optab_handler (tab, fixmode, fltmode);
4957   if (icode != CODE_FOR_nothing
4958       && optab_handler (ftrunc_optab, fltmode) != CODE_FOR_nothing)
4959     {
4960       *truncp_ptr = 1;
4961       return icode;
4962     }
4963
4964   *truncp_ptr = 0;
4965   return CODE_FOR_nothing;
4966 }
4967
4968 enum insn_code
4969 can_float_p (machine_mode fltmode, machine_mode fixmode,
4970              int unsignedp)
4971 {
4972   convert_optab tab;
4973
4974   tab = unsignedp ? ufloat_optab : sfloat_optab;
4975   return convert_optab_handler (tab, fltmode, fixmode);
4976 }
4977
4978 /* Function supportable_convert_operation
4979
4980    Check whether an operation represented by the code CODE is a
4981    convert operation that is supported by the target platform in
4982    vector form (i.e., when operating on arguments of type VECTYPE_IN
4983    producing a result of type VECTYPE_OUT).
4984
4985    Convert operations we currently support directly are FIX_TRUNC and FLOAT.
4986    This function checks if these operations are supported
4987    by the target platform either directly (via vector tree-codes), or via
4988    target builtins.
4989
4990    Output:
4991    - CODE1 is code of vector operation to be used when
4992    vectorizing the operation, if available.
4993    - DECL is decl of target builtin functions to be used
4994    when vectorizing the operation, if available.  In this case,
4995    CODE1 is CALL_EXPR.  */
4996
4997 bool
4998 supportable_convert_operation (enum tree_code code,
4999                                     tree vectype_out, tree vectype_in,
5000                                     tree *decl, enum tree_code *code1)
5001 {
5002   machine_mode m1,m2;
5003   int truncp;
5004
5005   m1 = TYPE_MODE (vectype_out);
5006   m2 = TYPE_MODE (vectype_in);
5007
5008   /* First check if we can done conversion directly.  */
5009   if ((code == FIX_TRUNC_EXPR
5010        && can_fix_p (m1,m2,TYPE_UNSIGNED (vectype_out), &truncp)
5011           != CODE_FOR_nothing)
5012       || (code == FLOAT_EXPR
5013           && can_float_p (m1,m2,TYPE_UNSIGNED (vectype_in))
5014              != CODE_FOR_nothing))
5015     {
5016       *code1 = code;
5017       return true;
5018     }
5019
5020   /* Now check for builtin.  */
5021   if (targetm.vectorize.builtin_conversion
5022       && targetm.vectorize.builtin_conversion (code, vectype_out, vectype_in))
5023     {
5024       *code1 = CALL_EXPR;
5025       *decl = targetm.vectorize.builtin_conversion (code, vectype_out, vectype_in);
5026       return true;
5027     }
5028   return false;
5029 }
5030
5031 \f
/* Generate code to convert FROM to floating point
   and store in TO.  FROM must be fixed point and not VOIDmode.
   UNSIGNEDP nonzero means regard FROM as unsigned.

   Three strategies are tried in order:
   1. A conversion insn (as reported by can_float_p) in the modes of
      TO and FROM, or in wider modes.
   2. For an unsigned FROM for which only a signed conversion exists:
      convert as signed and correct the result when the sign bit of
      FROM was set.
   3. A library call.  */

void
expand_float (rtx to, rtx from, int unsignedp)
{
  enum insn_code icode;
  rtx target = to;
  machine_mode fmode, imode;
  /* Set when some signed conversion insn was found while looking for
     an unsigned one; it enables the second strategy below.  */
  bool can_do_signed = false;

  /* Crash now, because we won't be able to decide which mode to use.  */
  gcc_assert (GET_MODE (from) != VOIDmode);

  /* Look for an insn to do the conversion.  Do it in the specified
     modes if possible; otherwise convert either input, output or both to
     wider mode.  If the integer mode is wider than the mode of FROM,
     we can do the conversion signed even if the input is unsigned.  */

  for (fmode = GET_MODE (to); fmode != VOIDmode;
       fmode = GET_MODE_WIDER_MODE (fmode))
    for (imode = GET_MODE (from); imode != VOIDmode;
         imode = GET_MODE_WIDER_MODE (imode))
      {
        int doing_unsigned = unsignedp;

        /* Skip a float mode other than that of TO when its significand
           is narrower than the precision of FROM (presumably to avoid
           rounding twice once the result is narrowed to TO).  */
        if (fmode != GET_MODE (to)
            && significand_size (fmode) < GET_MODE_PRECISION (GET_MODE (from)))
          continue;

        icode = can_float_p (fmode, imode, unsignedp);
        if (icode == CODE_FOR_nothing && unsignedp)
          {
            /* No unsigned insn for this mode pair; see whether a signed
               one exists.  It is only used right away when IMODE is
               wider than the mode of FROM.  */
            enum insn_code scode = can_float_p (fmode, imode, 0);
            if (scode != CODE_FOR_nothing)
              can_do_signed = true;
            if (imode != GET_MODE (from))
              icode = scode, doing_unsigned = 0;
          }

        if (icode != CODE_FOR_nothing)
          {
            /* Widen the operand and/or compute into a wider temporary,
               emit the insn, then narrow the result into TO.  */
            if (imode != GET_MODE (from))
              from = convert_to_mode (imode, from, unsignedp);

            if (fmode != GET_MODE (to))
              target = gen_reg_rtx (fmode);

            emit_unop_insn (icode, target, from,
                            doing_unsigned ? UNSIGNED_FLOAT : FLOAT);

            if (target != to)
              convert_move (to, target, 0);
            return;
          }
      }

  /* Unsigned integer, and no way to convert directly.  Convert as signed,
     then adjust the result when FROM, viewed as signed, was negative.  */
  if (unsignedp && can_do_signed)
    {
      /* LABEL is the join point reached once TARGET holds the final
         value.  */
      rtx_code_label *label = gen_label_rtx ();
      rtx temp;
      REAL_VALUE_TYPE offset;

      /* Look for a usable floating mode FMODE wider than the source and at
         least as wide as the target.  Using FMODE will avoid rounding woes
         with unsigned values greater than the signed maximum value.  */

      for (fmode = GET_MODE (to);  fmode != VOIDmode;
           fmode = GET_MODE_WIDER_MODE (fmode))
        if (GET_MODE_PRECISION (GET_MODE (from)) < GET_MODE_BITSIZE (fmode)
            && can_float_p (fmode, GET_MODE (from), 0) != CODE_FOR_nothing)
          break;

      if (fmode == VOIDmode)
        {
          /* There is no such mode.  Pretend the target is wide enough.  */
          fmode = GET_MODE (to);

          /* Avoid double-rounding when TO is narrower than FROM.  */
          if ((significand_size (fmode) + 1)
              < GET_MODE_PRECISION (GET_MODE (from)))
            {
              rtx temp1;
              rtx_code_label *neglabel = gen_label_rtx ();

              /* Don't use TARGET if it isn't a register, is a hard register,
                 or is the wrong mode.  */
              if (!REG_P (target)
                  || REGNO (target) < FIRST_PSEUDO_REGISTER
                  || GET_MODE (target) != fmode)
                target = gen_reg_rtx (fmode);

              imode = GET_MODE (from);
              do_pending_stack_adjust ();

              /* Test whether the sign bit is set.  */
              emit_cmp_and_jump_insns (from, const0_rtx, LT, NULL_RTX, imode,
                                       0, neglabel);

              /* The sign bit is not set.  Convert as signed.  */
              expand_float (target, from, 0);
              emit_jump_insn (gen_jump (label));
              emit_barrier ();

              /* The sign bit is set.
                 Convert to a usable (positive signed) value by shifting right
                 one bit, while remembering if a nonzero bit was shifted
                 out; i.e., compute  (from & 1) | (from >> 1).  */

              emit_label (neglabel);
              temp = expand_binop (imode, and_optab, from, const1_rtx,
                                   NULL_RTX, 1, OPTAB_LIB_WIDEN);
              temp1 = expand_shift (RSHIFT_EXPR, imode, from, 1, NULL_RTX, 1);
              temp = expand_binop (imode, ior_optab, temp, temp1, temp, 1,
                                   OPTAB_LIB_WIDEN);
              expand_float (target, temp, 0);

              /* Multiply by 2 to undo the shift above; this is done by
                 adding TARGET to itself.  */
              temp = expand_binop (fmode, add_optab, target, target,
                                   target, 0, OPTAB_LIB_WIDEN);
              if (temp != target)
                emit_move_insn (target, temp);

              do_pending_stack_adjust ();
              emit_label (label);
              goto done;
            }
        }

      /* If we are about to do some arithmetic to correct for an
         unsigned operand, do it in a pseudo-register.  */

      if (GET_MODE (to) != fmode
          || !REG_P (to) || REGNO (to) < FIRST_PSEUDO_REGISTER)
        target = gen_reg_rtx (fmode);

      /* Convert as signed integer to floating.  */
      expand_float (target, from, 0);

      /* If FROM is negative (and therefore TO is negative),
         correct its value by 2**bitwidth.  The branch below skips the
         correction when FROM >= 0.  */

      do_pending_stack_adjust ();
      emit_cmp_and_jump_insns (from, const0_rtx, GE, NULL_RTX, GET_MODE (from),
                               0, label);


      /* OFFSET is 2**N in FMODE, where N is the precision of FROM's
         mode; add it to TARGET.  */
      real_2expN (&offset, GET_MODE_PRECISION (GET_MODE (from)), fmode);
      temp = expand_binop (fmode, add_optab, target,
                           CONST_DOUBLE_FROM_REAL_VALUE (offset, fmode),
                           target, 0, OPTAB_LIB_WIDEN);
      if (temp != target)
        emit_move_insn (target, temp);

      do_pending_stack_adjust ();
      emit_label (label);
      goto done;
    }

  /* No hardware instruction available; call a library routine.  */
    {
      rtx libfunc;
      rtx_insn *insns;
      rtx value;
      convert_optab tab = unsignedp ? ufloat_optab : sfloat_optab;

      /* Operands narrower than SImode are widened to SImode before the
         libfunc lookup.  */
      if (GET_MODE_PRECISION (GET_MODE (from)) < GET_MODE_PRECISION (SImode))
        from = convert_to_mode (SImode, from, unsignedp);

      libfunc = convert_optab_libfunc (tab, GET_MODE (to), GET_MODE (from));
      gcc_assert (libfunc);

      /* Collect the call in its own sequence so that it can be emitted
         as a libcall block carrying an equivalent FLOAT or
         UNSIGNED_FLOAT expression.  */
      start_sequence ();

      value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
                                       GET_MODE (to), 1, from,
                                       GET_MODE (from));
      insns = get_insns ();
      end_sequence ();

      emit_libcall_block (insns, target, value,
                          gen_rtx_fmt_e (unsignedp ? UNSIGNED_FLOAT : FLOAT,
                                         GET_MODE (to), from));
    }

 done:

  /* Copy result to requested destination
     if we have been computing in a temp location.  */

  if (target != to)
    {
      if (GET_MODE (target) == GET_MODE (to))
        emit_move_insn (to, target);
      else
        convert_move (to, target, 0);
    }
}
5235 \f
5236 /* Generate code to convert FROM to fixed point and store in TO.  FROM
5237    must be floating point.  */
5238
5239 void
5240 expand_fix (rtx to, rtx from, int unsignedp)
5241 {
5242   enum insn_code icode;
5243   rtx target = to;
5244   machine_mode fmode, imode;
5245   int must_trunc = 0;
5246
5247   /* We first try to find a pair of modes, one real and one integer, at
5248      least as wide as FROM and TO, respectively, in which we can open-code
5249      this conversion.  If the integer mode is wider than the mode of TO,
5250      we can do the conversion either signed or unsigned.  */
5251
5252   for (fmode = GET_MODE (from); fmode != VOIDmode;
5253        fmode = GET_MODE_WIDER_MODE (fmode))
5254     for (imode = GET_MODE (to); imode != VOIDmode;
5255          imode = GET_MODE_WIDER_MODE (imode))
5256       {
5257         int doing_unsigned = unsignedp;
5258
5259         icode = can_fix_p (imode, fmode, unsignedp, &must_trunc);
5260         if (icode == CODE_FOR_nothing && imode != GET_MODE (to) && unsignedp)
5261           icode = can_fix_p (imode, fmode, 0, &must_trunc), doing_unsigned = 0;
5262
5263         if (icode != CODE_FOR_nothing)
5264           {
5265             rtx_insn *last = get_last_insn ();
5266             if (fmode != GET_MODE (from))
5267               from = convert_to_mode (fmode, from, 0);
5268
5269             if (must_trunc)
5270               {
5271                 rtx temp = gen_reg_rtx (GET_MODE (from));
5272                 from = expand_unop (GET_MODE (from), ftrunc_optab, from,
5273                                     temp, 0);
5274               }
5275
5276             if (imode != GET_MODE (to))
5277               target = gen_reg_rtx (imode);
5278
5279             if (maybe_emit_unop_insn (icode, target, from,
5280                                       doing_unsigned ? UNSIGNED_FIX : FIX))
5281               {
5282                 if (target != to)
5283                   convert_move (to, target, unsignedp);
5284                 return;
5285               }
5286             delete_insns_since (last);
5287           }
5288       }
5289
5290   /* For an unsigned conversion, there is one more way to do it.
5291      If we have a signed conversion, we generate code that compares
5292      the real value to the largest representable positive number.  If if
5293      is smaller, the conversion is done normally.  Otherwise, subtract
5294      one plus the highest signed number, convert, and add it back.
5295
5296      We only need to check all real modes, since we know we didn't find
5297      anything with a wider integer mode.
5298
5299      This code used to extend FP value into mode wider than the destination.
5300      This is needed for decimal float modes which cannot accurately
5301      represent one plus the highest signed number of the same size, but
5302      not for binary modes.  Consider, for instance conversion from SFmode
5303      into DImode.
5304
5305      The hot path through the code is dealing with inputs smaller than 2^63
5306      and doing just the conversion, so there is no bits to lose.
5307
5308      In the other path we know the value is positive in the range 2^63..2^64-1
5309      inclusive.  (as for other input overflow happens and result is undefined)
5310      So we know that the most important bit set in mantissa corresponds to
5311      2^63.  The subtraction of 2^63 should not generate any rounding as it
5312      simply clears out that bit.  The rest is trivial.  */
5313
5314   if (unsignedp && GET_MODE_PRECISION (GET_MODE (to)) <= HOST_BITS_PER_WIDE_INT)
5315     for (fmode = GET_MODE (from); fmode != VOIDmode;
5316          fmode = GET_MODE_WIDER_MODE (fmode))
5317       if (CODE_FOR_nothing != can_fix_p (GET_MODE (to), fmode, 0, &must_trunc)
5318           && (!DECIMAL_FLOAT_MODE_P (fmode)
5319               || GET_MODE_BITSIZE (fmode) > GET_MODE_PRECISION (GET_MODE (to))))
5320         {
5321           int bitsize;
5322           REAL_VALUE_TYPE offset;
5323           rtx limit;
5324           rtx_code_label *lab1, *lab2;
5325           rtx_insn *insn;
5326
5327           bitsize = GET_MODE_PRECISION (GET_MODE (to));
5328           real_2expN (&offset, bitsize - 1, fmode);
5329           limit = CONST_DOUBLE_FROM_REAL_VALUE (offset, fmode);
5330           lab1 = gen_label_rtx ();
5331           lab2 = gen_label_rtx ();
5332
5333           if (fmode != GET_MODE (from))
5334             from = convert_to_mode (fmode, from, 0);
5335
5336           /* See if we need to do the subtraction.  */
5337           do_pending_stack_adjust ();
5338           emit_cmp_and_jump_insns (from, limit, GE, NULL_RTX, GET_MODE (from),
5339                                    0, lab1);
5340
5341           /* If not, do the signed "fix" and branch around fixup code.  */
5342           expand_fix (to, from, 0);
5343           emit_jump_insn (gen_jump (lab2));
5344           emit_barrier ();
5345
5346           /* Otherwise, subtract 2**(N-1), convert to signed number,
5347              then add 2**(N-1).  Do the addition using XOR since this
5348              will often generate better code.  */
5349           emit_label (lab1);
5350           target = expand_binop (GET_MODE (from), sub_optab, from, limit,
5351                                  NULL_RTX, 0, OPTAB_LIB_WIDEN);
5352           expand_fix (to, target, 0);
5353           target = expand_binop (GET_MODE (to), xor_optab, to,
5354                                  gen_int_mode
5355                                  ((HOST_WIDE_INT) 1 << (bitsize - 1),
5356                                   GET_MODE (to)),
5357                                  to, 1, OPTAB_LIB_WIDEN);
5358
5359           if (target != to)
5360             emit_move_insn (to, target);
5361
5362           emit_label (lab2);
5363
5364           if (optab_handler (mov_optab, GET_MODE (to)) != CODE_FOR_nothing)
5365             {
5366               /* Make a place for a REG_NOTE and add it.  */
5367               insn = emit_move_insn (to, to);
5368               set_dst_reg_note (insn, REG_EQUAL,
5369                                 gen_rtx_fmt_e (UNSIGNED_FIX, GET_MODE (to),
5370                                                copy_rtx (from)),
5371                                 to);
5372             }
5373
5374           return;
5375         }
5376
5377   /* We can't do it with an insn, so use a library call.  But first ensure
5378      that the mode of TO is at least as wide as SImode, since those are the
5379      only library calls we know about.  */
5380
5381   if (GET_MODE_PRECISION (GET_MODE (to)) < GET_MODE_PRECISION (SImode))
5382     {
5383       target = gen_reg_rtx (SImode);
5384
5385       expand_fix (target, from, unsignedp);
5386     }
5387   else
5388     {
5389       rtx_insn *insns;
5390       rtx value;
5391       rtx libfunc;
5392
5393       convert_optab tab = unsignedp ? ufix_optab : sfix_optab;
5394       libfunc = convert_optab_libfunc (tab, GET_MODE (to), GET_MODE (from));
5395       gcc_assert (libfunc);
5396
5397       start_sequence ();
5398
5399       value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
5400                                        GET_MODE (to), 1, from,
5401                                        GET_MODE (from));
5402       insns = get_insns ();
5403       end_sequence ();
5404
5405       emit_libcall_block (insns, target, value,
5406                           gen_rtx_fmt_e (unsignedp ? UNSIGNED_FIX : FIX,
5407                                          GET_MODE (to), from));
5408     }
5409
5410   if (target != to)
5411     {
5412       if (GET_MODE (to) == GET_MODE (target))
5413         emit_move_insn (to, target);
5414       else
5415         convert_move (to, target, 0);
5416     }
5417 }
5418
5419 /* Generate code to convert FROM or TO a fixed-point.
5420    If UINTP is true, either TO or FROM is an unsigned integer.
5421    If SATP is true, we need to saturate the result.  */
5422
5423 void
5424 expand_fixed_convert (rtx to, rtx from, int uintp, int satp)
5425 {
5426   machine_mode to_mode = GET_MODE (to);
5427   machine_mode from_mode = GET_MODE (from);
5428   convert_optab tab;
5429   enum rtx_code this_code;
5430   enum insn_code code;
5431   rtx_insn *insns;
5432   rtx value;
5433   rtx libfunc;
5434
5435   if (to_mode == from_mode)
5436     {
5437       emit_move_insn (to, from);
5438       return;
5439     }
5440
5441   if (uintp)
5442     {
5443       tab = satp ? satfractuns_optab : fractuns_optab;
5444       this_code = satp ? UNSIGNED_SAT_FRACT : UNSIGNED_FRACT_CONVERT;
5445     }
5446   else
5447     {
5448       tab = satp ? satfract_optab : fract_optab;
5449       this_code = satp ? SAT_FRACT : FRACT_CONVERT;
5450     }
5451   code = convert_optab_handler (tab, to_mode, from_mode);
5452   if (code != CODE_FOR_nothing)
5453     {
5454       emit_unop_insn (code, to, from, this_code);
5455       return;
5456     }
5457
5458   libfunc = convert_optab_libfunc (tab, to_mode, from_mode);
5459   gcc_assert (libfunc);
5460
5461   start_sequence ();
5462   value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST, to_mode,
5463                                    1, from, from_mode);
5464   insns = get_insns ();
5465   end_sequence ();
5466
5467   emit_libcall_block (insns, to, value,
5468                       gen_rtx_fmt_e (optab_to_code (tab), to_mode, from));
5469 }
5470
5471 /* Generate code to convert FROM to fixed point and store in TO.  FROM
5472    must be floating point, TO must be signed.  Use the conversion optab
5473    TAB to do the conversion.  */
5474
5475 bool
5476 expand_sfix_optab (rtx to, rtx from, convert_optab tab)
5477 {
5478   enum insn_code icode;
5479   rtx target = to;
5480   machine_mode fmode, imode;
5481
5482   /* We first try to find a pair of modes, one real and one integer, at
5483      least as wide as FROM and TO, respectively, in which we can open-code
5484      this conversion.  If the integer mode is wider than the mode of TO,
5485      we can do the conversion either signed or unsigned.  */
5486
5487   for (fmode = GET_MODE (from); fmode != VOIDmode;
5488        fmode = GET_MODE_WIDER_MODE (fmode))
5489     for (imode = GET_MODE (to); imode != VOIDmode;
5490          imode = GET_MODE_WIDER_MODE (imode))
5491       {
5492         icode = convert_optab_handler (tab, imode, fmode);
5493         if (icode != CODE_FOR_nothing)
5494           {
5495             rtx_insn *last = get_last_insn ();
5496             if (fmode != GET_MODE (from))
5497               from = convert_to_mode (fmode, from, 0);
5498
5499             if (imode != GET_MODE (to))
5500               target = gen_reg_rtx (imode);
5501
5502             if (!maybe_emit_unop_insn (icode, target, from, UNKNOWN))
5503               {
5504                 delete_insns_since (last);
5505                 continue;
5506               }
5507             if (target != to)
5508               convert_move (to, target, 0);
5509             return true;
5510           }
5511       }
5512
5513   return false;
5514 }
5515 \f
5516 /* Report whether we have an instruction to perform the operation
5517    specified by CODE on operands of mode MODE.  */
5518 int
5519 have_insn_for (enum rtx_code code, machine_mode mode)
5520 {
5521   return (code_to_optab (code)
5522           && (optab_handler (code_to_optab (code), mode)
5523               != CODE_FOR_nothing));
5524 }
5525
5526 /* Initialize the libfunc fields of an entire group of entries in some
5527    optab.  Each entry is set equal to a string consisting of a leading
5528    pair of underscores followed by a generic operation name followed by
5529    a mode name (downshifted to lowercase) followed by a single character
5530    representing the number of operands for the given operation (which is
5531    usually one of the characters '2', '3', or '4').
5532
5533    OPTABLE is the table in which libfunc fields are to be initialized.
5534    OPNAME is the generic (string) name of the operation.
5535    SUFFIX is the character which specifies the number of operands for
5536      the given generic operation.
5537    MODE is the mode to generate for.
5538 */
5539
5540 static void
5541 gen_libfunc (optab optable, const char *opname, int suffix,
5542              machine_mode mode)
5543 {
5544   unsigned opname_len = strlen (opname);
5545   const char *mname = GET_MODE_NAME (mode);
5546   unsigned mname_len = strlen (mname);
5547   int prefix_len = targetm.libfunc_gnu_prefix ? 6 : 2;
5548   int len = prefix_len + opname_len + mname_len + 1 + 1;
5549   char *libfunc_name = XALLOCAVEC (char, len);
5550   char *p;
5551   const char *q;
5552
5553   p = libfunc_name;
5554   *p++ = '_';
5555   *p++ = '_';
5556   if (targetm.libfunc_gnu_prefix)
5557     {
5558       *p++ = 'g';
5559       *p++ = 'n';
5560       *p++ = 'u';
5561       *p++ = '_';
5562     }
5563   for (q = opname; *q; )
5564     *p++ = *q++;
5565   for (q = mname; *q; q++)
5566     *p++ = TOLOWER (*q);
5567   *p++ = suffix;
5568   *p = '\0';
5569
5570   set_optab_libfunc (optable, mode,
5571                      ggc_alloc_string (libfunc_name, p - libfunc_name));
5572 }
5573
5574 /* Like gen_libfunc, but verify that integer operation is involved.  */
5575
5576 void
5577 gen_int_libfunc (optab optable, const char *opname, char suffix,
5578                  machine_mode mode)
5579 {
5580   int maxsize = 2 * BITS_PER_WORD;
5581   int minsize = BITS_PER_WORD;
5582
5583   if (GET_MODE_CLASS (mode) != MODE_INT)
5584     return;
5585   if (maxsize < LONG_LONG_TYPE_SIZE)
5586     maxsize = LONG_LONG_TYPE_SIZE;
5587   if (minsize > INT_TYPE_SIZE
5588       && (trapv_binoptab_p (optable)
5589           || trapv_unoptab_p (optable)))
5590     minsize = INT_TYPE_SIZE;
5591   if (GET_MODE_BITSIZE (mode) < minsize
5592       || GET_MODE_BITSIZE (mode) > maxsize)
5593     return;
5594   gen_libfunc (optable, opname, suffix, mode);
5595 }
5596
5597 /* Like gen_libfunc, but verify that FP and set decimal prefix if needed.  */
5598
5599 void
5600 gen_fp_libfunc (optab optable, const char *opname, char suffix,
5601                 machine_mode mode)
5602 {
5603   char *dec_opname;
5604
5605   if (GET_MODE_CLASS (mode) == MODE_FLOAT)
5606     gen_libfunc (optable, opname, suffix, mode);
5607   if (DECIMAL_FLOAT_MODE_P (mode))
5608     {
5609       dec_opname = XALLOCAVEC (char, sizeof (DECIMAL_PREFIX) + strlen (opname));
5610       /* For BID support, change the name to have either a bid_ or dpd_ prefix
5611          depending on the low level floating format used.  */
5612       memcpy (dec_opname, DECIMAL_PREFIX, sizeof (DECIMAL_PREFIX) - 1);
5613       strcpy (dec_opname + sizeof (DECIMAL_PREFIX) - 1, opname);
5614       gen_libfunc (optable, dec_opname, suffix, mode);
5615     }
5616 }
5617
5618 /* Like gen_libfunc, but verify that fixed-point operation is involved.  */
5619
5620 void
5621 gen_fixed_libfunc (optab optable, const char *opname, char suffix,
5622                    machine_mode mode)
5623 {
5624   if (!ALL_FIXED_POINT_MODE_P (mode))
5625     return;
5626   gen_libfunc (optable, opname, suffix, mode);
5627 }
5628
5629 /* Like gen_libfunc, but verify that signed fixed-point operation is
5630    involved.  */
5631
5632 void
5633 gen_signed_fixed_libfunc (optab optable, const char *opname, char suffix,
5634                           machine_mode mode)
5635 {
5636   if (!SIGNED_FIXED_POINT_MODE_P (mode))
5637     return;
5638   gen_libfunc (optable, opname, suffix, mode);
5639 }
5640
5641 /* Like gen_libfunc, but verify that unsigned fixed-point operation is
5642    involved.  */
5643
5644 void
5645 gen_unsigned_fixed_libfunc (optab optable, const char *opname, char suffix,
5646                             machine_mode mode)
5647 {
5648   if (!UNSIGNED_FIXED_POINT_MODE_P (mode))
5649     return;
5650   gen_libfunc (optable, opname, suffix, mode);
5651 }
5652
5653 /* Like gen_libfunc, but verify that FP or INT operation is involved.  */
5654
5655 void
5656 gen_int_fp_libfunc (optab optable, const char *name, char suffix,
5657                     machine_mode mode)
5658 {
5659   if (DECIMAL_FLOAT_MODE_P (mode) || GET_MODE_CLASS (mode) == MODE_FLOAT)
5660     gen_fp_libfunc (optable, name, suffix, mode);
5661   if (INTEGRAL_MODE_P (mode))
5662     gen_int_libfunc (optable, name, suffix, mode);
5663 }
5664
5665 /* Like gen_libfunc, but verify that FP or INT operation is involved
5666    and add 'v' suffix for integer operation.  */
5667
5668 void
5669 gen_intv_fp_libfunc (optab optable, const char *name, char suffix,
5670                      machine_mode mode)
5671 {
5672   if (DECIMAL_FLOAT_MODE_P (mode) || GET_MODE_CLASS (mode) == MODE_FLOAT)
5673     gen_fp_libfunc (optable, name, suffix, mode);
5674   if (GET_MODE_CLASS (mode) == MODE_INT)
5675     {
5676       int len = strlen (name);
5677       char *v_name = XALLOCAVEC (char, len + 2);
5678       strcpy (v_name, name);
5679       v_name[len] = 'v';
5680       v_name[len + 1] = 0;
5681       gen_int_libfunc (optable, v_name, suffix, mode);
5682     }
5683 }
5684
5685 /* Like gen_libfunc, but verify that FP or INT or FIXED operation is
5686    involved.  */
5687
5688 void
5689 gen_int_fp_fixed_libfunc (optab optable, const char *name, char suffix,
5690                           machine_mode mode)
5691 {
5692   if (DECIMAL_FLOAT_MODE_P (mode) || GET_MODE_CLASS (mode) == MODE_FLOAT)
5693     gen_fp_libfunc (optable, name, suffix, mode);
5694   if (INTEGRAL_MODE_P (mode))
5695     gen_int_libfunc (optable, name, suffix, mode);
5696   if (ALL_FIXED_POINT_MODE_P (mode))
5697     gen_fixed_libfunc (optable, name, suffix, mode);
5698 }
5699
5700 /* Like gen_libfunc, but verify that FP or INT or signed FIXED operation is
5701    involved.  */
5702
5703 void
5704 gen_int_fp_signed_fixed_libfunc (optab optable, const char *name, char suffix,
5705                                  machine_mode mode)
5706 {
5707   if (DECIMAL_FLOAT_MODE_P (mode) || GET_MODE_CLASS (mode) == MODE_FLOAT)
5708     gen_fp_libfunc (optable, name, suffix, mode);
5709   if (INTEGRAL_MODE_P (mode))
5710     gen_int_libfunc (optable, name, suffix, mode);
5711   if (SIGNED_FIXED_POINT_MODE_P (mode))
5712     gen_signed_fixed_libfunc (optable, name, suffix, mode);
5713 }
5714
5715 /* Like gen_libfunc, but verify that INT or FIXED operation is
5716    involved.  */
5717
5718 void
5719 gen_int_fixed_libfunc (optab optable, const char *name, char suffix,
5720                        machine_mode mode)
5721 {
5722   if (INTEGRAL_MODE_P (mode))
5723     gen_int_libfunc (optable, name, suffix, mode);
5724   if (ALL_FIXED_POINT_MODE_P (mode))
5725     gen_fixed_libfunc (optable, name, suffix, mode);
5726 }
5727
5728 /* Like gen_libfunc, but verify that INT or signed FIXED operation is
5729    involved.  */
5730
5731 void
5732 gen_int_signed_fixed_libfunc (optab optable, const char *name, char suffix,
5733                               machine_mode mode)
5734 {
5735   if (INTEGRAL_MODE_P (mode))
5736     gen_int_libfunc (optable, name, suffix, mode);
5737   if (SIGNED_FIXED_POINT_MODE_P (mode))
5738     gen_signed_fixed_libfunc (optable, name, suffix, mode);
5739 }
5740
5741 /* Like gen_libfunc, but verify that INT or unsigned FIXED operation is
5742    involved.  */
5743
5744 void
5745 gen_int_unsigned_fixed_libfunc (optab optable, const char *name, char suffix,
5746                                 machine_mode mode)
5747 {
5748   if (INTEGRAL_MODE_P (mode))
5749     gen_int_libfunc (optable, name, suffix, mode);
5750   if (UNSIGNED_FIXED_POINT_MODE_P (mode))
5751     gen_unsigned_fixed_libfunc (optable, name, suffix, mode);
5752 }
5753
5754 /* Initialize the libfunc fields of an entire group of entries of an
5755    inter-mode-class conversion optab.  The string formation rules are
5756    similar to the ones for init_libfuncs, above, but instead of having
5757    a mode name and an operand count these functions have two mode names
5758    and no operand count.  */
5759
5760 void
5761 gen_interclass_conv_libfunc (convert_optab tab,
5762                              const char *opname,
5763                              machine_mode tmode,
5764                              machine_mode fmode)
5765 {
5766   size_t opname_len = strlen (opname);
5767   size_t mname_len = 0;
5768
5769   const char *fname, *tname;
5770   const char *q;
5771   int prefix_len = targetm.libfunc_gnu_prefix ? 6 : 2;
5772   char *libfunc_name, *suffix;
5773   char *nondec_name, *dec_name, *nondec_suffix, *dec_suffix;
5774   char *p;
5775
5776   /* If this is a decimal conversion, add the current BID vs. DPD prefix that
5777      depends on which underlying decimal floating point format is used.  */
5778   const size_t dec_len = sizeof (DECIMAL_PREFIX) - 1;
5779
5780   mname_len = strlen (GET_MODE_NAME (tmode)) + strlen (GET_MODE_NAME (fmode));
5781
5782   nondec_name = XALLOCAVEC (char, prefix_len + opname_len + mname_len + 1 + 1);
5783   nondec_name[0] = '_';
5784   nondec_name[1] = '_';
5785   if (targetm.libfunc_gnu_prefix)
5786     {
5787       nondec_name[2] = 'g';
5788       nondec_name[3] = 'n';
5789       nondec_name[4] = 'u';
5790       nondec_name[5] = '_';
5791     }
5792
5793   memcpy (&nondec_name[prefix_len], opname, opname_len);
5794   nondec_suffix = nondec_name + opname_len + prefix_len;
5795
5796   dec_name = XALLOCAVEC (char, 2 + dec_len + opname_len + mname_len + 1 + 1);
5797   dec_name[0] = '_';
5798   dec_name[1] = '_';
5799   memcpy (&dec_name[2], DECIMAL_PREFIX, dec_len);
5800   memcpy (&dec_name[2+dec_len], opname, opname_len);
5801   dec_suffix = dec_name + dec_len + opname_len + 2;
5802
5803   fname = GET_MODE_NAME (fmode);
5804   tname = GET_MODE_NAME (tmode);
5805
5806   if (DECIMAL_FLOAT_MODE_P (fmode) || DECIMAL_FLOAT_MODE_P (tmode))
5807     {
5808       libfunc_name = dec_name;
5809       suffix = dec_suffix;
5810     }
5811   else
5812     {
5813       libfunc_name = nondec_name;
5814       suffix = nondec_suffix;
5815     }
5816
5817   p = suffix;
5818   for (q = fname; *q; p++, q++)
5819     *p = TOLOWER (*q);
5820   for (q = tname; *q; p++, q++)
5821     *p = TOLOWER (*q);
5822
5823   *p = '\0';
5824
5825   set_conv_libfunc (tab, tmode, fmode,
5826                     ggc_alloc_string (libfunc_name, p - libfunc_name));
5827 }
5828
5829 /* Same as gen_interclass_conv_libfunc but verify that we are producing
5830    int->fp conversion.  */
5831
5832 void
5833 gen_int_to_fp_conv_libfunc (convert_optab tab,
5834                             const char *opname,
5835                             machine_mode tmode,
5836                             machine_mode fmode)
5837 {
5838   if (GET_MODE_CLASS (fmode) != MODE_INT)
5839     return;
5840   if (GET_MODE_CLASS (tmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (tmode))
5841     return;
5842   gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
5843 }
5844
5845 /* ufloat_optab is special by using floatun for FP and floatuns decimal fp
5846    naming scheme.  */
5847
5848 void
5849 gen_ufloat_conv_libfunc (convert_optab tab,
5850                          const char *opname ATTRIBUTE_UNUSED,
5851                          machine_mode tmode,
5852                          machine_mode fmode)
5853 {
5854   if (DECIMAL_FLOAT_MODE_P (tmode))
5855     gen_int_to_fp_conv_libfunc (tab, "floatuns", tmode, fmode);
5856   else
5857     gen_int_to_fp_conv_libfunc (tab, "floatun", tmode, fmode);
5858 }
5859
5860 /* Same as gen_interclass_conv_libfunc but verify that we are producing
5861    fp->int conversion.  */
5862
5863 void
5864 gen_int_to_fp_nondecimal_conv_libfunc (convert_optab tab,
5865                                        const char *opname,
5866                                        machine_mode tmode,
5867                                        machine_mode fmode)
5868 {
5869   if (GET_MODE_CLASS (fmode) != MODE_INT)
5870     return;
5871   if (GET_MODE_CLASS (tmode) != MODE_FLOAT)
5872     return;
5873   gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
5874 }
5875
5876 /* Same as gen_interclass_conv_libfunc but verify that we are producing
5877    fp->int conversion with no decimal floating point involved.  */
5878
5879 void
5880 gen_fp_to_int_conv_libfunc (convert_optab tab,
5881                             const char *opname,
5882                             machine_mode tmode,
5883                             machine_mode fmode)
5884 {
5885   if (GET_MODE_CLASS (fmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (fmode))
5886     return;
5887   if (GET_MODE_CLASS (tmode) != MODE_INT)
5888     return;
5889   gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
5890 }
5891
5892 /* Initialize the libfunc fields of an of an intra-mode-class conversion optab.
5893    The string formation rules are
5894    similar to the ones for init_libfunc, above.  */
5895
5896 void
5897 gen_intraclass_conv_libfunc (convert_optab tab, const char *opname,
5898                              machine_mode tmode, machine_mode fmode)
5899 {
5900   size_t opname_len = strlen (opname);
5901   size_t mname_len = 0;
5902
5903   const char *fname, *tname;
5904   const char *q;
5905   int prefix_len = targetm.libfunc_gnu_prefix ? 6 : 2;
5906   char *nondec_name, *dec_name, *nondec_suffix, *dec_suffix;
5907   char *libfunc_name, *suffix;
5908   char *p;
5909
5910   /* If this is a decimal conversion, add the current BID vs. DPD prefix that
5911      depends on which underlying decimal floating point format is used.  */
5912   const size_t dec_len = sizeof (DECIMAL_PREFIX) - 1;
5913
5914   mname_len = strlen (GET_MODE_NAME (tmode)) + strlen (GET_MODE_NAME (fmode));
5915
5916   nondec_name = XALLOCAVEC (char, 2 + opname_len + mname_len + 1 + 1);
5917   nondec_name[0] = '_';
5918   nondec_name[1] = '_';
5919   if (targetm.libfunc_gnu_prefix)
5920     {
5921       nondec_name[2] = 'g';
5922       nondec_name[3] = 'n';
5923       nondec_name[4] = 'u';
5924       nondec_name[5] = '_';
5925     }
5926   memcpy (&nondec_name[prefix_len], opname, opname_len);
5927   nondec_suffix = nondec_name + opname_len + prefix_len;
5928
5929   dec_name = XALLOCAVEC (char, 2 + dec_len + opname_len + mname_len + 1 + 1);
5930   dec_name[0] = '_';
5931   dec_name[1] = '_';
5932   memcpy (&dec_name[2], DECIMAL_PREFIX, dec_len);
5933   memcpy (&dec_name[2 + dec_len], opname, opname_len);
5934   dec_suffix = dec_name + dec_len + opname_len + 2;
5935
5936   fname = GET_MODE_NAME (fmode);
5937   tname = GET_MODE_NAME (tmode);
5938
5939   if (DECIMAL_FLOAT_MODE_P (fmode) || DECIMAL_FLOAT_MODE_P (tmode))
5940     {
5941       libfunc_name = dec_name;
5942       suffix = dec_suffix;
5943     }
5944   else
5945     {
5946       libfunc_name = nondec_name;
5947       suffix = nondec_suffix;
5948     }
5949
5950   p = suffix;
5951   for (q = fname; *q; p++, q++)
5952     *p = TOLOWER (*q);
5953   for (q = tname; *q; p++, q++)
5954     *p = TOLOWER (*q);
5955
5956   *p++ = '2';
5957   *p = '\0';
5958
5959   set_conv_libfunc (tab, tmode, fmode,
5960                     ggc_alloc_string (libfunc_name, p - libfunc_name));
5961 }
5962
5963 /* Pick proper libcall for trunc_optab.  We need to chose if we do
5964    truncation or extension and interclass or intraclass.  */
5965
5966 void
5967 gen_trunc_conv_libfunc (convert_optab tab,
5968                          const char *opname,
5969                          machine_mode tmode,
5970                          machine_mode fmode)
5971 {
5972   if (GET_MODE_CLASS (tmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (tmode))
5973     return;
5974   if (GET_MODE_CLASS (fmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (fmode))
5975     return;
5976   if (tmode == fmode)
5977     return;
5978
5979   if ((GET_MODE_CLASS (tmode) == MODE_FLOAT && DECIMAL_FLOAT_MODE_P (fmode))
5980       || (GET_MODE_CLASS (fmode) == MODE_FLOAT && DECIMAL_FLOAT_MODE_P (tmode)))
5981      gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
5982
5983   if (GET_MODE_PRECISION (fmode) <= GET_MODE_PRECISION (tmode))
5984     return;
5985
5986   if ((GET_MODE_CLASS (tmode) == MODE_FLOAT
5987        && GET_MODE_CLASS (fmode) == MODE_FLOAT)
5988       || (DECIMAL_FLOAT_MODE_P (fmode) && DECIMAL_FLOAT_MODE_P (tmode)))
5989     gen_intraclass_conv_libfunc (tab, opname, tmode, fmode);
5990 }
5991
5992 /* Pick proper libcall for extend_optab.  We need to chose if we do
5993    truncation or extension and interclass or intraclass.  */
5994
5995 void
5996 gen_extend_conv_libfunc (convert_optab tab,
5997                          const char *opname ATTRIBUTE_UNUSED,
5998                          machine_mode tmode,
5999                          machine_mode fmode)
6000 {
6001   if (GET_MODE_CLASS (tmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (tmode))
6002     return;
6003   if (GET_MODE_CLASS (fmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (fmode))
6004     return;
6005   if (tmode == fmode)
6006     return;
6007
6008   if ((GET_MODE_CLASS (tmode) == MODE_FLOAT && DECIMAL_FLOAT_MODE_P (fmode))
6009       || (GET_MODE_CLASS (fmode) == MODE_FLOAT && DECIMAL_FLOAT_MODE_P (tmode)))
6010      gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
6011
6012   if (GET_MODE_PRECISION (fmode) > GET_MODE_PRECISION (tmode))
6013     return;
6014
6015   if ((GET_MODE_CLASS (tmode) == MODE_FLOAT
6016        && GET_MODE_CLASS (fmode) == MODE_FLOAT)
6017       || (DECIMAL_FLOAT_MODE_P (fmode) && DECIMAL_FLOAT_MODE_P (tmode)))
6018     gen_intraclass_conv_libfunc (tab, opname, tmode, fmode);
6019 }
6020
6021 /* Pick proper libcall for fract_optab.  We need to chose if we do
6022    interclass or intraclass.  */
6023
6024 void
6025 gen_fract_conv_libfunc (convert_optab tab,
6026                         const char *opname,
6027                         machine_mode tmode,
6028                         machine_mode fmode)
6029 {
6030   if (tmode == fmode)
6031     return;
6032   if (!(ALL_FIXED_POINT_MODE_P (tmode) || ALL_FIXED_POINT_MODE_P (fmode)))
6033     return;
6034
6035   if (GET_MODE_CLASS (tmode) == GET_MODE_CLASS (fmode))
6036     gen_intraclass_conv_libfunc (tab, opname, tmode, fmode);
6037   else
6038     gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
6039 }
6040
6041 /* Pick proper libcall for fractuns_optab.  */
6042
6043 void
6044 gen_fractuns_conv_libfunc (convert_optab tab,
6045                            const char *opname,
6046                            machine_mode tmode,
6047                            machine_mode fmode)
6048 {
6049   if (tmode == fmode)
6050     return;
6051   /* One mode must be a fixed-point mode, and the other must be an integer
6052      mode. */
6053   if (!((ALL_FIXED_POINT_MODE_P (tmode) && GET_MODE_CLASS (fmode) == MODE_INT)
6054         || (ALL_FIXED_POINT_MODE_P (fmode)
6055             && GET_MODE_CLASS (tmode) == MODE_INT)))
6056     return;
6057
6058   gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
6059 }
6060
6061 /* Pick proper libcall for satfract_optab.  We need to chose if we do
6062    interclass or intraclass.  */
6063
6064 void
6065 gen_satfract_conv_libfunc (convert_optab tab,
6066                            const char *opname,
6067                            machine_mode tmode,
6068                            machine_mode fmode)
6069 {
6070   if (tmode == fmode)
6071     return;
6072   /* TMODE must be a fixed-point mode.  */
6073   if (!ALL_FIXED_POINT_MODE_P (tmode))
6074     return;
6075
6076   if (GET_MODE_CLASS (tmode) == GET_MODE_CLASS (fmode))
6077     gen_intraclass_conv_libfunc (tab, opname, tmode, fmode);
6078   else
6079     gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
6080 }
6081
6082 /* Pick proper libcall for satfractuns_optab.  */
6083
6084 void
6085 gen_satfractuns_conv_libfunc (convert_optab tab,
6086                               const char *opname,
6087                               machine_mode tmode,
6088                               machine_mode fmode)
6089 {
6090   if (tmode == fmode)
6091     return;
6092   /* TMODE must be a fixed-point mode, and FMODE must be an integer mode. */
6093   if (!(ALL_FIXED_POINT_MODE_P (tmode) && GET_MODE_CLASS (fmode) == MODE_INT))
6094     return;
6095
6096   gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
6097 }
6098
6099 /* Hashtable callbacks for libfunc_decls.  */
6100
6101 struct libfunc_decl_hasher : ggc_hasher<tree>
6102 {
6103   static hashval_t
6104   hash (tree entry)
6105   {
6106     return IDENTIFIER_HASH_VALUE (DECL_NAME (entry));
6107   }
6108
6109   static bool
6110   equal (tree decl, tree name)
6111   {
6112     return DECL_NAME (decl) == name;
6113   }
6114 };
6115
6116 /* A table of previously-created libfuncs, hashed by name.  */
6117 static GTY (()) hash_table<libfunc_decl_hasher> *libfunc_decls;
6118
6119 /* Build a decl for a libfunc named NAME. */
6120
6121 tree
6122 build_libfunc_function (const char *name)
6123 {
6124   tree decl = build_decl (UNKNOWN_LOCATION, FUNCTION_DECL,
6125                           get_identifier (name),
6126                           build_function_type (integer_type_node, NULL_TREE));
6127   /* ??? We don't have any type information except for this is
6128      a function.  Pretend this is "int foo()".  */
6129   DECL_ARTIFICIAL (decl) = 1;
6130   DECL_EXTERNAL (decl) = 1;
6131   TREE_PUBLIC (decl) = 1;
6132   gcc_assert (DECL_ASSEMBLER_NAME (decl));
6133
6134   /* Zap the nonsensical SYMBOL_REF_DECL for this.  What we're left with
6135      are the flags assigned by targetm.encode_section_info.  */
6136   SET_SYMBOL_REF_DECL (XEXP (DECL_RTL (decl), 0), NULL);
6137
6138   return decl;
6139 }
6140
6141 rtx
6142 init_one_libfunc (const char *name)
6143 {
6144   tree id, decl;
6145   hashval_t hash;
6146
6147   if (libfunc_decls == NULL)
6148     libfunc_decls = hash_table<libfunc_decl_hasher>::create_ggc (37);
6149
6150   /* See if we have already created a libfunc decl for this function.  */
6151   id = get_identifier (name);
6152   hash = IDENTIFIER_HASH_VALUE (id);
6153   tree *slot = libfunc_decls->find_slot_with_hash (id, hash, INSERT);
6154   decl = *slot;
6155   if (decl == NULL)
6156     {
6157       /* Create a new decl, so that it can be passed to
6158          targetm.encode_section_info.  */
6159       decl = build_libfunc_function (name);
6160       *slot = decl;
6161     }
6162   return XEXP (DECL_RTL (decl), 0);
6163 }
6164
6165 /* Adjust the assembler name of libfunc NAME to ASMSPEC.  */
6166
6167 rtx
6168 set_user_assembler_libfunc (const char *name, const char *asmspec)
6169 {
6170   tree id, decl;
6171   hashval_t hash;
6172
6173   id = get_identifier (name);
6174   hash = IDENTIFIER_HASH_VALUE (id);
6175   tree *slot = libfunc_decls->find_slot_with_hash (id, hash, NO_INSERT);
6176   gcc_assert (slot);
6177   decl = (tree) *slot;
6178   set_user_assembler_name (decl, asmspec);
6179   return XEXP (DECL_RTL (decl), 0);
6180 }
6181
6182 /* Call this to reset the function entry for one optab (OPTABLE) in mode
6183    MODE to NAME, which should be either 0 or a string constant.  */
6184 void
6185 set_optab_libfunc (optab op, machine_mode mode, const char *name)
6186 {
6187   rtx val;
6188   struct libfunc_entry e;
6189   struct libfunc_entry **slot;
6190
6191   e.op = op;
6192   e.mode1 = mode;
6193   e.mode2 = VOIDmode;
6194
6195   if (name)
6196     val = init_one_libfunc (name);
6197   else
6198     val = 0;
6199   slot = libfunc_hash->find_slot (&e, INSERT);
6200   if (*slot == NULL)
6201     *slot = ggc_alloc<libfunc_entry> ();
6202   (*slot)->op = op;
6203   (*slot)->mode1 = mode;
6204   (*slot)->mode2 = VOIDmode;
6205   (*slot)->libfunc = val;
6206 }
6207
6208 /* Call this to reset the function entry for one conversion optab
6209    (OPTABLE) from mode FMODE to mode TMODE to NAME, which should be
6210    either 0 or a string constant.  */
6211 void
6212 set_conv_libfunc (convert_optab optab, machine_mode tmode,
6213                   machine_mode fmode, const char *name)
6214 {
6215   rtx val;
6216   struct libfunc_entry e;
6217   struct libfunc_entry **slot;
6218
6219   e.op = optab;
6220   e.mode1 = tmode;
6221   e.mode2 = fmode;
6222
6223   if (name)
6224     val = init_one_libfunc (name);
6225   else
6226     val = 0;
6227   slot = libfunc_hash->find_slot (&e, INSERT);
6228   if (*slot == NULL)
6229     *slot = ggc_alloc<libfunc_entry> ();
6230   (*slot)->op = optab;
6231   (*slot)->mode1 = tmode;
6232   (*slot)->mode2 = fmode;
6233   (*slot)->libfunc = val;
6234 }
6235
6236 /* Call this to initialize the contents of the optabs
6237    appropriately for the current target machine.  */
6238
6239 void
6240 init_optabs (void)
6241 {
6242   if (libfunc_hash)
6243     libfunc_hash->empty ();
6244   else
6245     libfunc_hash = hash_table<libfunc_hasher>::create_ggc (10);
6246
6247   /* Fill in the optabs with the insns we support.  */
6248   init_all_optabs (this_fn_optabs);
6249
6250   /* The ffs function operates on `int'.  Fall back on it if we do not
6251      have a libgcc2 function for that width.  */
6252   if (INT_TYPE_SIZE < BITS_PER_WORD)
6253     set_optab_libfunc (ffs_optab, mode_for_size (INT_TYPE_SIZE, MODE_INT, 0),
6254                        "ffs");
6255
6256   /* Explicitly initialize the bswap libfuncs since we need them to be
6257      valid for things other than word_mode.  */
6258   if (targetm.libfunc_gnu_prefix)
6259     {
6260       set_optab_libfunc (bswap_optab, SImode, "__gnu_bswapsi2");
6261       set_optab_libfunc (bswap_optab, DImode, "__gnu_bswapdi2");
6262     }
6263   else
6264     {
6265       set_optab_libfunc (bswap_optab, SImode, "__bswapsi2");
6266       set_optab_libfunc (bswap_optab, DImode, "__bswapdi2");
6267     }
6268
6269   /* Use cabs for double complex abs, since systems generally have cabs.
6270      Don't define any libcall for float complex, so that cabs will be used.  */
6271   if (complex_double_type_node)
6272     set_optab_libfunc (abs_optab, TYPE_MODE (complex_double_type_node),
6273                        "cabs");
6274
6275   abort_libfunc = init_one_libfunc ("abort");
6276   memcpy_libfunc = init_one_libfunc ("memcpy");
6277   memmove_libfunc = init_one_libfunc ("memmove");
6278   memcmp_libfunc = init_one_libfunc ("memcmp");
6279   memset_libfunc = init_one_libfunc ("memset");
6280   setbits_libfunc = init_one_libfunc ("__setbits");
6281
6282 #ifndef DONT_USE_BUILTIN_SETJMP
6283   setjmp_libfunc = init_one_libfunc ("__builtin_setjmp");
6284   longjmp_libfunc = init_one_libfunc ("__builtin_longjmp");
6285 #else
6286   setjmp_libfunc = init_one_libfunc ("setjmp");
6287   longjmp_libfunc = init_one_libfunc ("longjmp");
6288 #endif
6289   unwind_sjlj_register_libfunc = init_one_libfunc ("_Unwind_SjLj_Register");
6290   unwind_sjlj_unregister_libfunc
6291     = init_one_libfunc ("_Unwind_SjLj_Unregister");
6292
6293   /* For function entry/exit instrumentation.  */
6294   profile_function_entry_libfunc
6295     = init_one_libfunc ("__cyg_profile_func_enter");
6296   profile_function_exit_libfunc
6297     = init_one_libfunc ("__cyg_profile_func_exit");
6298
6299   gcov_flush_libfunc = init_one_libfunc ("__gcov_flush");
6300
6301   /* Allow the target to add more libcalls or rename some, etc.  */
6302   targetm.init_libfuncs ();
6303 }
6304
6305 /* Use the current target and options to initialize
6306    TREE_OPTIMIZATION_OPTABS (OPTNODE).  */
6307
6308 void
6309 init_tree_optimization_optabs (tree optnode)
6310 {
6311   /* Quick exit if we have already computed optabs for this target.  */
6312   if (TREE_OPTIMIZATION_BASE_OPTABS (optnode) == this_target_optabs)
6313     return;
6314
6315   /* Forget any previous information and set up for the current target.  */
6316   TREE_OPTIMIZATION_BASE_OPTABS (optnode) = this_target_optabs;
6317   struct target_optabs *tmp_optabs = (struct target_optabs *)
6318     TREE_OPTIMIZATION_OPTABS (optnode);
6319   if (tmp_optabs)
6320     memset (tmp_optabs, 0, sizeof (struct target_optabs));
6321   else
6322     tmp_optabs = ggc_alloc<target_optabs> ();
6323
6324   /* Generate a new set of optabs into tmp_optabs.  */
6325   init_all_optabs (tmp_optabs);
6326
6327   /* If the optabs changed, record it.  */
6328   if (memcmp (tmp_optabs, this_target_optabs, sizeof (struct target_optabs)))
6329     TREE_OPTIMIZATION_OPTABS (optnode) = tmp_optabs;
6330   else
6331     {
6332       TREE_OPTIMIZATION_OPTABS (optnode) = NULL;
6333       ggc_free (tmp_optabs);
6334     }
6335 }
6336
6337 /* A helper function for init_sync_libfuncs.  Using the basename BASE,
6338    install libfuncs into TAB for BASE_N for 1 <= N <= MAX.  */
6339
6340 static void
6341 init_sync_libfuncs_1 (optab tab, const char *base, int max)
6342 {
6343   machine_mode mode;
6344   char buf[64];
6345   size_t len = strlen (base);
6346   int i;
6347
6348   gcc_assert (max <= 8);
6349   gcc_assert (len + 3 < sizeof (buf));
6350
6351   memcpy (buf, base, len);
6352   buf[len] = '_';
6353   buf[len + 1] = '0';
6354   buf[len + 2] = '\0';
6355
6356   mode = QImode;
6357   for (i = 1; i <= max; i *= 2)
6358     {
6359       buf[len + 1] = '0' + i;
6360       set_optab_libfunc (tab, mode, buf);
6361       mode = GET_MODE_2XWIDER_MODE (mode);
6362     }
6363 }
6364
6365 void
6366 init_sync_libfuncs (int max)
6367 {
6368   if (!flag_sync_libcalls)
6369     return;
6370
6371   init_sync_libfuncs_1 (sync_compare_and_swap_optab,
6372                         "__sync_val_compare_and_swap", max);
6373   init_sync_libfuncs_1 (sync_lock_test_and_set_optab,
6374                         "__sync_lock_test_and_set", max);
6375
6376   init_sync_libfuncs_1 (sync_old_add_optab, "__sync_fetch_and_add", max);
6377   init_sync_libfuncs_1 (sync_old_sub_optab, "__sync_fetch_and_sub", max);
6378   init_sync_libfuncs_1 (sync_old_ior_optab, "__sync_fetch_and_or", max);
6379   init_sync_libfuncs_1 (sync_old_and_optab, "__sync_fetch_and_and", max);
6380   init_sync_libfuncs_1 (sync_old_xor_optab, "__sync_fetch_and_xor", max);
6381   init_sync_libfuncs_1 (sync_old_nand_optab, "__sync_fetch_and_nand", max);
6382
6383   init_sync_libfuncs_1 (sync_new_add_optab, "__sync_add_and_fetch", max);
6384   init_sync_libfuncs_1 (sync_new_sub_optab, "__sync_sub_and_fetch", max);
6385   init_sync_libfuncs_1 (sync_new_ior_optab, "__sync_or_and_fetch", max);
6386   init_sync_libfuncs_1 (sync_new_and_optab, "__sync_and_and_fetch", max);
6387   init_sync_libfuncs_1 (sync_new_xor_optab, "__sync_xor_and_fetch", max);
6388   init_sync_libfuncs_1 (sync_new_nand_optab, "__sync_nand_and_fetch", max);
6389 }
6390
6391 /* Print information about the current contents of the optabs on
6392    STDERR.  */
6393
6394 DEBUG_FUNCTION void
6395 debug_optab_libfuncs (void)
6396 {
6397   int i, j, k;
6398
6399   /* Dump the arithmetic optabs.  */
6400   for (i = FIRST_NORM_OPTAB; i <= LAST_NORMLIB_OPTAB; ++i)
6401     for (j = 0; j < NUM_MACHINE_MODES; ++j)
6402       {
6403         rtx l = optab_libfunc ((optab) i, (machine_mode) j);
6404         if (l)
6405           {
6406             gcc_assert (GET_CODE (l) == SYMBOL_REF);
6407             fprintf (stderr, "%s\t%s:\t%s\n",
6408                      GET_RTX_NAME (optab_to_code ((optab) i)),
6409                      GET_MODE_NAME (j),
6410                      XSTR (l, 0));
6411           }
6412       }
6413
6414   /* Dump the conversion optabs.  */
6415   for (i = FIRST_CONV_OPTAB; i <= LAST_CONVLIB_OPTAB; ++i)
6416     for (j = 0; j < NUM_MACHINE_MODES; ++j)
6417       for (k = 0; k < NUM_MACHINE_MODES; ++k)
6418         {
6419           rtx l = convert_optab_libfunc ((optab) i, (machine_mode) j,
6420                                          (machine_mode) k);
6421           if (l)
6422             {
6423               gcc_assert (GET_CODE (l) == SYMBOL_REF);
6424               fprintf (stderr, "%s\t%s\t%s:\t%s\n",
6425                        GET_RTX_NAME (optab_to_code ((optab) i)),
6426                        GET_MODE_NAME (j),
6427                        GET_MODE_NAME (k),
6428                        XSTR (l, 0));
6429             }
6430         }
6431 }
6432
6433 \f
6434 /* Generate insns to trap with code TCODE if OP1 and OP2 satisfy condition
6435    CODE.  Return 0 on failure.  */
6436
6437 rtx
6438 gen_cond_trap (enum rtx_code code, rtx op1, rtx op2, rtx tcode)
6439 {
6440   machine_mode mode = GET_MODE (op1);
6441   enum insn_code icode;
6442   rtx insn;
6443   rtx trap_rtx;
6444
6445   if (mode == VOIDmode)
6446     return 0;
6447
6448   icode = optab_handler (ctrap_optab, mode);
6449   if (icode == CODE_FOR_nothing)
6450     return 0;
6451
6452   /* Some targets only accept a zero trap code.  */
6453   if (!insn_operand_matches (icode, 3, tcode))
6454     return 0;
6455
6456   do_pending_stack_adjust ();
6457   start_sequence ();
6458   prepare_cmp_insn (op1, op2, code, NULL_RTX, false, OPTAB_DIRECT,
6459                     &trap_rtx, &mode);
6460   if (!trap_rtx)
6461     insn = NULL_RTX;
6462   else
6463     insn = GEN_FCN (icode) (trap_rtx, XEXP (trap_rtx, 0), XEXP (trap_rtx, 1),
6464                             tcode);
6465
6466   /* If that failed, then give up.  */
6467   if (insn == 0)
6468     {
6469       end_sequence ();
6470       return 0;
6471     }
6472
6473   emit_insn (insn);
6474   insn = get_insns ();
6475   end_sequence ();
6476   return insn;
6477 }
6478
6479 /* Return rtx code for TCODE. Use UNSIGNEDP to select signed
6480    or unsigned operation code.  */
6481
6482 static enum rtx_code
6483 get_rtx_code (enum tree_code tcode, bool unsignedp)
6484 {
6485   enum rtx_code code;
6486   switch (tcode)
6487     {
6488     case EQ_EXPR:
6489       code = EQ;
6490       break;
6491     case NE_EXPR:
6492       code = NE;
6493       break;
6494     case LT_EXPR:
6495       code = unsignedp ? LTU : LT;
6496       break;
6497     case LE_EXPR:
6498       code = unsignedp ? LEU : LE;
6499       break;
6500     case GT_EXPR:
6501       code = unsignedp ? GTU : GT;
6502       break;
6503     case GE_EXPR:
6504       code = unsignedp ? GEU : GE;
6505       break;
6506
6507     case UNORDERED_EXPR:
6508       code = UNORDERED;
6509       break;
6510     case ORDERED_EXPR:
6511       code = ORDERED;
6512       break;
6513     case UNLT_EXPR:
6514       code = UNLT;
6515       break;
6516     case UNLE_EXPR:
6517       code = UNLE;
6518       break;
6519     case UNGT_EXPR:
6520       code = UNGT;
6521       break;
6522     case UNGE_EXPR:
6523       code = UNGE;
6524       break;
6525     case UNEQ_EXPR:
6526       code = UNEQ;
6527       break;
6528     case LTGT_EXPR:
6529       code = LTGT;
6530       break;
6531
6532     default:
6533       gcc_unreachable ();
6534     }
6535   return code;
6536 }
6537
6538 /* Return comparison rtx for COND. Use UNSIGNEDP to select signed or
6539    unsigned operators. Do not generate compare instruction.  */
6540
6541 static rtx
6542 vector_compare_rtx (enum tree_code tcode, tree t_op0, tree t_op1,
6543                     bool unsignedp, enum insn_code icode)
6544 {
6545   struct expand_operand ops[2];
6546   rtx rtx_op0, rtx_op1;
6547   enum rtx_code rcode = get_rtx_code (tcode, unsignedp);
6548
6549   gcc_assert (TREE_CODE_CLASS (tcode) == tcc_comparison);
6550
6551   /* Expand operands.  */
6552   rtx_op0 = expand_expr (t_op0, NULL_RTX, TYPE_MODE (TREE_TYPE (t_op0)),
6553                          EXPAND_STACK_PARM);
6554   rtx_op1 = expand_expr (t_op1, NULL_RTX, TYPE_MODE (TREE_TYPE (t_op1)),
6555                          EXPAND_STACK_PARM);
6556
6557   create_input_operand (&ops[0], rtx_op0, GET_MODE (rtx_op0));
6558   create_input_operand (&ops[1], rtx_op1, GET_MODE (rtx_op1));
6559   if (!maybe_legitimize_operands (icode, 4, 2, ops))
6560     gcc_unreachable ();
6561   return gen_rtx_fmt_ee (rcode, VOIDmode, ops[0].value, ops[1].value);
6562 }
6563
6564 /* Return true if VEC_PERM_EXPR can be expanded using SIMD extensions
6565    of the CPU.  SEL may be NULL, which stands for an unknown constant.  */
6566
6567 bool
6568 can_vec_perm_p (machine_mode mode, bool variable,
6569                 const unsigned char *sel)
6570 {
6571   machine_mode qimode;
6572
6573   /* If the target doesn't implement a vector mode for the vector type,
6574      then no operations are supported.  */
6575   if (!VECTOR_MODE_P (mode))
6576     return false;
6577
6578   if (!variable)
6579     {
6580       if (direct_optab_handler (vec_perm_const_optab, mode) != CODE_FOR_nothing
6581           && (sel == NULL
6582               || targetm.vectorize.vec_perm_const_ok == NULL
6583               || targetm.vectorize.vec_perm_const_ok (mode, sel)))
6584         return true;
6585     }
6586
6587   if (direct_optab_handler (vec_perm_optab, mode) != CODE_FOR_nothing)
6588     return true;
6589
6590   /* We allow fallback to a QI vector mode, and adjust the mask.  */
6591   if (GET_MODE_INNER (mode) == QImode)
6592     return false;
6593   qimode = mode_for_vector (QImode, GET_MODE_SIZE (mode));
6594   if (!VECTOR_MODE_P (qimode))
6595     return false;
6596
6597   /* ??? For completeness, we ought to check the QImode version of
6598       vec_perm_const_optab.  But all users of this implicit lowering
6599       feature implement the variable vec_perm_optab.  */
6600   if (direct_optab_handler (vec_perm_optab, qimode) == CODE_FOR_nothing)
6601     return false;
6602
6603   /* In order to support the lowering of variable permutations,
6604      we need to support shifts and adds.  */
6605   if (variable)
6606     {
6607       if (GET_MODE_UNIT_SIZE (mode) > 2
6608           && optab_handler (ashl_optab, mode) == CODE_FOR_nothing
6609           && optab_handler (vashl_optab, mode) == CODE_FOR_nothing)
6610         return false;
6611       if (optab_handler (add_optab, qimode) == CODE_FOR_nothing)
6612         return false;
6613     }
6614
6615   return true;
6616 }
6617
6618 /* A subroutine of expand_vec_perm for expanding one vec_perm insn.  */
6619
6620 static rtx
6621 expand_vec_perm_1 (enum insn_code icode, rtx target,
6622                    rtx v0, rtx v1, rtx sel)
6623 {
6624   machine_mode tmode = GET_MODE (target);
6625   machine_mode smode = GET_MODE (sel);
6626   struct expand_operand ops[4];
6627
6628   create_output_operand (&ops[0], target, tmode);
6629   create_input_operand (&ops[3], sel, smode);
6630
6631   /* Make an effort to preserve v0 == v1.  The target expander is able to
6632      rely on this to determine if we're permuting a single input operand.  */
6633   if (rtx_equal_p (v0, v1))
6634     {
6635       if (!insn_operand_matches (icode, 1, v0))
6636         v0 = force_reg (tmode, v0);
6637       gcc_checking_assert (insn_operand_matches (icode, 1, v0));
6638       gcc_checking_assert (insn_operand_matches (icode, 2, v0));
6639
6640       create_fixed_operand (&ops[1], v0);
6641       create_fixed_operand (&ops[2], v0);
6642     }
6643   else
6644     {
6645       create_input_operand (&ops[1], v0, tmode);
6646       create_input_operand (&ops[2], v1, tmode);
6647     }
6648
6649   if (maybe_expand_insn (icode, 4, ops))
6650     return ops[0].value;
6651   return NULL_RTX;
6652 }
6653
/* Generate instructions for vec_perm optab given its mode
   and three operands: the input vectors V0 and V1 and the selector SEL,
   which must have a MODE_VECTOR_INT mode.  TARGET is used for the result
   if it is non-null and has mode MODE; otherwise a new pseudo is used.

   The strategies are tried in this order:
     1. for a CONST_VECTOR selector, vec_perm_const in MODE;
     2. for a CONST_VECTOR selector, vec_perm_const in the byte-element
        vector mode of the same size, with the selector rewritten per byte;
     3. the variable vec_perm pattern in MODE;
     4. the variable vec_perm pattern in the byte-element vector mode,
        with the selector lowered to byte indices.

   Return the rtx holding the result, or NULL_RTX if none applies.  */

rtx
expand_vec_perm (machine_mode mode, rtx v0, rtx v1, rtx sel, rtx target)
{
  enum insn_code icode;
  machine_mode qimode;
  unsigned int i, w, e, u;
  rtx tmp, sel_qi = NULL;
  rtvec vec;

  if (!target || GET_MODE (target) != mode)
    target = gen_reg_rtx (mode);

  /* W is the vector size in bytes, E the number of elements and U the
     size of one element in bytes.  */
  w = GET_MODE_SIZE (mode);
  e = GET_MODE_NUNITS (mode);
  u = GET_MODE_UNIT_SIZE (mode);

  /* Set QIMODE to a different vector mode with byte elements.
     If no such mode, or if MODE already has byte elements, use VOIDmode.  */
  qimode = VOIDmode;
  if (GET_MODE_INNER (mode) != QImode)
    {
      qimode = mode_for_vector (QImode, w);
      if (!VECTOR_MODE_P (qimode))
        qimode = VOIDmode;
    }

  /* If the input is a constant, expand it specially.  */
  gcc_assert (GET_MODE_CLASS (GET_MODE (sel)) == MODE_VECTOR_INT);
  if (GET_CODE (sel) == CONST_VECTOR)
    {
      icode = direct_optab_handler (vec_perm_const_optab, mode);
      if (icode != CODE_FOR_nothing)
        {
          tmp = expand_vec_perm_1 (icode, target, v0, v1, sel);
          if (tmp)
            return tmp;
        }

      /* Fall back to a constant byte-based permutation.  */
      if (qimode != VOIDmode)
        {
          vec = rtvec_alloc (w);
          for (i = 0; i < e; ++i)
            {
              unsigned int j, this_e;

              /* Mask the element index with 2*E - 1 (presumably wrapping it
                 into the 2*E elements of V0 and V1; this assumes E is a
                 power of two), then scale it to a byte offset.  */
              this_e = INTVAL (CONST_VECTOR_ELT (sel, i));
              this_e &= 2 * e - 1;
              this_e *= u;

              /* Select the U consecutive bytes of that element.  */
              for (j = 0; j < u; ++j)
                RTVEC_ELT (vec, i * u + j) = GEN_INT (this_e + j);
            }
          sel_qi = gen_rtx_CONST_VECTOR (qimode, vec);

          icode = direct_optab_handler (vec_perm_const_optab, qimode);
          if (icode != CODE_FOR_nothing)
            {
              tmp = mode != qimode ? gen_reg_rtx (qimode) : target;
              tmp = expand_vec_perm_1 (icode, tmp, gen_lowpart (qimode, v0),
                                       gen_lowpart (qimode, v1), sel_qi);
              if (tmp)
                return gen_lowpart (mode, tmp);
            }
        }
    }

  /* Otherwise expand as a fully variable permutation.  */
  icode = direct_optab_handler (vec_perm_optab, mode);
  if (icode != CODE_FOR_nothing)
    {
      tmp = expand_vec_perm_1 (icode, target, v0, v1, sel);
      if (tmp)
        return tmp;
    }

  /* As a special case to aid several targets, lower the element-based
     permutation to a byte-based permutation and try again.  */
  if (qimode == VOIDmode)
    return NULL_RTX;
  icode = direct_optab_handler (vec_perm_optab, qimode);
  if (icode == CODE_FOR_nothing)
    return NULL_RTX;

  /* SEL_QI is already set if the constant path above built a byte
     selector but found no vec_perm_const pattern for QIMODE.  */
  if (sel_qi == NULL)
    {
      /* Multiply each element by its byte size.  */
      machine_mode selmode = GET_MODE (sel);
      if (u == 2)
        sel = expand_simple_binop (selmode, PLUS, sel, sel,
                                   sel, 0, OPTAB_DIRECT);
      else
        sel = expand_simple_binop (selmode, ASHIFT, sel,
                                   GEN_INT (exact_log2 (u)),
                                   sel, 0, OPTAB_DIRECT);
      gcc_assert (sel != NULL);

      /* Broadcast the low byte of each element into each of its bytes.  */
      vec = rtvec_alloc (w);
      for (i = 0; i < w; ++i)
        {
          /* Index of the first byte of the element containing byte I;
             on big-endian targets use the element's last byte instead.  */
          int this_e = i / u * u;
          if (BYTES_BIG_ENDIAN)
            this_e += u - 1;
          RTVEC_ELT (vec, i) = GEN_INT (this_e);
        }
      tmp = gen_rtx_CONST_VECTOR (qimode, vec);
      sel = gen_lowpart (qimode, sel);
      /* Recursive call: permute the selector itself in QIMODE.  */
      sel = expand_vec_perm (qimode, sel, sel, tmp, NULL);
      gcc_assert (sel != NULL);

      /* Add the byte offset to each byte element.  */
      /* Note that the definition of the indices here is memory ordering,
         so there should be no difference between big and little endian.  */
      vec = rtvec_alloc (w);
      for (i = 0; i < w; ++i)
        RTVEC_ELT (vec, i) = GEN_INT (i % u);
      tmp = gen_rtx_CONST_VECTOR (qimode, vec);
      sel_qi = expand_simple_binop (qimode, PLUS, sel, tmp,
                                    sel, 0, OPTAB_DIRECT);
      gcc_assert (sel_qi != NULL);
    }

  /* Permute in QIMODE and view the result back in MODE.  */
  tmp = mode != qimode ? gen_reg_rtx (qimode) : target;
  tmp = expand_vec_perm_1 (icode, tmp, gen_lowpart (qimode, v0),
                           gen_lowpart (qimode, v1), sel_qi);
  if (tmp)
    tmp = gen_lowpart (mode, tmp);
  return tmp;
}
6787
6788 /* Return insn code for a conditional operator with a comparison in
6789    mode CMODE, unsigned if UNS is true, resulting in a value of mode VMODE.  */
6790
6791 static inline enum insn_code
6792 get_vcond_icode (machine_mode vmode, machine_mode cmode, bool uns)
6793 {
6794   enum insn_code icode = CODE_FOR_nothing;
6795   if (uns)
6796     icode = convert_optab_handler (vcondu_optab, vmode, cmode);
6797   else
6798     icode = convert_optab_handler (vcond_optab, vmode, cmode);
6799   return icode;
6800 }
6801
6802 /* Return TRUE iff, appropriate vector insns are available
6803    for vector cond expr with vector type VALUE_TYPE and a comparison
6804    with operand vector types in CMP_OP_TYPE.  */
6805
6806 bool
6807 expand_vec_cond_expr_p (tree value_type, tree cmp_op_type)
6808 {
6809   machine_mode value_mode = TYPE_MODE (value_type);
6810   machine_mode cmp_op_mode = TYPE_MODE (cmp_op_type);
6811   if (GET_MODE_SIZE (value_mode) != GET_MODE_SIZE (cmp_op_mode)
6812       || GET_MODE_NUNITS (value_mode) != GET_MODE_NUNITS (cmp_op_mode)
6813       || get_vcond_icode (TYPE_MODE (value_type), TYPE_MODE (cmp_op_type),
6814                           TYPE_UNSIGNED (cmp_op_type)) == CODE_FOR_nothing)
6815     return false;
6816   return true;
6817 }
6818
6819 /* Generate insns for a VEC_COND_EXPR, given its TYPE and its
6820    three operands.  */
6821
6822 rtx
6823 expand_vec_cond_expr (tree vec_cond_type, tree op0, tree op1, tree op2,
6824                       rtx target)
6825 {
6826   struct expand_operand ops[6];
6827   enum insn_code icode;
6828   rtx comparison, rtx_op1, rtx_op2;
6829   machine_mode mode = TYPE_MODE (vec_cond_type);
6830   machine_mode cmp_op_mode;
6831   bool unsignedp;
6832   tree op0a, op0b;
6833   enum tree_code tcode;
6834
6835   if (COMPARISON_CLASS_P (op0))
6836     {
6837       op0a = TREE_OPERAND (op0, 0);
6838       op0b = TREE_OPERAND (op0, 1);
6839       tcode = TREE_CODE (op0);
6840     }
6841   else
6842     {
6843       /* Fake op0 < 0.  */
6844       gcc_assert (!TYPE_UNSIGNED (TREE_TYPE (op0)));
6845       op0a = op0;
6846       op0b = build_zero_cst (TREE_TYPE (op0));
6847       tcode = LT_EXPR;
6848     }
6849   unsignedp = TYPE_UNSIGNED (TREE_TYPE (op0a));
6850   cmp_op_mode = TYPE_MODE (TREE_TYPE (op0a));
6851
6852
6853   gcc_assert (GET_MODE_SIZE (mode) == GET_MODE_SIZE (cmp_op_mode)
6854               && GET_MODE_NUNITS (mode) == GET_MODE_NUNITS (cmp_op_mode));
6855
6856   icode = get_vcond_icode (mode, cmp_op_mode, unsignedp);
6857   if (icode == CODE_FOR_nothing)
6858     return 0;
6859
6860   comparison = vector_compare_rtx (tcode, op0a, op0b, unsignedp, icode);
6861   rtx_op1 = expand_normal (op1);
6862   rtx_op2 = expand_normal (op2);
6863
6864   create_output_operand (&ops[0], target, mode);
6865   create_input_operand (&ops[1], rtx_op1, mode);
6866   create_input_operand (&ops[2], rtx_op2, mode);
6867   create_fixed_operand (&ops[3], comparison);
6868   create_fixed_operand (&ops[4], XEXP (comparison, 0));
6869   create_fixed_operand (&ops[5], XEXP (comparison, 1));
6870   expand_insn (icode, 6, ops);
6871   return ops[0].value;
6872 }
6873
6874 /* Return non-zero if a highpart multiply is supported of can be synthisized.
6875    For the benefit of expand_mult_highpart, the return value is 1 for direct,
6876    2 for even/odd widening, and 3 for hi/lo widening.  */
6877
6878 int
6879 can_mult_highpart_p (machine_mode mode, bool uns_p)
6880 {
6881   optab op;
6882   unsigned char *sel;
6883   unsigned i, nunits;
6884
6885   op = uns_p ? umul_highpart_optab : smul_highpart_optab;
6886   if (optab_handler (op, mode) != CODE_FOR_nothing)
6887     return 1;
6888
6889   /* If the mode is an integral vector, synth from widening operations.  */
6890   if (GET_MODE_CLASS (mode) != MODE_VECTOR_INT)
6891     return 0;
6892
6893   nunits = GET_MODE_NUNITS (mode);
6894   sel = XALLOCAVEC (unsigned char, nunits);
6895
6896   op = uns_p ? vec_widen_umult_even_optab : vec_widen_smult_even_optab;
6897   if (optab_handler (op, mode) != CODE_FOR_nothing)
6898     {
6899       op = uns_p ? vec_widen_umult_odd_optab : vec_widen_smult_odd_optab;
6900       if (optab_handler (op, mode) != CODE_FOR_nothing)
6901         {
6902           for (i = 0; i < nunits; ++i)
6903             sel[i] = !BYTES_BIG_ENDIAN + (i & ~1) + ((i & 1) ? nunits : 0);
6904           if (can_vec_perm_p (mode, false, sel))
6905             return 2;
6906         }
6907     }
6908
6909   op = uns_p ? vec_widen_umult_hi_optab : vec_widen_smult_hi_optab;
6910   if (optab_handler (op, mode) != CODE_FOR_nothing)
6911     {
6912       op = uns_p ? vec_widen_umult_lo_optab : vec_widen_smult_lo_optab;
6913       if (optab_handler (op, mode) != CODE_FOR_nothing)
6914         {
6915           for (i = 0; i < nunits; ++i)
6916             sel[i] = 2 * i + (BYTES_BIG_ENDIAN ? 0 : 1);
6917           if (can_vec_perm_p (mode, false, sel))
6918             return 3;
6919         }
6920     }
6921
6922   return 0;
6923 }
6924
6925 /* Expand a highpart multiply.  */
6926
6927 rtx
6928 expand_mult_highpart (machine_mode mode, rtx op0, rtx op1,
6929                       rtx target, bool uns_p)
6930 {
6931   struct expand_operand eops[3];
6932   enum insn_code icode;
6933   int method, i, nunits;
6934   machine_mode wmode;
6935   rtx m1, m2, perm;
6936   optab tab1, tab2;
6937   rtvec v;
6938
6939   method = can_mult_highpart_p (mode, uns_p);
6940   switch (method)
6941     {
6942     case 0:
6943       return NULL_RTX;
6944     case 1:
6945       tab1 = uns_p ? umul_highpart_optab : smul_highpart_optab;
6946       return expand_binop (mode, tab1, op0, op1, target, uns_p,
6947                            OPTAB_LIB_WIDEN);
6948     case 2:
6949       tab1 = uns_p ? vec_widen_umult_even_optab : vec_widen_smult_even_optab;
6950       tab2 = uns_p ? vec_widen_umult_odd_optab : vec_widen_smult_odd_optab;
6951       break;
6952     case 3:
6953       tab1 = uns_p ? vec_widen_umult_lo_optab : vec_widen_smult_lo_optab;
6954       tab2 = uns_p ? vec_widen_umult_hi_optab : vec_widen_smult_hi_optab;
6955       if (BYTES_BIG_ENDIAN)
6956         {
6957           optab t = tab1;
6958           tab1 = tab2;
6959           tab2 = t;
6960         }
6961       break;
6962     default:
6963       gcc_unreachable ();
6964     }
6965
6966   icode = optab_handler (tab1, mode);
6967   nunits = GET_MODE_NUNITS (mode);
6968   wmode = insn_data[icode].operand[0].mode;
6969   gcc_checking_assert (2 * GET_MODE_NUNITS (wmode) == nunits);
6970   gcc_checking_assert (GET_MODE_SIZE (wmode) == GET_MODE_SIZE (mode));
6971
6972   create_output_operand (&eops[0], gen_reg_rtx (wmode), wmode);
6973   create_input_operand (&eops[1], op0, mode);
6974   create_input_operand (&eops[2], op1, mode);
6975   expand_insn (icode, 3, eops);
6976   m1 = gen_lowpart (mode, eops[0].value);
6977
6978   create_output_operand (&eops[0], gen_reg_rtx (wmode), wmode);
6979   create_input_operand (&eops[1], op0, mode);
6980   create_input_operand (&eops[2], op1, mode);
6981   expand_insn (optab_handler (tab2, mode), 3, eops);
6982   m2 = gen_lowpart (mode, eops[0].value);
6983
6984   v = rtvec_alloc (nunits);
6985   if (method == 2)
6986     {
6987       for (i = 0; i < nunits; ++i)
6988         RTVEC_ELT (v, i) = GEN_INT (!BYTES_BIG_ENDIAN + (i & ~1)
6989                                     + ((i & 1) ? nunits : 0));
6990     }
6991   else
6992     {
6993       for (i = 0; i < nunits; ++i)
6994         RTVEC_ELT (v, i) = GEN_INT (2 * i + (BYTES_BIG_ENDIAN ? 0 : 1));
6995     }
6996   perm = gen_rtx_CONST_VECTOR (mode, v);
6997
6998   return expand_vec_perm (mode, m1, m2, perm, target);
6999 }
7000
7001 /* Return true if target supports vector masked load/store for mode.  */
7002 bool
7003 can_vec_mask_load_store_p (machine_mode mode, bool is_load)
7004 {
7005   optab op = is_load ? maskload_optab : maskstore_optab;
7006   machine_mode vmode;
7007   unsigned int vector_sizes;
7008
7009   /* If mode is vector mode, check it directly.  */
7010   if (VECTOR_MODE_P (mode))
7011     return optab_handler (op, mode) != CODE_FOR_nothing;
7012
7013   /* Otherwise, return true if there is some vector mode with
7014      the mask load/store supported.  */
7015
7016   /* See if there is any chance the mask load or store might be
7017      vectorized.  If not, punt.  */
7018   vmode = targetm.vectorize.preferred_simd_mode (mode);
7019   if (!VECTOR_MODE_P (vmode))
7020     return false;
7021
7022   if (optab_handler (op, vmode) != CODE_FOR_nothing)
7023     return true;
7024
7025   vector_sizes = targetm.vectorize.autovectorize_vector_sizes ();
7026   while (vector_sizes != 0)
7027     {
7028       unsigned int cur = 1 << floor_log2 (vector_sizes);
7029       vector_sizes &= ~cur;
7030       if (cur <= GET_MODE_SIZE (mode))
7031         continue;
7032       vmode = mode_for_vector (mode, cur / GET_MODE_SIZE (mode));
7033       if (VECTOR_MODE_P (vmode)
7034           && optab_handler (op, vmode) != CODE_FOR_nothing)
7035         return true;
7036     }
7037   return false;
7038 }
7039 \f
7040 /* Return true if there is a compare_and_swap pattern.  */
7041
7042 bool
7043 can_compare_and_swap_p (machine_mode mode, bool allow_libcall)
7044 {
7045   enum insn_code icode;
7046
7047   /* Check for __atomic_compare_and_swap.  */
7048   icode = direct_optab_handler (atomic_compare_and_swap_optab, mode);
7049   if (icode != CODE_FOR_nothing)
7050     return true;
7051
7052   /* Check for __sync_compare_and_swap.  */
7053   icode = optab_handler (sync_compare_and_swap_optab, mode);
7054   if (icode != CODE_FOR_nothing)
7055     return true;
7056   if (allow_libcall && optab_libfunc (sync_compare_and_swap_optab, mode))
7057     return true;
7058
7059   /* No inline compare and swap.  */
7060   return false;
7061 }
7062
7063 /* Return true if an atomic exchange can be performed.  */
7064
7065 bool
7066 can_atomic_exchange_p (machine_mode mode, bool allow_libcall)
7067 {
7068   enum insn_code icode;
7069
7070   /* Check for __atomic_exchange.  */
7071   icode = direct_optab_handler (atomic_exchange_optab, mode);
7072   if (icode != CODE_FOR_nothing)
7073     return true;
7074
7075   /* Don't check __sync_test_and_set, as on some platforms that
7076      has reduced functionality.  Targets that really do support
7077      a proper exchange should simply be updated to the __atomics.  */
7078
7079   return can_compare_and_swap_p (mode, allow_libcall);
7080 }
7081
7082
7083 /* Helper function to find the MODE_CC set in a sync_compare_and_swap
7084    pattern.  */
7085
7086 static void
7087 find_cc_set (rtx x, const_rtx pat, void *data)
7088 {
7089   if (REG_P (x) && GET_MODE_CLASS (GET_MODE (x)) == MODE_CC
7090       && GET_CODE (pat) == SET)
7091     {
7092       rtx *p_cc_reg = (rtx *) data;
7093       gcc_assert (!*p_cc_reg);
7094       *p_cc_reg = x;
7095     }
7096 }
7097
7098 /* This is a helper function for the other atomic operations.  This function
7099    emits a loop that contains SEQ that iterates until a compare-and-swap
7100    operation at the end succeeds.  MEM is the memory to be modified.  SEQ is
7101    a set of instructions that takes a value from OLD_REG as an input and
7102    produces a value in NEW_REG as an output.  Before SEQ, OLD_REG will be
7103    set to the current contents of MEM.  After SEQ, a compare-and-swap will
7104    attempt to update MEM with NEW_REG.  The function returns true when the
7105    loop was generated successfully.  */
7106
7107 static bool
7108 expand_compare_and_swap_loop (rtx mem, rtx old_reg, rtx new_reg, rtx seq)
7109 {
7110   machine_mode mode = GET_MODE (mem);
7111   rtx_code_label *label;
7112   rtx cmp_reg, success, oldval;
7113
7114   /* The loop we want to generate looks like
7115
7116         cmp_reg = mem;
7117       label:
7118         old_reg = cmp_reg;
7119         seq;
7120         (success, cmp_reg) = compare-and-swap(mem, old_reg, new_reg)
7121         if (success)
7122           goto label;
7123
7124      Note that we only do the plain load from memory once.  Subsequent
7125      iterations use the value loaded by the compare-and-swap pattern.  */
7126
7127   label = gen_label_rtx ();
7128   cmp_reg = gen_reg_rtx (mode);
7129
7130   emit_move_insn (cmp_reg, mem);
7131   emit_label (label);
7132   emit_move_insn (old_reg, cmp_reg);
7133   if (seq)
7134     emit_insn (seq);
7135
7136   success = NULL_RTX;
7137   oldval = cmp_reg;
7138   if (!expand_atomic_compare_and_swap (&success, &oldval, mem, old_reg,
7139                                        new_reg, false, MEMMODEL_SEQ_CST,
7140                                        MEMMODEL_RELAXED))
7141     return false;
7142
7143   if (oldval != cmp_reg)
7144     emit_move_insn (cmp_reg, oldval);
7145
7146   /* Mark this jump predicted not taken.  */
7147   emit_cmp_and_jump_insns (success, const0_rtx, EQ, const0_rtx,
7148                            GET_MODE (success), 1, label, 0);
7149   return true;
7150 }
7151
7152
7153 /* This function tries to emit an atomic_exchange intruction.  VAL is written
7154    to *MEM using memory model MODEL. The previous contents of *MEM are returned,
7155    using TARGET if possible.  */
7156
7157 static rtx
7158 maybe_emit_atomic_exchange (rtx target, rtx mem, rtx val, enum memmodel model)
7159 {
7160   machine_mode mode = GET_MODE (mem);
7161   enum insn_code icode;
7162
7163   /* If the target supports the exchange directly, great.  */
7164   icode = direct_optab_handler (atomic_exchange_optab, mode);
7165   if (icode != CODE_FOR_nothing)
7166     {
7167       struct expand_operand ops[4];
7168
7169       create_output_operand (&ops[0], target, mode);
7170       create_fixed_operand (&ops[1], mem);
7171       create_input_operand (&ops[2], val, mode);
7172       create_integer_operand (&ops[3], model);
7173       if (maybe_expand_insn (icode, 4, ops))
7174         return ops[0].value;
7175     }
7176
7177   return NULL_RTX;
7178 }
7179
7180 /* This function tries to implement an atomic exchange operation using
7181    __sync_lock_test_and_set. VAL is written to *MEM using memory model MODEL.
7182    The previous contents of *MEM are returned, using TARGET if possible.
7183    Since this instructionn is an acquire barrier only, stronger memory
7184    models may require additional barriers to be emitted.  */
7185
7186 static rtx
7187 maybe_emit_sync_lock_test_and_set (rtx target, rtx mem, rtx val,
7188                                    enum memmodel model)
7189 {
7190   machine_mode mode = GET_MODE (mem);
7191   enum insn_code icode;
7192   rtx_insn *last_insn = get_last_insn ();
7193
7194   icode = optab_handler (sync_lock_test_and_set_optab, mode);
7195
7196   /* Legacy sync_lock_test_and_set is an acquire barrier.  If the pattern
7197      exists, and the memory model is stronger than acquire, add a release
7198      barrier before the instruction.  */
7199
7200   if ((model & MEMMODEL_MASK) == MEMMODEL_SEQ_CST
7201       || (model & MEMMODEL_MASK) == MEMMODEL_RELEASE
7202       || (model & MEMMODEL_MASK) == MEMMODEL_ACQ_REL)
7203     expand_mem_thread_fence (model);
7204
7205   if (icode != CODE_FOR_nothing)
7206     {
7207       struct expand_operand ops[3];
7208       create_output_operand (&ops[0], target, mode);
7209       create_fixed_operand (&ops[1], mem);
7210       create_input_operand (&ops[2], val, mode);
7211       if (maybe_expand_insn (icode, 3, ops))
7212         return ops[0].value;
7213     }
7214
7215   /* If an external test-and-set libcall is provided, use that instead of
7216      any external compare-and-swap that we might get from the compare-and-
7217      swap-loop expansion later.  */
7218   if (!can_compare_and_swap_p (mode, false))
7219     {
7220       rtx libfunc = optab_libfunc (sync_lock_test_and_set_optab, mode);
7221       if (libfunc != NULL)
7222         {
7223           rtx addr;
7224
7225           addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
7226           return emit_library_call_value (libfunc, NULL_RTX, LCT_NORMAL,
7227                                           mode, 2, addr, ptr_mode,
7228                                           val, mode);
7229         }
7230     }
7231
7232   /* If the test_and_set can't be emitted, eliminate any barrier that might
7233      have been emitted.  */
7234   delete_insns_since (last_insn);
7235   return NULL_RTX;
7236 }
7237
7238 /* This function tries to implement an atomic exchange operation using a
7239    compare_and_swap loop. VAL is written to *MEM.  The previous contents of
7240    *MEM are returned, using TARGET if possible.  No memory model is required
7241    since a compare_and_swap loop is seq-cst.  */
7242
7243 static rtx
7244 maybe_emit_compare_and_swap_exchange_loop (rtx target, rtx mem, rtx val)
7245 {
7246   machine_mode mode = GET_MODE (mem);
7247
7248   if (can_compare_and_swap_p (mode, true))
7249     {
7250       if (!target || !register_operand (target, mode))
7251         target = gen_reg_rtx (mode);
7252       if (expand_compare_and_swap_loop (mem, target, val, NULL_RTX))
7253         return target;
7254     }
7255
7256   return NULL_RTX;
7257 }
7258
7259 /* This function tries to implement an atomic test-and-set operation
7260    using the atomic_test_and_set instruction pattern.  A boolean value
7261    is returned from the operation, using TARGET if possible.  */
7262
7263 #ifndef HAVE_atomic_test_and_set
7264 #define HAVE_atomic_test_and_set 0
7265 #define CODE_FOR_atomic_test_and_set CODE_FOR_nothing
7266 #endif
7267
7268 static rtx
7269 maybe_emit_atomic_test_and_set (rtx target, rtx mem, enum memmodel model)
7270 {
7271   machine_mode pat_bool_mode;
7272   struct expand_operand ops[3];
7273
7274   if (!HAVE_atomic_test_and_set)
7275     return NULL_RTX;
7276
7277   /* While we always get QImode from __atomic_test_and_set, we get
7278      other memory modes from __sync_lock_test_and_set.  Note that we
7279      use no endian adjustment here.  This matches the 4.6 behavior
7280      in the Sparc backend.  */
7281   gcc_checking_assert
7282     (insn_data[CODE_FOR_atomic_test_and_set].operand[1].mode == QImode);
7283   if (GET_MODE (mem) != QImode)
7284     mem = adjust_address_nv (mem, QImode, 0);
7285
7286   pat_bool_mode = insn_data[CODE_FOR_atomic_test_and_set].operand[0].mode;
7287   create_output_operand (&ops[0], target, pat_bool_mode);
7288   create_fixed_operand (&ops[1], mem);
7289   create_integer_operand (&ops[2], model);
7290
7291   if (maybe_expand_insn (CODE_FOR_atomic_test_and_set, 3, ops))
7292     return ops[0].value;
7293   return NULL_RTX;
7294 }
7295
7296 /* This function expands the legacy _sync_lock test_and_set operation which is
7297    generally an atomic exchange.  Some limited targets only allow the
7298    constant 1 to be stored.  This is an ACQUIRE operation.
7299
7300    TARGET is an optional place to stick the return value.
7301    MEM is where VAL is stored.  */
7302
7303 rtx
7304 expand_sync_lock_test_and_set (rtx target, rtx mem, rtx val)
7305 {
7306   rtx ret;
7307
7308   /* Try an atomic_exchange first.  */
7309   ret = maybe_emit_atomic_exchange (target, mem, val, MEMMODEL_ACQUIRE);
7310   if (ret)
7311     return ret;
7312
7313   ret = maybe_emit_sync_lock_test_and_set (target, mem, val, MEMMODEL_ACQUIRE);
7314   if (ret)
7315     return ret;
7316
7317   ret = maybe_emit_compare_and_swap_exchange_loop (target, mem, val);
7318   if (ret)
7319     return ret;
7320
7321   /* If there are no other options, try atomic_test_and_set if the value
7322      being stored is 1.  */
7323   if (val == const1_rtx)
7324     ret = maybe_emit_atomic_test_and_set (target, mem, MEMMODEL_ACQUIRE);
7325
7326   return ret;
7327 }
7328
7329 /* This function expands the atomic test_and_set operation:
7330    atomically store a boolean TRUE into MEM and return the previous value.
7331
7332    MEMMODEL is the memory model variant to use.
7333    TARGET is an optional place to stick the return value.  */
7334
7335 rtx
7336 expand_atomic_test_and_set (rtx target, rtx mem, enum memmodel model)
7337 {
7338   machine_mode mode = GET_MODE (mem);
7339   rtx ret, trueval, subtarget;
7340
7341   ret = maybe_emit_atomic_test_and_set (target, mem, model);
7342   if (ret)
7343     return ret;
7344
7345   /* Be binary compatible with non-default settings of trueval, and different
7346      cpu revisions.  E.g. one revision may have atomic-test-and-set, but
7347      another only has atomic-exchange.  */
7348   if (targetm.atomic_test_and_set_trueval == 1)
7349     {
7350       trueval = const1_rtx;
7351       subtarget = target ? target : gen_reg_rtx (mode);
7352     }
7353   else
7354     {
7355       trueval = gen_int_mode (targetm.atomic_test_and_set_trueval, mode);
7356       subtarget = gen_reg_rtx (mode);
7357     }
7358
7359   /* Try the atomic-exchange optab...  */
7360   ret = maybe_emit_atomic_exchange (subtarget, mem, trueval, model);
7361
7362   /* ... then an atomic-compare-and-swap loop ... */
7363   if (!ret)
7364     ret = maybe_emit_compare_and_swap_exchange_loop (subtarget, mem, trueval);
7365
7366   /* ... before trying the vaguely defined legacy lock_test_and_set. */
7367   if (!ret)
7368     ret = maybe_emit_sync_lock_test_and_set (subtarget, mem, trueval, model);
7369
7370   /* Recall that the legacy lock_test_and_set optab was allowed to do magic
7371      things with the value 1.  Thus we try again without trueval.  */
7372   if (!ret && targetm.atomic_test_and_set_trueval != 1)
7373     ret = maybe_emit_sync_lock_test_and_set (subtarget, mem, const1_rtx, model);
7374
7375   /* Failing all else, assume a single threaded environment and simply
7376      perform the operation.  */
7377   if (!ret)
7378     {
7379       /* If the result is ignored skip the move to target.  */
7380       if (subtarget != const0_rtx)
7381         emit_move_insn (subtarget, mem);
7382
7383       emit_move_insn (mem, trueval);
7384       ret = subtarget;
7385     }
7386
7387   /* Recall that have to return a boolean value; rectify if trueval
7388      is not exactly one.  */
7389   if (targetm.atomic_test_and_set_trueval != 1)
7390     ret = emit_store_flag_force (target, NE, ret, const0_rtx, mode, 0, 1);
7391
7392   return ret;
7393 }
7394
7395 /* This function expands the atomic exchange operation:
7396    atomically store VAL in MEM and return the previous value in MEM.
7397
7398    MEMMODEL is the memory model variant to use.
7399    TARGET is an optional place to stick the return value.  */
7400
7401 rtx
7402 expand_atomic_exchange (rtx target, rtx mem, rtx val, enum memmodel model)
7403 {
7404   rtx ret;
7405
7406   ret = maybe_emit_atomic_exchange (target, mem, val, model);
7407
7408   /* Next try a compare-and-swap loop for the exchange.  */
7409   if (!ret)
7410     ret = maybe_emit_compare_and_swap_exchange_loop (target, mem, val);
7411
7412   return ret;
7413 }
7414
7415 /* This function expands the atomic compare exchange operation:
7416
7417    *PTARGET_BOOL is an optional place to store the boolean success/failure.
7418    *PTARGET_OVAL is an optional place to store the old value from memory.
7419    Both target parameters may be NULL to indicate that we do not care about
7420    that return value.  Both target parameters are updated on success to
7421    the actual location of the corresponding result.
7422
7423    MEMMODEL is the memory model variant to use.
7424
7425    The return value of the function is true for success.  */
7426
7427 bool
7428 expand_atomic_compare_and_swap (rtx *ptarget_bool, rtx *ptarget_oval,
7429                                 rtx mem, rtx expected, rtx desired,
7430                                 bool is_weak, enum memmodel succ_model,
7431                                 enum memmodel fail_model)
7432 {
7433   machine_mode mode = GET_MODE (mem);
7434   struct expand_operand ops[8];
7435   enum insn_code icode;
7436   rtx target_oval, target_bool = NULL_RTX;
7437   rtx libfunc;
7438
7439   /* Load expected into a register for the compare and swap.  */
7440   if (MEM_P (expected))
7441     expected = copy_to_reg (expected);
7442
7443   /* Make sure we always have some place to put the return oldval.
7444      Further, make sure that place is distinct from the input expected,
7445      just in case we need that path down below.  */
7446   if (ptarget_oval == NULL
7447       || (target_oval = *ptarget_oval) == NULL
7448       || reg_overlap_mentioned_p (expected, target_oval))
7449     target_oval = gen_reg_rtx (mode);
7450
7451   icode = direct_optab_handler (atomic_compare_and_swap_optab, mode);
7452   if (icode != CODE_FOR_nothing)
7453     {
7454       machine_mode bool_mode = insn_data[icode].operand[0].mode;
7455
7456       /* Make sure we always have a place for the bool operand.  */
7457       if (ptarget_bool == NULL
7458           || (target_bool = *ptarget_bool) == NULL
7459           || GET_MODE (target_bool) != bool_mode)
7460         target_bool = gen_reg_rtx (bool_mode);
7461
7462       /* Emit the compare_and_swap.  */
7463       create_output_operand (&ops[0], target_bool, bool_mode);
7464       create_output_operand (&ops[1], target_oval, mode);
7465       create_fixed_operand (&ops[2], mem);
7466       create_input_operand (&ops[3], expected, mode);
7467       create_input_operand (&ops[4], desired, mode);
7468       create_integer_operand (&ops[5], is_weak);
7469       create_integer_operand (&ops[6], succ_model);
7470       create_integer_operand (&ops[7], fail_model);
7471       if (maybe_expand_insn (icode, 8, ops))
7472         {
7473           /* Return success/failure.  */
7474           target_bool = ops[0].value;
7475           target_oval = ops[1].value;
7476           goto success;
7477         }
7478     }
7479
7480   /* Otherwise fall back to the original __sync_val_compare_and_swap
7481      which is always seq-cst.  */
7482   icode = optab_handler (sync_compare_and_swap_optab, mode);
7483   if (icode != CODE_FOR_nothing)
7484     {
7485       rtx cc_reg;
7486
7487       create_output_operand (&ops[0], target_oval, mode);
7488       create_fixed_operand (&ops[1], mem);
7489       create_input_operand (&ops[2], expected, mode);
7490       create_input_operand (&ops[3], desired, mode);
7491       if (!maybe_expand_insn (icode, 4, ops))
7492         return false;
7493
7494       target_oval = ops[0].value;
7495
7496       /* If the caller isn't interested in the boolean return value,
7497          skip the computation of it.  */
7498       if (ptarget_bool == NULL)
7499         goto success;
7500
7501       /* Otherwise, work out if the compare-and-swap succeeded.  */
7502       cc_reg = NULL_RTX;
7503       if (have_insn_for (COMPARE, CCmode))
7504         note_stores (PATTERN (get_last_insn ()), find_cc_set, &cc_reg);
7505       if (cc_reg)
7506         {
7507           target_bool = emit_store_flag_force (target_bool, EQ, cc_reg,
7508                                                const0_rtx, VOIDmode, 0, 1);
7509           goto success;
7510         }
7511       goto success_bool_from_val;
7512     }
7513
7514   /* Also check for library support for __sync_val_compare_and_swap.  */
7515   libfunc = optab_libfunc (sync_compare_and_swap_optab, mode);
7516   if (libfunc != NULL)
7517     {
7518       rtx addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
7519       target_oval = emit_library_call_value (libfunc, NULL_RTX, LCT_NORMAL,
7520                                              mode, 3, addr, ptr_mode,
7521                                              expected, mode, desired, mode);
7522
7523       /* Compute the boolean return value only if requested.  */
7524       if (ptarget_bool)
7525         goto success_bool_from_val;
7526       else
7527         goto success;
7528     }
7529
7530   /* Failure.  */
7531   return false;
7532
7533  success_bool_from_val:
7534    target_bool = emit_store_flag_force (target_bool, EQ, target_oval,
7535                                         expected, VOIDmode, 1, 1);
7536  success:
7537   /* Make sure that the oval output winds up where the caller asked.  */
7538   if (ptarget_oval)
7539     *ptarget_oval = target_oval;
7540   if (ptarget_bool)
7541     *ptarget_bool = target_bool;
7542   return true;
7543 }
7544
7545 /* Generate asm volatile("" : : : "memory") as the memory barrier.  */
7546
7547 static void
7548 expand_asm_memory_barrier (void)
7549 {
7550   rtx asm_op, clob;
7551
7552   asm_op = gen_rtx_ASM_OPERANDS (VOIDmode, empty_string, empty_string, 0,
7553                                  rtvec_alloc (0), rtvec_alloc (0),
7554                                  rtvec_alloc (0), UNKNOWN_LOCATION);
7555   MEM_VOLATILE_P (asm_op) = 1;
7556
7557   clob = gen_rtx_SCRATCH (VOIDmode);
7558   clob = gen_rtx_MEM (BLKmode, clob);
7559   clob = gen_rtx_CLOBBER (VOIDmode, clob);
7560
7561   emit_insn (gen_rtx_PARALLEL (VOIDmode, gen_rtvec (2, asm_op, clob)));
7562 }
7563
7564 /* This routine will either emit the mem_thread_fence pattern or issue a
7565    sync_synchronize to generate a fence for memory model MEMMODEL.  */
7566
7567 #ifndef HAVE_mem_thread_fence
7568 # define HAVE_mem_thread_fence 0
7569 # define gen_mem_thread_fence(x) (gcc_unreachable (), NULL_RTX)
7570 #endif
7571 #ifndef HAVE_memory_barrier
7572 # define HAVE_memory_barrier 0
7573 # define gen_memory_barrier()  (gcc_unreachable (), NULL_RTX)
7574 #endif
7575
7576 void
7577 expand_mem_thread_fence (enum memmodel model)
7578 {
7579   if (HAVE_mem_thread_fence)
7580     emit_insn (gen_mem_thread_fence (GEN_INT (model)));
7581   else if ((model & MEMMODEL_MASK) != MEMMODEL_RELAXED)
7582     {
7583       if (HAVE_memory_barrier)
7584         emit_insn (gen_memory_barrier ());
7585       else if (synchronize_libfunc != NULL_RTX)
7586         emit_library_call (synchronize_libfunc, LCT_NORMAL, VOIDmode, 0);
7587       else
7588         expand_asm_memory_barrier ();
7589     }
7590 }
7591
7592 /* This routine will either emit the mem_signal_fence pattern or issue a
7593    sync_synchronize to generate a fence for memory model MEMMODEL.  */
7594
7595 #ifndef HAVE_mem_signal_fence
7596 # define HAVE_mem_signal_fence 0
7597 # define gen_mem_signal_fence(x) (gcc_unreachable (), NULL_RTX)
7598 #endif
7599
7600 void
7601 expand_mem_signal_fence (enum memmodel model)
7602 {
7603   if (HAVE_mem_signal_fence)
7604     emit_insn (gen_mem_signal_fence (GEN_INT (model)));
7605   else if ((model & MEMMODEL_MASK) != MEMMODEL_RELAXED)
7606     {
7607       /* By default targets are coherent between a thread and the signal
7608          handler running on the same thread.  Thus this really becomes a
7609          compiler barrier, in that stores must not be sunk past
7610          (or raised above) a given point.  */
7611       expand_asm_memory_barrier ();
7612     }
7613 }
7614
7615 /* This function expands the atomic load operation:
7616    return the atomically loaded value in MEM.
7617
7618    MEMMODEL is the memory model variant to use.
7619    TARGET is an option place to stick the return value.  */
7620
7621 rtx
7622 expand_atomic_load (rtx target, rtx mem, enum memmodel model)
7623 {
7624   machine_mode mode = GET_MODE (mem);
7625   enum insn_code icode;
7626
7627   /* If the target supports the load directly, great.  */
7628   icode = direct_optab_handler (atomic_load_optab, mode);
7629   if (icode != CODE_FOR_nothing)
7630     {
7631       struct expand_operand ops[3];
7632
7633       create_output_operand (&ops[0], target, mode);
7634       create_fixed_operand (&ops[1], mem);
7635       create_integer_operand (&ops[2], model);
7636       if (maybe_expand_insn (icode, 3, ops))
7637         return ops[0].value;
7638     }
7639
7640   /* If the size of the object is greater than word size on this target,
7641      then we assume that a load will not be atomic.  */
7642   if (GET_MODE_PRECISION (mode) > BITS_PER_WORD)
7643     {
7644       /* Issue val = compare_and_swap (mem, 0, 0).
7645          This may cause the occasional harmless store of 0 when the value is
7646          already 0, but it seems to be OK according to the standards guys.  */
7647       if (expand_atomic_compare_and_swap (NULL, &target, mem, const0_rtx,
7648                                           const0_rtx, false, model, model))
7649         return target;
7650       else
7651       /* Otherwise there is no atomic load, leave the library call.  */
7652         return NULL_RTX;
7653     }
7654
7655   /* Otherwise assume loads are atomic, and emit the proper barriers.  */
7656   if (!target || target == const0_rtx)
7657     target = gen_reg_rtx (mode);
7658
7659   /* For SEQ_CST, emit a barrier before the load.  */
7660   if ((model & MEMMODEL_MASK) == MEMMODEL_SEQ_CST)
7661     expand_mem_thread_fence (model);
7662
7663   emit_move_insn (target, mem);
7664
7665   /* Emit the appropriate barrier after the load.  */
7666   expand_mem_thread_fence (model);
7667
7668   return target;
7669 }
7670
7671 /* This function expands the atomic store operation:
7672    Atomically store VAL in MEM.
7673    MEMMODEL is the memory model variant to use.
7674    USE_RELEASE is true if __sync_lock_release can be used as a fall back.
7675    function returns const0_rtx if a pattern was emitted.  */
7676
7677 rtx
7678 expand_atomic_store (rtx mem, rtx val, enum memmodel model, bool use_release)
7679 {
7680   machine_mode mode = GET_MODE (mem);
7681   enum insn_code icode;
7682   struct expand_operand ops[3];
7683
7684   /* If the target supports the store directly, great.  */
7685   icode = direct_optab_handler (atomic_store_optab, mode);
7686   if (icode != CODE_FOR_nothing)
7687     {
7688       create_fixed_operand (&ops[0], mem);
7689       create_input_operand (&ops[1], val, mode);
7690       create_integer_operand (&ops[2], model);
7691       if (maybe_expand_insn (icode, 3, ops))
7692         return const0_rtx;
7693     }
7694
7695   /* If using __sync_lock_release is a viable alternative, try it.  */
7696   if (use_release)
7697     {
7698       icode = direct_optab_handler (sync_lock_release_optab, mode);
7699       if (icode != CODE_FOR_nothing)
7700         {
7701           create_fixed_operand (&ops[0], mem);
7702           create_input_operand (&ops[1], const0_rtx, mode);
7703           if (maybe_expand_insn (icode, 2, ops))
7704             {
7705               /* lock_release is only a release barrier.  */
7706               if ((model & MEMMODEL_MASK) == MEMMODEL_SEQ_CST)
7707                 expand_mem_thread_fence (model);
7708               return const0_rtx;
7709             }
7710         }
7711     }
7712
7713   /* If the size of the object is greater than word size on this target,
7714      a default store will not be atomic, Try a mem_exchange and throw away
7715      the result.  If that doesn't work, don't do anything.  */
7716   if (GET_MODE_PRECISION (mode) > BITS_PER_WORD)
7717     {
7718       rtx target = maybe_emit_atomic_exchange (NULL_RTX, mem, val, model);
7719       if (!target)
7720         target = maybe_emit_compare_and_swap_exchange_loop (NULL_RTX, mem, val);
7721       if (target)
7722         return const0_rtx;
7723       else
7724         return NULL_RTX;
7725     }
7726
7727   /* Otherwise assume stores are atomic, and emit the proper barriers.  */
7728   expand_mem_thread_fence (model);
7729
7730   emit_move_insn (mem, val);
7731
7732   /* For SEQ_CST, also emit a barrier after the store.  */
7733   if ((model & MEMMODEL_MASK) == MEMMODEL_SEQ_CST)
7734     expand_mem_thread_fence (model);
7735
7736   return const0_rtx;
7737 }
7738
7739
7740 /* Structure containing the pointers and values required to process the
7741    various forms of the atomic_fetch_op and atomic_op_fetch builtins.  */
7742
7743 struct atomic_op_functions
7744 {
7745   direct_optab mem_fetch_before;
7746   direct_optab mem_fetch_after;
7747   direct_optab mem_no_result;
7748   optab fetch_before;
7749   optab fetch_after;
7750   direct_optab no_result;
7751   enum rtx_code reverse_code;
7752 };
7753
7754
7755 /* Fill in structure pointed to by OP with the various optab entries for an
7756    operation of type CODE.  */
7757
7758 static void
7759 get_atomic_op_for_code (struct atomic_op_functions *op, enum rtx_code code)
7760 {
7761   gcc_assert (op!= NULL);
7762
7763   /* If SWITCHABLE_TARGET is defined, then subtargets can be switched
7764      in the source code during compilation, and the optab entries are not
7765      computable until runtime.  Fill in the values at runtime.  */
7766   switch (code)
7767     {
7768     case PLUS:
7769       op->mem_fetch_before = atomic_fetch_add_optab;
7770       op->mem_fetch_after = atomic_add_fetch_optab;
7771       op->mem_no_result = atomic_add_optab;
7772       op->fetch_before = sync_old_add_optab;
7773       op->fetch_after = sync_new_add_optab;
7774       op->no_result = sync_add_optab;
7775       op->reverse_code = MINUS;
7776       break;
7777     case MINUS:
7778       op->mem_fetch_before = atomic_fetch_sub_optab;
7779       op->mem_fetch_after = atomic_sub_fetch_optab;
7780       op->mem_no_result = atomic_sub_optab;
7781       op->fetch_before = sync_old_sub_optab;
7782       op->fetch_after = sync_new_sub_optab;
7783       op->no_result = sync_sub_optab;
7784       op->reverse_code = PLUS;
7785       break;
7786     case XOR:
7787       op->mem_fetch_before = atomic_fetch_xor_optab;
7788       op->mem_fetch_after = atomic_xor_fetch_optab;
7789       op->mem_no_result = atomic_xor_optab;
7790       op->fetch_before = sync_old_xor_optab;
7791       op->fetch_after = sync_new_xor_optab;
7792       op->no_result = sync_xor_optab;
7793       op->reverse_code = XOR;
7794       break;
7795     case AND:
7796       op->mem_fetch_before = atomic_fetch_and_optab;
7797       op->mem_fetch_after = atomic_and_fetch_optab;
7798       op->mem_no_result = atomic_and_optab;
7799       op->fetch_before = sync_old_and_optab;
7800       op->fetch_after = sync_new_and_optab;
7801       op->no_result = sync_and_optab;
7802       op->reverse_code = UNKNOWN;
7803       break;
7804     case IOR:
7805       op->mem_fetch_before = atomic_fetch_or_optab;
7806       op->mem_fetch_after = atomic_or_fetch_optab;
7807       op->mem_no_result = atomic_or_optab;
7808       op->fetch_before = sync_old_ior_optab;
7809       op->fetch_after = sync_new_ior_optab;
7810       op->no_result = sync_ior_optab;
7811       op->reverse_code = UNKNOWN;
7812       break;
7813     case NOT:
7814       op->mem_fetch_before = atomic_fetch_nand_optab;
7815       op->mem_fetch_after = atomic_nand_fetch_optab;
7816       op->mem_no_result = atomic_nand_optab;
7817       op->fetch_before = sync_old_nand_optab;
7818       op->fetch_after = sync_new_nand_optab;
7819       op->no_result = sync_nand_optab;
7820       op->reverse_code = UNKNOWN;
7821       break;
7822     default:
7823       gcc_unreachable ();
7824     }
7825 }
7826
7827 /* See if there is a more optimal way to implement the operation "*MEM CODE VAL"
7828    using memory order MODEL.  If AFTER is true the operation needs to return
7829    the value of *MEM after the operation, otherwise the previous value.
7830    TARGET is an optional place to place the result.  The result is unused if
7831    it is const0_rtx.
7832    Return the result if there is a better sequence, otherwise NULL_RTX.  */
7833
7834 static rtx
7835 maybe_optimize_fetch_op (rtx target, rtx mem, rtx val, enum rtx_code code,
7836                          enum memmodel model, bool after)
7837 {
7838   /* If the value is prefetched, or not used, it may be possible to replace
7839      the sequence with a native exchange operation.  */
7840   if (!after || target == const0_rtx)
7841     {
7842       /* fetch_and (&x, 0, m) can be replaced with exchange (&x, 0, m).  */
7843       if (code == AND && val == const0_rtx)
7844         {
7845           if (target == const0_rtx)
7846             target = gen_reg_rtx (GET_MODE (mem));
7847           return maybe_emit_atomic_exchange (target, mem, val, model);
7848         }
7849
7850       /* fetch_or (&x, -1, m) can be replaced with exchange (&x, -1, m).  */
7851       if (code == IOR && val == constm1_rtx)
7852         {
7853           if (target == const0_rtx)
7854             target = gen_reg_rtx (GET_MODE (mem));
7855           return maybe_emit_atomic_exchange (target, mem, val, model);
7856         }
7857     }
7858
7859   return NULL_RTX;
7860 }
7861
7862 /* Try to emit an instruction for a specific operation varaition.
7863    OPTAB contains the OP functions.
7864    TARGET is an optional place to return the result. const0_rtx means unused.
7865    MEM is the memory location to operate on.
7866    VAL is the value to use in the operation.
7867    USE_MEMMODEL is TRUE if the variation with a memory model should be tried.
7868    MODEL is the memory model, if used.
7869    AFTER is true if the returned result is the value after the operation.  */
7870
7871 static rtx
7872 maybe_emit_op (const struct atomic_op_functions *optab, rtx target, rtx mem,
7873                rtx val, bool use_memmodel, enum memmodel model, bool after)
7874 {
7875   machine_mode mode = GET_MODE (mem);
7876   struct expand_operand ops[4];
7877   enum insn_code icode;
7878   int op_counter = 0;
7879   int num_ops;
7880
7881   /* Check to see if there is a result returned.  */
7882   if (target == const0_rtx)
7883     {
7884       if (use_memmodel)
7885         {
7886           icode = direct_optab_handler (optab->mem_no_result, mode);
7887           create_integer_operand (&ops[2], model);
7888           num_ops = 3;
7889         }
7890       else
7891         {
7892           icode = direct_optab_handler (optab->no_result, mode);
7893           num_ops = 2;
7894         }
7895     }
7896   /* Otherwise, we need to generate a result.  */
7897   else
7898     {
7899       if (use_memmodel)
7900         {
7901           icode = direct_optab_handler (after ? optab->mem_fetch_after
7902                                         : optab->mem_fetch_before, mode);
7903           create_integer_operand (&ops[3], model);
7904           num_ops = 4;
7905         }
7906       else
7907         {
7908           icode = optab_handler (after ? optab->fetch_after
7909                                  : optab->fetch_before, mode);
7910           num_ops = 3;
7911         }
7912       create_output_operand (&ops[op_counter++], target, mode);
7913     }
7914   if (icode == CODE_FOR_nothing)
7915     return NULL_RTX;
7916
7917   create_fixed_operand (&ops[op_counter++], mem);
7918   /* VAL may have been promoted to a wider mode.  Shrink it if so.  */
7919   create_convert_operand_to (&ops[op_counter++], val, mode, true);
7920
7921   if (maybe_expand_insn (icode, num_ops, ops))
7922     return (target == const0_rtx ? const0_rtx : ops[0].value);
7923
7924   return NULL_RTX;
7925 }
7926
7927
7928 /* This function expands an atomic fetch_OP or OP_fetch operation:
7929    TARGET is an option place to stick the return value.  const0_rtx indicates
7930    the result is unused.
7931    atomically fetch MEM, perform the operation with VAL and return it to MEM.
7932    CODE is the operation being performed (OP)
7933    MEMMODEL is the memory model variant to use.
7934    AFTER is true to return the result of the operation (OP_fetch).
7935    AFTER is false to return the value before the operation (fetch_OP).
7936
7937    This function will *only* generate instructions if there is a direct
7938    optab. No compare and swap loops or libcalls will be generated. */
7939
7940 static rtx
7941 expand_atomic_fetch_op_no_fallback (rtx target, rtx mem, rtx val,
7942                                     enum rtx_code code, enum memmodel model,
7943                                     bool after)
7944 {
7945   machine_mode mode = GET_MODE (mem);
7946   struct atomic_op_functions optab;
7947   rtx result;
7948   bool unused_result = (target == const0_rtx);
7949
7950   get_atomic_op_for_code (&optab, code);
7951
7952   /* Check to see if there are any better instructions.  */
7953   result = maybe_optimize_fetch_op (target, mem, val, code, model, after);
7954   if (result)
7955     return result;
7956
7957   /* Check for the case where the result isn't used and try those patterns.  */
7958   if (unused_result)
7959     {
7960       /* Try the memory model variant first.  */
7961       result = maybe_emit_op (&optab, target, mem, val, true, model, true);
7962       if (result)
7963         return result;
7964
7965       /* Next try the old style withuot a memory model.  */
7966       result = maybe_emit_op (&optab, target, mem, val, false, model, true);
7967       if (result)
7968         return result;
7969
7970       /* There is no no-result pattern, so try patterns with a result.  */
7971       target = NULL_RTX;
7972     }
7973
7974   /* Try the __atomic version.  */
7975   result = maybe_emit_op (&optab, target, mem, val, true, model, after);
7976   if (result)
7977     return result;
7978
7979   /* Try the older __sync version.  */
7980   result = maybe_emit_op (&optab, target, mem, val, false, model, after);
7981   if (result)
7982     return result;
7983
7984   /* If the fetch value can be calculated from the other variation of fetch,
7985      try that operation.  */
7986   if (after || unused_result || optab.reverse_code != UNKNOWN)
7987     {
7988       /* Try the __atomic version, then the older __sync version.  */
7989       result = maybe_emit_op (&optab, target, mem, val, true, model, !after);
7990       if (!result)
7991         result = maybe_emit_op (&optab, target, mem, val, false, model, !after);
7992
7993       if (result)
7994         {
7995           /* If the result isn't used, no need to do compensation code.  */
7996           if (unused_result)
7997             return result;
7998
7999           /* Issue compensation code.  Fetch_after  == fetch_before OP val.
8000              Fetch_before == after REVERSE_OP val.  */
8001           if (!after)
8002             code = optab.reverse_code;
8003           if (code == NOT)
8004             {
8005               result = expand_simple_binop (mode, AND, result, val, NULL_RTX,
8006                                             true, OPTAB_LIB_WIDEN);
8007               result = expand_simple_unop (mode, NOT, result, target, true);
8008             }
8009           else
8010             result = expand_simple_binop (mode, code, result, val, target,
8011                                           true, OPTAB_LIB_WIDEN);
8012           return result;
8013         }
8014     }
8015
8016   /* No direct opcode can be generated.  */
8017   return NULL_RTX;
8018 }
8019
8020
8021
8022 /* This function expands an atomic fetch_OP or OP_fetch operation:
8023    TARGET is an option place to stick the return value.  const0_rtx indicates
8024    the result is unused.
8025    atomically fetch MEM, perform the operation with VAL and return it to MEM.
8026    CODE is the operation being performed (OP)
8027    MEMMODEL is the memory model variant to use.
8028    AFTER is true to return the result of the operation (OP_fetch).
8029    AFTER is false to return the value before the operation (fetch_OP).  */
8030 rtx
8031 expand_atomic_fetch_op (rtx target, rtx mem, rtx val, enum rtx_code code,
8032                         enum memmodel model, bool after)
8033 {
8034   machine_mode mode = GET_MODE (mem);
8035   rtx result;
8036   bool unused_result = (target == const0_rtx);
8037
8038   result = expand_atomic_fetch_op_no_fallback (target, mem, val, code, model,
8039                                                after);
8040
8041   if (result)
8042     return result;
8043
8044   /* Add/sub can be implemented by doing the reverse operation with -(val).  */
8045   if (code == PLUS || code == MINUS)
8046     {
8047       rtx tmp;
8048       enum rtx_code reverse = (code == PLUS ? MINUS : PLUS);
8049
8050       start_sequence ();
8051       tmp = expand_simple_unop (mode, NEG, val, NULL_RTX, true);
8052       result = expand_atomic_fetch_op_no_fallback (target, mem, tmp, reverse,
8053                                                    model, after);
8054       if (result)
8055         {
8056           /* PLUS worked so emit the insns and return.  */
8057           tmp = get_insns ();
8058           end_sequence ();
8059           emit_insn (tmp);
8060           return result;
8061         }
8062
8063       /* PLUS did not work, so throw away the negation code and continue.  */
8064       end_sequence ();
8065     }
8066
8067   /* Try the __sync libcalls only if we can't do compare-and-swap inline.  */
8068   if (!can_compare_and_swap_p (mode, false))
8069     {
8070       rtx libfunc;
8071       bool fixup = false;
8072       enum rtx_code orig_code = code;
8073       struct atomic_op_functions optab;
8074
8075       get_atomic_op_for_code (&optab, code);
8076       libfunc = optab_libfunc (after ? optab.fetch_after
8077                                : optab.fetch_before, mode);
8078       if (libfunc == NULL
8079           && (after || unused_result || optab.reverse_code != UNKNOWN))
8080         {
8081           fixup = true;
8082           if (!after)
8083             code = optab.reverse_code;
8084           libfunc = optab_libfunc (after ? optab.fetch_before
8085                                    : optab.fetch_after, mode);
8086         }
8087       if (libfunc != NULL)
8088         {
8089           rtx addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
8090           result = emit_library_call_value (libfunc, NULL, LCT_NORMAL, mode,
8091                                             2, addr, ptr_mode, val, mode);
8092
8093           if (!unused_result && fixup)
8094             result = expand_simple_binop (mode, code, result, val, target,
8095                                           true, OPTAB_LIB_WIDEN);
8096           return result;
8097         }
8098
8099       /* We need the original code for any further attempts.  */
8100       code = orig_code;
8101     }
8102
8103   /* If nothing else has succeeded, default to a compare and swap loop.  */
8104   if (can_compare_and_swap_p (mode, true))
8105     {
8106       rtx_insn *insn;
8107       rtx t0 = gen_reg_rtx (mode), t1;
8108
8109       start_sequence ();
8110
8111       /* If the result is used, get a register for it.  */
8112       if (!unused_result)
8113         {
8114           if (!target || !register_operand (target, mode))
8115             target = gen_reg_rtx (mode);
8116           /* If fetch_before, copy the value now.  */
8117           if (!after)
8118             emit_move_insn (target, t0);
8119         }
8120       else
8121         target = const0_rtx;
8122
8123       t1 = t0;
8124       if (code == NOT)
8125         {
8126           t1 = expand_simple_binop (mode, AND, t1, val, NULL_RTX,
8127                                     true, OPTAB_LIB_WIDEN);
8128           t1 = expand_simple_unop (mode, code, t1, NULL_RTX, true);
8129         }
8130       else
8131         t1 = expand_simple_binop (mode, code, t1, val, NULL_RTX, true,
8132                                   OPTAB_LIB_WIDEN);
8133
8134       /* For after, copy the value now.  */
8135       if (!unused_result && after)
8136         emit_move_insn (target, t1);
8137       insn = get_insns ();
8138       end_sequence ();
8139
8140       if (t1 != NULL && expand_compare_and_swap_loop (mem, t0, t1, insn))
8141         return target;
8142     }
8143
8144   return NULL_RTX;
8145 }
8146 \f
8147 /* Return true if OPERAND is suitable for operand number OPNO of
8148    instruction ICODE.  */
8149
8150 bool
8151 insn_operand_matches (enum insn_code icode, unsigned int opno, rtx operand)
8152 {
8153   return (!insn_data[(int) icode].operand[opno].predicate
8154           || (insn_data[(int) icode].operand[opno].predicate
8155               (operand, insn_data[(int) icode].operand[opno].mode)));
8156 }
8157 \f
8158 /* TARGET is a target of a multiword operation that we are going to
8159    implement as a series of word-mode operations.  Return true if
8160    TARGET is suitable for this purpose.  */
8161
8162 bool
8163 valid_multiword_target_p (rtx target)
8164 {
8165   machine_mode mode;
8166   int i;
8167
8168   mode = GET_MODE (target);
8169   for (i = 0; i < GET_MODE_SIZE (mode); i += UNITS_PER_WORD)
8170     if (!validate_subreg (word_mode, mode, target, i))
8171       return false;
8172   return true;
8173 }
8174
8175 /* Like maybe_legitimize_operand, but do not change the code of the
8176    current rtx value.  */
8177
8178 static bool
8179 maybe_legitimize_operand_same_code (enum insn_code icode, unsigned int opno,
8180                                     struct expand_operand *op)
8181 {
8182   /* See if the operand matches in its current form.  */
8183   if (insn_operand_matches (icode, opno, op->value))
8184     return true;
8185
8186   /* If the operand is a memory whose address has no side effects,
8187      try forcing the address into a non-virtual pseudo register.
8188      The check for side effects is important because copy_to_mode_reg
8189      cannot handle things like auto-modified addresses.  */
8190   if (insn_data[(int) icode].operand[opno].allows_mem && MEM_P (op->value))
8191     {
8192       rtx addr, mem;
8193
8194       mem = op->value;
8195       addr = XEXP (mem, 0);
8196       if (!(REG_P (addr) && REGNO (addr) > LAST_VIRTUAL_REGISTER)
8197           && !side_effects_p (addr))
8198         {
8199           rtx_insn *last;
8200           machine_mode mode;
8201
8202           last = get_last_insn ();
8203           mode = get_address_mode (mem);
8204           mem = replace_equiv_address (mem, copy_to_mode_reg (mode, addr));
8205           if (insn_operand_matches (icode, opno, mem))
8206             {
8207               op->value = mem;
8208               return true;
8209             }
8210           delete_insns_since (last);
8211         }
8212     }
8213
8214   return false;
8215 }
8216
8217 /* Try to make OP match operand OPNO of instruction ICODE.  Return true
8218    on success, storing the new operand value back in OP.  */
8219
8220 static bool
8221 maybe_legitimize_operand (enum insn_code icode, unsigned int opno,
8222                           struct expand_operand *op)
8223 {
8224   machine_mode mode, imode;
8225   bool old_volatile_ok, result;
8226
8227   mode = op->mode;
8228   switch (op->type)
8229     {
8230     case EXPAND_FIXED:
8231       old_volatile_ok = volatile_ok;
8232       volatile_ok = true;
8233       result = maybe_legitimize_operand_same_code (icode, opno, op);
8234       volatile_ok = old_volatile_ok;
8235       return result;
8236
8237     case EXPAND_OUTPUT:
8238       gcc_assert (mode != VOIDmode);
8239       if (op->value
8240           && op->value != const0_rtx
8241           && GET_MODE (op->value) == mode
8242           && maybe_legitimize_operand_same_code (icode, opno, op))
8243         return true;
8244
8245       op->value = gen_reg_rtx (mode);
8246       break;
8247
8248     case EXPAND_INPUT:
8249     input:
8250       gcc_assert (mode != VOIDmode);
8251       gcc_assert (GET_MODE (op->value) == VOIDmode
8252                   || GET_MODE (op->value) == mode);
8253       if (maybe_legitimize_operand_same_code (icode, opno, op))
8254         return true;
8255
8256       op->value = copy_to_mode_reg (mode, op->value);
8257       break;
8258
8259     case EXPAND_CONVERT_TO:
8260       gcc_assert (mode != VOIDmode);
8261       op->value = convert_to_mode (mode, op->value, op->unsigned_p);
8262       goto input;
8263
8264     case EXPAND_CONVERT_FROM:
8265       if (GET_MODE (op->value) != VOIDmode)
8266         mode = GET_MODE (op->value);
8267       else
8268         /* The caller must tell us what mode this value has.  */
8269         gcc_assert (mode != VOIDmode);
8270
8271       imode = insn_data[(int) icode].operand[opno].mode;
8272       if (imode != VOIDmode && imode != mode)
8273         {
8274           op->value = convert_modes (imode, mode, op->value, op->unsigned_p);
8275           mode = imode;
8276         }
8277       goto input;
8278
8279     case EXPAND_ADDRESS:
8280       gcc_assert (mode != VOIDmode);
8281       op->value = convert_memory_address (mode, op->value);
8282       goto input;
8283
8284     case EXPAND_INTEGER:
8285       mode = insn_data[(int) icode].operand[opno].mode;
8286       if (mode != VOIDmode && const_int_operand (op->value, mode))
8287         goto input;
8288       break;
8289     }
8290   return insn_operand_matches (icode, opno, op->value);
8291 }
8292
8293 /* Make OP describe an input operand that should have the same value
8294    as VALUE, after any mode conversion that the target might request.
8295    TYPE is the type of VALUE.  */
8296
8297 void
8298 create_convert_operand_from_type (struct expand_operand *op,
8299                                   rtx value, tree type)
8300 {
8301   create_convert_operand_from (op, value, TYPE_MODE (type),
8302                                TYPE_UNSIGNED (type));
8303 }
8304
8305 /* Try to make operands [OPS, OPS + NOPS) match operands [OPNO, OPNO + NOPS)
8306    of instruction ICODE.  Return true on success, leaving the new operand
8307    values in the OPS themselves.  Emit no code on failure.  */
8308
8309 bool
8310 maybe_legitimize_operands (enum insn_code icode, unsigned int opno,
8311                            unsigned int nops, struct expand_operand *ops)
8312 {
8313   rtx_insn *last;
8314   unsigned int i;
8315
8316   last = get_last_insn ();
8317   for (i = 0; i < nops; i++)
8318     if (!maybe_legitimize_operand (icode, opno + i, &ops[i]))
8319       {
8320         delete_insns_since (last);
8321         return false;
8322       }
8323   return true;
8324 }
8325
8326 /* Try to generate instruction ICODE, using operands [OPS, OPS + NOPS)
8327    as its operands.  Return the instruction pattern on success,
8328    and emit any necessary set-up code.  Return null and emit no
8329    code on failure.  */
8330
8331 rtx
8332 maybe_gen_insn (enum insn_code icode, unsigned int nops,
8333                 struct expand_operand *ops)
8334 {
8335   gcc_assert (nops == (unsigned int) insn_data[(int) icode].n_generator_args);
8336   if (!maybe_legitimize_operands (icode, 0, nops, ops))
8337     return NULL_RTX;
8338
8339   switch (nops)
8340     {
8341     case 1:
8342       return GEN_FCN (icode) (ops[0].value);
8343     case 2:
8344       return GEN_FCN (icode) (ops[0].value, ops[1].value);
8345     case 3:
8346       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value);
8347     case 4:
8348       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8349                               ops[3].value);
8350     case 5:
8351       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8352                               ops[3].value, ops[4].value);
8353     case 6:
8354       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8355                               ops[3].value, ops[4].value, ops[5].value);
8356     case 7:
8357       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8358                               ops[3].value, ops[4].value, ops[5].value,
8359                               ops[6].value);
8360     case 8:
8361       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8362                               ops[3].value, ops[4].value, ops[5].value,
8363                               ops[6].value, ops[7].value);
8364     case 9:
8365       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8366                               ops[3].value, ops[4].value, ops[5].value,
8367                               ops[6].value, ops[7].value, ops[8].value);
8368     }
8369   gcc_unreachable ();
8370 }
8371
8372 /* Try to emit instruction ICODE, using operands [OPS, OPS + NOPS)
8373    as its operands.  Return true on success and emit no code on failure.  */
8374
8375 bool
8376 maybe_expand_insn (enum insn_code icode, unsigned int nops,
8377                    struct expand_operand *ops)
8378 {
8379   rtx pat = maybe_gen_insn (icode, nops, ops);
8380   if (pat)
8381     {
8382       emit_insn (pat);
8383       return true;
8384     }
8385   return false;
8386 }
8387
8388 /* Like maybe_expand_insn, but for jumps.  */
8389
8390 bool
8391 maybe_expand_jump_insn (enum insn_code icode, unsigned int nops,
8392                         struct expand_operand *ops)
8393 {
8394   rtx pat = maybe_gen_insn (icode, nops, ops);
8395   if (pat)
8396     {
8397       emit_jump_insn (pat);
8398       return true;
8399     }
8400   return false;
8401 }
8402
8403 /* Emit instruction ICODE, using operands [OPS, OPS + NOPS)
8404    as its operands.  */
8405
8406 void
8407 expand_insn (enum insn_code icode, unsigned int nops,
8408              struct expand_operand *ops)
8409 {
8410   if (!maybe_expand_insn (icode, nops, ops))
8411     gcc_unreachable ();
8412 }
8413
8414 /* Like expand_insn, but for jumps.  */
8415
8416 void
8417 expand_jump_insn (enum insn_code icode, unsigned int nops,
8418                   struct expand_operand *ops)
8419 {
8420   if (!maybe_expand_jump_insn (icode, nops, ops))
8421     gcc_unreachable ();
8422 }
8423
/* Supply fallback definitions for targets that lack an insv, extv or
   extzv pattern, so that the code using them needs no conditional
   compilation: the pattern is reported as unavailable and its insn code
   is CODE_FOR_nothing.  */
#if !defined (HAVE_insv)
# define HAVE_insv 0
# define CODE_FOR_insv CODE_FOR_nothing
#endif

#if !defined (HAVE_extv)
# define HAVE_extv 0
# define CODE_FOR_extv CODE_FOR_nothing
#endif

#if !defined (HAVE_extzv)
# define HAVE_extzv 0
# define CODE_FOR_extzv CODE_FOR_nothing
#endif
8437
/* The kinds of structure operand that an extraction_insn can work on.  */
enum extraction_type
{
  /* The structure is a misaligned memory.  */
  ET_unaligned_mem,
  /* The structure is a register.  */
  ET_reg
};
8441
8442 /* Check whether insv, extv or extzv pattern ICODE can be used for an
8443    insertion or extraction of type TYPE on a structure of mode MODE.
8444    Return true if so and fill in *INSN accordingly.  STRUCT_OP is the
8445    operand number of the structure (the first sign_extract or zero_extract
8446    operand) and FIELD_OP is the operand number of the field (the other
8447    side of the set from the sign_extract or zero_extract).  */
8448
8449 static bool
8450 get_traditional_extraction_insn (extraction_insn *insn,
8451                                  enum extraction_type type,
8452                                  machine_mode mode,
8453                                  enum insn_code icode,
8454                                  int struct_op, int field_op)
8455 {
8456   const struct insn_data_d *data = &insn_data[icode];
8457
8458   machine_mode struct_mode = data->operand[struct_op].mode;
8459   if (struct_mode == VOIDmode)
8460     struct_mode = word_mode;
8461   if (mode != struct_mode)
8462     return false;
8463
8464   machine_mode field_mode = data->operand[field_op].mode;
8465   if (field_mode == VOIDmode)
8466     field_mode = word_mode;
8467
8468   machine_mode pos_mode = data->operand[struct_op + 2].mode;
8469   if (pos_mode == VOIDmode)
8470     pos_mode = word_mode;
8471
8472   insn->icode = icode;
8473   insn->field_mode = field_mode;
8474   insn->struct_mode = (type == ET_unaligned_mem ? byte_mode : struct_mode);
8475   insn->pos_mode = pos_mode;
8476   return true;
8477 }
8478
8479 /* Return true if an optab exists to perform an insertion or extraction
8480    of type TYPE in mode MODE.  Describe the instruction in *INSN if so.
8481
8482    REG_OPTAB is the optab to use for register structures and
8483    MISALIGN_OPTAB is the optab to use for misaligned memory structures.
8484    POS_OP is the operand number of the bit position.  */
8485
8486 static bool
8487 get_optab_extraction_insn (struct extraction_insn *insn,
8488                            enum extraction_type type,
8489                            machine_mode mode, direct_optab reg_optab,
8490                            direct_optab misalign_optab, int pos_op)
8491 {
8492   direct_optab optab = (type == ET_unaligned_mem ? misalign_optab : reg_optab);
8493   enum insn_code icode = direct_optab_handler (optab, mode);
8494   if (icode == CODE_FOR_nothing)
8495     return false;
8496
8497   const struct insn_data_d *data = &insn_data[icode];
8498
8499   insn->icode = icode;
8500   insn->field_mode = mode;
8501   insn->struct_mode = (type == ET_unaligned_mem ? BLKmode : mode);
8502   insn->pos_mode = data->operand[pos_op].mode;
8503   if (insn->pos_mode == VOIDmode)
8504     insn->pos_mode = word_mode;
8505   return true;
8506 }
8507
8508 /* Return true if an instruction exists to perform an insertion or
8509    extraction (PATTERN says which) of type TYPE in mode MODE.
8510    Describe the instruction in *INSN if so.  */
8511
8512 static bool
8513 get_extraction_insn (extraction_insn *insn,
8514                      enum extraction_pattern pattern,
8515                      enum extraction_type type,
8516                      machine_mode mode)
8517 {
8518   switch (pattern)
8519     {
8520     case EP_insv:
8521       if (HAVE_insv
8522           && get_traditional_extraction_insn (insn, type, mode,
8523                                               CODE_FOR_insv, 0, 3))
8524         return true;
8525       return get_optab_extraction_insn (insn, type, mode, insv_optab,
8526                                         insvmisalign_optab, 2);
8527
8528     case EP_extv:
8529       if (HAVE_extv
8530           && get_traditional_extraction_insn (insn, type, mode,
8531                                               CODE_FOR_extv, 1, 0))
8532         return true;
8533       return get_optab_extraction_insn (insn, type, mode, extv_optab,
8534                                         extvmisalign_optab, 3);
8535
8536     case EP_extzv:
8537       if (HAVE_extzv
8538           && get_traditional_extraction_insn (insn, type, mode,
8539                                               CODE_FOR_extzv, 1, 0))
8540         return true;
8541       return get_optab_extraction_insn (insn, type, mode, extzv_optab,
8542                                         extzvmisalign_optab, 3);
8543
8544     default:
8545       gcc_unreachable ();
8546     }
8547 }
8548
8549 /* Return true if an instruction exists to access a field of mode
8550    FIELDMODE in a structure that has STRUCT_BITS significant bits.
8551    Describe the "best" such instruction in *INSN if so.  PATTERN and
8552    TYPE describe the type of insertion or extraction we want to perform.
8553
8554    For an insertion, the number of significant structure bits includes
8555    all bits of the target.  For an extraction, it need only include the
8556    most significant bit of the field.  Larger widths are acceptable
8557    in both cases.  */
8558
8559 static bool
8560 get_best_extraction_insn (extraction_insn *insn,
8561                           enum extraction_pattern pattern,
8562                           enum extraction_type type,
8563                           unsigned HOST_WIDE_INT struct_bits,
8564                           machine_mode field_mode)
8565 {
8566   machine_mode mode = smallest_mode_for_size (struct_bits, MODE_INT);
8567   while (mode != VOIDmode)
8568     {
8569       if (get_extraction_insn (insn, pattern, type, mode))
8570         {
8571           while (mode != VOIDmode
8572                  && GET_MODE_SIZE (mode) <= GET_MODE_SIZE (field_mode)
8573                  && !TRULY_NOOP_TRUNCATION_MODES_P (insn->field_mode,
8574                                                     field_mode))
8575             {
8576               get_extraction_insn (insn, pattern, type, mode);
8577               mode = GET_MODE_WIDER_MODE (mode);
8578             }
8579           return true;
8580         }
8581       mode = GET_MODE_WIDER_MODE (mode);
8582     }
8583   return false;
8584 }
8585
8586 /* Return true if an instruction exists to access a field of mode
8587    FIELDMODE in a register structure that has STRUCT_BITS significant bits.
8588    Describe the "best" such instruction in *INSN if so.  PATTERN describes
8589    the type of insertion or extraction we want to perform.
8590
8591    For an insertion, the number of significant structure bits includes
8592    all bits of the target.  For an extraction, it need only include the
8593    most significant bit of the field.  Larger widths are acceptable
8594    in both cases.  */
8595
8596 bool
8597 get_best_reg_extraction_insn (extraction_insn *insn,
8598                               enum extraction_pattern pattern,
8599                               unsigned HOST_WIDE_INT struct_bits,
8600                               machine_mode field_mode)
8601 {
8602   return get_best_extraction_insn (insn, pattern, ET_reg, struct_bits,
8603                                    field_mode);
8604 }
8605
8606 /* Return true if an instruction exists to access a field of BITSIZE
8607    bits starting BITNUM bits into a memory structure.  Describe the
8608    "best" such instruction in *INSN if so.  PATTERN describes the type
8609    of insertion or extraction we want to perform and FIELDMODE is the
8610    natural mode of the extracted field.
8611
8612    The instructions considered here only access bytes that overlap
8613    the bitfield; they do not touch any surrounding bytes.  */
8614
8615 bool
8616 get_best_mem_extraction_insn (extraction_insn *insn,
8617                               enum extraction_pattern pattern,
8618                               HOST_WIDE_INT bitsize, HOST_WIDE_INT bitnum,
8619                               machine_mode field_mode)
8620 {
8621   unsigned HOST_WIDE_INT struct_bits = (bitnum % BITS_PER_UNIT
8622                                         + bitsize
8623                                         + BITS_PER_UNIT - 1);
8624   struct_bits -= struct_bits % BITS_PER_UNIT;
8625   return get_best_extraction_insn (insn, pattern, ET_unaligned_mem,
8626                                    struct_bits, field_mode);
8627 }
8628
8629 /* Determine whether "1 << x" is relatively cheap in word_mode.  */
8630
8631 bool
8632 lshift_cheap_p (bool speed_p)
8633 {
8634   /* FIXME: This should be made target dependent via this "this_target"
8635      mechanism, similar to e.g. can_copy_init_p in gcse.c.  */
8636   static bool init[2] = { false, false };
8637   static bool cheap[2] = { true, true };
8638
8639   /* If the targer has no lshift in word_mode, the operation will most
8640      probably not be cheap.  ??? Does GCC even work for such targets?  */
8641   if (optab_handler (ashl_optab, word_mode) == CODE_FOR_nothing)
8642     return false;
8643
8644   if (!init[speed_p])
8645     {
8646       rtx reg = gen_raw_REG (word_mode, 10000);
8647       int cost = set_src_cost (gen_rtx_ASHIFT (word_mode, const1_rtx, reg),
8648                                speed_p);
8649       cheap[speed_p] = cost < COSTS_N_INSNS (3);
8650       init[speed_p] = true;
8651     }
8652
8653   return cheap[speed_p];
8654 }
8655
8656 #include "gt-optabs.h"