gcc-4_9-branch/gcc/optabs.c

   1 /* Expand the basic unary and binary arithmetic operations, for GNU compiler.
   2    Copyright (C) 1987-2014 Free Software Foundation, Inc.
   3
   4 This file is part of GCC.
   5
   6 GCC is free software; you can redistribute it and/or modify it under
   7 the terms of the GNU General Public License as published by the Free
   8 Software Foundation; either version 3, or (at your option) any later
   9 version.
  10
  11 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  13 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  14 for more details.
  15
  16 You should have received a copy of the GNU General Public License
  17 along with GCC; see the file COPYING3.  If not see
  18 <http://www.gnu.org/licenses/>.  */
  19
  20
  21 #include "config.h"
  22 #include "system.h"
  23 #include "coretypes.h"
  24 #include "tm.h"
  25 #include "diagnostic-core.h"
  26
  27 /* Include insn-config.h before expr.h so that HAVE_conditional_move
  28    is properly defined.  */
  29 #include "insn-config.h"
  30 #include "rtl.h"
  31 #include "tree.h"
  32 #include "stor-layout.h"
  33 #include "stringpool.h"
  34 #include "varasm.h"
  35 #include "tm_p.h"
  36 #include "flags.h"
  37 #include "function.h"
  38 #include "except.h"
  39 #include "expr.h"
  40 #include "optabs.h"
  41 #include "libfuncs.h"
  42 #include "recog.h"
  43 #include "reload.h"
  44 #include "ggc.h"
  45 #include "basic-block.h"
  46 #include "target.h"
  47
  48 struct target_optabs default_target_optabs;
  49 struct target_libfuncs default_target_libfuncs;
  50 struct target_optabs *this_fn_optabs = &default_target_optabs;
  51 #if SWITCHABLE_TARGET
  52 struct target_optabs *this_target_optabs = &default_target_optabs;
  53 struct target_libfuncs *this_target_libfuncs = &default_target_libfuncs;
  54 #endif
  55
  56 #define libfunc_hash \
  57   (this_target_libfuncs->x_libfunc_hash)
  58
  59 static void prepare_float_lib_cmp (rtx, rtx, enum rtx_code, rtx *,
  60                                    enum machine_mode *);
  61 static rtx expand_unop_direct (enum machine_mode, optab, rtx, rtx, int);
  62 static void emit_libcall_block_1 (rtx, rtx, rtx, rtx, bool);
  63
  64 /* Debug facility for use in GDB.  */
  65 void debug_optab_libfuncs (void);
  66
  67 /* Prefixes for the current version of decimal floating point (BID vs. DPD) */
  68 #if ENABLE_DECIMAL_BID_FORMAT
  69 #define DECIMAL_PREFIX "bid_"
  70 #else
  71 #define DECIMAL_PREFIX "dpd_"
  72 #endif
  73 \f
  74 /* Used for libfunc_hash.  */
  75
  76 static hashval_t
  77 hash_libfunc (const void *p)
  78 {
  79   const struct libfunc_entry *const e = (const struct libfunc_entry *) p;
  80   return ((e->mode1 + e->mode2 * NUM_MACHINE_MODES) ^ e->op);
  81 }
  82
  83 /* Used for libfunc_hash.  */
  84
  85 static int
  86 eq_libfunc (const void *p, const void *q)
  87 {
  88   const struct libfunc_entry *const e1 = (const struct libfunc_entry *) p;
  89   const struct libfunc_entry *const e2 = (const struct libfunc_entry *) q;
  90   return e1->op == e2->op && e1->mode1 == e2->mode1 && e1->mode2 == e2->mode2;
  91 }
  92
  93 /* Return libfunc corresponding operation defined by OPTAB converting
  94    from MODE2 to MODE1.  Trigger lazy initialization if needed, return NULL
  95    if no libfunc is available.  */
  96 rtx
  97 convert_optab_libfunc (convert_optab optab, enum machine_mode mode1,
  98                        enum machine_mode mode2)
  99 {
 100   struct libfunc_entry e;
 101   struct libfunc_entry **slot;
 102
 103   /* ??? This ought to be an assert, but not all of the places
 104      that we expand optabs know about the optabs that got moved
 105      to being direct.  */
 106   if (!(optab >= FIRST_CONV_OPTAB && optab <= LAST_CONVLIB_OPTAB))
 107     return NULL_RTX;
 108
 109   e.op = optab;
 110   e.mode1 = mode1;
 111   e.mode2 = mode2;
 112   slot = (struct libfunc_entry **)
 113     htab_find_slot (libfunc_hash, &e, NO_INSERT);
 114   if (!slot)
 115     {
 116       const struct convert_optab_libcall_d *d
 117         = &convlib_def[optab - FIRST_CONV_OPTAB];
 118
 119       if (d->libcall_gen == NULL)
 120         return NULL;
 121
 122       d->libcall_gen (optab, d->libcall_basename, mode1, mode2);
 123       slot = (struct libfunc_entry **)
 124         htab_find_slot (libfunc_hash, &e, NO_INSERT);
 125       if (!slot)
 126         return NULL;
 127     }
 128   return (*slot)->libfunc;
 129 }
 130
 131 /* Return libfunc corresponding operation defined by OPTAB in MODE.
 132    Trigger lazy initialization if needed, return NULL if no libfunc is
 133    available.  */
 134 rtx
 135 optab_libfunc (optab optab, enum machine_mode mode)
 136 {
 137   struct libfunc_entry e;
 138   struct libfunc_entry **slot;
 139
 140   /* ??? This ought to be an assert, but not all of the places
 141      that we expand optabs know about the optabs that got moved
 142      to being direct.  */
 143   if (!(optab >= FIRST_NORM_OPTAB && optab <= LAST_NORMLIB_OPTAB))
 144     return NULL_RTX;
 145
 146   e.op = optab;
 147   e.mode1 = mode;
 148   e.mode2 = VOIDmode;
 149   slot = (struct libfunc_entry **)
 150     htab_find_slot (libfunc_hash, &e, NO_INSERT);
 151   if (!slot)
 152     {
 153       const struct optab_libcall_d *d
 154         = &normlib_def[optab - FIRST_NORM_OPTAB];
 155
 156       if (d->libcall_gen == NULL)
 157         return NULL;
 158
 159       d->libcall_gen (optab, d->libcall_basename, d->libcall_suffix, mode);
 160       slot = (struct libfunc_entry **)
 161         htab_find_slot (libfunc_hash, &e, NO_INSERT);
 162       if (!slot)
 163         return NULL;
 164     }
 165   return (*slot)->libfunc;
 166 }
 167
 168 \f
 169 /* Add a REG_EQUAL note to the last insn in INSNS.  TARGET is being set to
 170    the result of operation CODE applied to OP0 (and OP1 if it is a binary
 171    operation).
 172
 173    If the last insn does not set TARGET, don't do anything, but return 1.
 174
 175    If the last insn or a previous insn sets TARGET and TARGET is one of OP0
 176    or OP1, don't add the REG_EQUAL note but return 0.  Our caller can then
 177    try again, ensuring that TARGET is not one of the operands.  */
 178
 179 static int
 180 add_equal_note (rtx insns, rtx target, enum rtx_code code, rtx op0, rtx op1)
 181 {
 182   rtx last_insn, set;
 183   rtx note;
 184
 185   gcc_assert (insns && INSN_P (insns) && NEXT_INSN (insns));
 186
 187   if (GET_RTX_CLASS (code) != RTX_COMM_ARITH
 188       && GET_RTX_CLASS (code) != RTX_BIN_ARITH
 189       && GET_RTX_CLASS (code) != RTX_COMM_COMPARE
 190       && GET_RTX_CLASS (code) != RTX_COMPARE
 191       && GET_RTX_CLASS (code) != RTX_UNARY)
 192     return 1;
 193
 194   if (GET_CODE (target) == ZERO_EXTRACT)
 195     return 1;
 196
 197   for (last_insn = insns;
 198        NEXT_INSN (last_insn) != NULL_RTX;
 199        last_insn = NEXT_INSN (last_insn))
 200     ;
 201
 202   /* If TARGET is in OP0 or OP1, punt.  We'd end up with a note referencing
 203      a value changing in the insn, so the note would be invalid for CSE.  */
 204   if (reg_overlap_mentioned_p (target, op0)
 205       || (op1 && reg_overlap_mentioned_p (target, op1)))
 206     {
 207       if (MEM_P (target)
 208           && (rtx_equal_p (target, op0)
 209               || (op1 && rtx_equal_p (target, op1))))
 210         {
 211           /* For MEM target, with MEM = MEM op X, prefer no REG_EQUAL note
 212              over expanding it as temp = MEM op X, MEM = temp.  If the target
 213              supports MEM = MEM op X instructions, it is sometimes too hard
 214              to reconstruct that form later, especially if X is also a memory,
 215              and due to multiple occurrences of addresses the address might
 216              be forced into register unnecessarily.
 217              Note that not emitting the REG_EQUIV note might inhibit
 218              CSE in some cases.  */
 219           set = single_set (last_insn);
 220           if (set
 221               && GET_CODE (SET_SRC (set)) == code
 222               && MEM_P (SET_DEST (set))
 223               && (rtx_equal_p (SET_DEST (set), XEXP (SET_SRC (set), 0))
 224                   || (op1 && rtx_equal_p (SET_DEST (set),
 225                                           XEXP (SET_SRC (set), 1)))))
 226             return 1;
 227         }
 228       return 0;
 229     }
 230
 231   set = single_set (last_insn);
 232   if (set == NULL_RTX)
 233     return 1;
 234
 235   if (! rtx_equal_p (SET_DEST (set), target)
 236       /* For a STRICT_LOW_PART, the REG_NOTE applies to what is inside it.  */
 237       && (GET_CODE (SET_DEST (set)) != STRICT_LOW_PART
 238           || ! rtx_equal_p (XEXP (SET_DEST (set), 0), target)))
 239     return 1;
 240
 241   if (GET_RTX_CLASS (code) == RTX_UNARY)
 242     switch (code)
 243       {
 244       case FFS:
 245       case CLZ:
 246       case CTZ:
 247       case CLRSB:
 248       case POPCOUNT:
 249       case PARITY:
 250       case BSWAP:
 251         if (GET_MODE (op0) != VOIDmode && GET_MODE (target) != GET_MODE (op0))
 252           {
 253             note = gen_rtx_fmt_e (code, GET_MODE (op0), copy_rtx (op0));
 254             if (GET_MODE_SIZE (GET_MODE (op0))
 255                 > GET_MODE_SIZE (GET_MODE (target)))
 256               note = simplify_gen_unary (TRUNCATE, GET_MODE (target),
 257                                          note, GET_MODE (op0));
 258             else
 259               note = simplify_gen_unary (ZERO_EXTEND, GET_MODE (target),
 260                                          note, GET_MODE (op0));
 261             break;
 262           }
 263         /* FALLTHRU */
 264       default:
 265         note = gen_rtx_fmt_e (code, GET_MODE (target), copy_rtx (op0));
 266         break;
 267       }
 268   else
 269     note = gen_rtx_fmt_ee (code, GET_MODE (target), copy_rtx (op0), copy_rtx (op1));
 270
 271   set_unique_reg_note (last_insn, REG_EQUAL, note);
 272
 273   return 1;
 274 }
 275 \f
 276 /* Given two input operands, OP0 and OP1, determine what the correct from_mode
 277    for a widening operation would be.  In most cases this would be OP0, but if
 278    that's a constant it'll be VOIDmode, which isn't useful.  */
 279
 280 static enum machine_mode
 281 widened_mode (enum machine_mode to_mode, rtx op0, rtx op1)
 282 {
 283   enum machine_mode m0 = GET_MODE (op0);
 284   enum machine_mode m1 = GET_MODE (op1);
 285   enum machine_mode result;
 286
 287   if (m0 == VOIDmode && m1 == VOIDmode)
 288     return to_mode;
 289   else if (m0 == VOIDmode || GET_MODE_SIZE (m0) < GET_MODE_SIZE (m1))
 290     result = m1;
 291   else
 292     result = m0;
 293
 294   if (GET_MODE_SIZE (result) > GET_MODE_SIZE (to_mode))
 295     return to_mode;
 296
 297   return result;
 298 }
 299 \f
 300 /* Find a widening optab even if it doesn't widen as much as we want.
 301    E.g. if from_mode is HImode, and to_mode is DImode, and there is no
 302    direct HI->SI insn, then return SI->DI, if that exists.
 303    If PERMIT_NON_WIDENING is non-zero then this can be used with
 304    non-widening optabs also.  */
 305
 306 enum insn_code
 307 find_widening_optab_handler_and_mode (optab op, enum machine_mode to_mode,
 308                                       enum machine_mode from_mode,
 309                                       int permit_non_widening,
 310                                       enum machine_mode *found_mode)
 311 {
 312   for (; (permit_non_widening || from_mode != to_mode)
 313          && GET_MODE_SIZE (from_mode) <= GET_MODE_SIZE (to_mode)
 314          && from_mode != VOIDmode;
 315        from_mode = GET_MODE_WIDER_MODE (from_mode))
 316     {
 317       enum insn_code handler = widening_optab_handler (op, to_mode,
 318                                                        from_mode);
 319
 320       if (handler != CODE_FOR_nothing)
 321         {
 322           if (found_mode)
 323             *found_mode = from_mode;
 324           return handler;
 325         }
 326     }
 327
 328   return CODE_FOR_nothing;
 329 }
 330 \f
 331 /* Widen OP to MODE and return the rtx for the widened operand.  UNSIGNEDP
 332    says whether OP is signed or unsigned.  NO_EXTEND is nonzero if we need
 333    not actually do a sign-extend or zero-extend, but can leave the
 334    higher-order bits of the result rtx undefined, for example, in the case
 335    of logical operations, but not right shifts.  */
 336
 337 static rtx
 338 widen_operand (rtx op, enum machine_mode mode, enum machine_mode oldmode,
 339                int unsignedp, int no_extend)
 340 {
 341   rtx result;
 342
 343   /* If we don't have to extend and this is a constant, return it.  */
 344   if (no_extend && GET_MODE (op) == VOIDmode)
 345     return op;
 346
 347   /* If we must extend do so.  If OP is a SUBREG for a promoted object, also
 348      extend since it will be more efficient to do so unless the signedness of
 349      a promoted object differs from our extension.  */
 350   if (! no_extend
 351       || (GET_CODE (op) == SUBREG && SUBREG_PROMOTED_VAR_P (op)
 352           && SUBREG_PROMOTED_UNSIGNED_P (op) == unsignedp))
 353     return convert_modes (mode, oldmode, op, unsignedp);
 354
 355   /* If MODE is no wider than a single word, we return a lowpart or paradoxical
 356      SUBREG.  */
 357   if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
 358     return gen_lowpart (mode, force_reg (GET_MODE (op), op));
 359
 360   /* Otherwise, get an object of MODE, clobber it, and set the low-order
 361      part to OP.  */
 362
 363   result = gen_reg_rtx (mode);
 364   emit_clobber (result);
 365   emit_move_insn (gen_lowpart (GET_MODE (op), result), op);
 366   return result;
 367 }
 368 \f
 369 /* Return the optab used for computing the operation given by the tree code,
 370    CODE and the tree EXP.  This function is not always usable (for example, it
 371    cannot give complete results for multiplication or division) but probably
 372    ought to be relied on more widely throughout the expander.  */
 373 optab
 374 optab_for_tree_code (enum tree_code code, const_tree type,
 375                      enum optab_subtype subtype)
 376 {
 377   bool trapv;
 378   switch (code)
 379     {
 380     case BIT_AND_EXPR:
 381       return and_optab;
 382
 383     case BIT_IOR_EXPR:
 384       return ior_optab;
 385
 386     case BIT_NOT_EXPR:
 387       return one_cmpl_optab;
 388
 389     case BIT_XOR_EXPR:
 390       return xor_optab;
 391
 392     case MULT_HIGHPART_EXPR:
 393       return TYPE_UNSIGNED (type) ? umul_highpart_optab : smul_highpart_optab;
 394
 395     case TRUNC_MOD_EXPR:
 396     case CEIL_MOD_EXPR:
 397     case FLOOR_MOD_EXPR:
 398     case ROUND_MOD_EXPR:
 399       return TYPE_UNSIGNED (type) ? umod_optab : smod_optab;
 400
 401     case RDIV_EXPR:
 402     case TRUNC_DIV_EXPR:
 403     case CEIL_DIV_EXPR:
 404     case FLOOR_DIV_EXPR:
 405     case ROUND_DIV_EXPR:
 406     case EXACT_DIV_EXPR:
 407       if (TYPE_SATURATING (type))
 408         return TYPE_UNSIGNED (type) ? usdiv_optab : ssdiv_optab;
 409       return TYPE_UNSIGNED (type) ? udiv_optab : sdiv_optab;
 410
 411     case LSHIFT_EXPR:
 412       if (TREE_CODE (type) == VECTOR_TYPE)
 413         {
 414           if (subtype == optab_vector)
 415             return TYPE_SATURATING (type) ? unknown_optab : vashl_optab;
 416
 417           gcc_assert (subtype == optab_scalar);
 418         }
 419       if (TYPE_SATURATING (type))
 420         return TYPE_UNSIGNED (type) ? usashl_optab : ssashl_optab;
 421       return ashl_optab;
 422
 423     case RSHIFT_EXPR:
 424       if (TREE_CODE (type) == VECTOR_TYPE)
 425         {
 426           if (subtype == optab_vector)
 427             return TYPE_UNSIGNED (type) ? vlshr_optab : vashr_optab;
 428
 429           gcc_assert (subtype == optab_scalar);
 430         }
 431       return TYPE_UNSIGNED (type) ? lshr_optab : ashr_optab;
 432
 433     case LROTATE_EXPR:
 434       if (TREE_CODE (type) == VECTOR_TYPE)
 435         {
 436           if (subtype == optab_vector)
 437             return vrotl_optab;
 438
 439           gcc_assert (subtype == optab_scalar);
 440         }
 441       return rotl_optab;
 442
 443     case RROTATE_EXPR:
 444       if (TREE_CODE (type) == VECTOR_TYPE)
 445         {
 446           if (subtype == optab_vector)
 447             return vrotr_optab;
 448
 449           gcc_assert (subtype == optab_scalar);
 450         }
 451       return rotr_optab;
 452
 453     case MAX_EXPR:
 454       return TYPE_UNSIGNED (type) ? umax_optab : smax_optab;
 455
 456     case MIN_EXPR:
 457       return TYPE_UNSIGNED (type) ? umin_optab : smin_optab;
 458
 459     case REALIGN_LOAD_EXPR:
 460       return vec_realign_load_optab;
 461
 462     case WIDEN_SUM_EXPR:
 463       return TYPE_UNSIGNED (type) ? usum_widen_optab : ssum_widen_optab;
 464
 465     case DOT_PROD_EXPR:
 466       return TYPE_UNSIGNED (type) ? udot_prod_optab : sdot_prod_optab;
 467
 468     case WIDEN_MULT_PLUS_EXPR:
 469       return (TYPE_UNSIGNED (type)
 470               ? (TYPE_SATURATING (type)
 471                  ? usmadd_widen_optab : umadd_widen_optab)
 472               : (TYPE_SATURATING (type)
 473                  ? ssmadd_widen_optab : smadd_widen_optab));
 474
 475     case WIDEN_MULT_MINUS_EXPR:
 476       return (TYPE_UNSIGNED (type)
 477               ? (TYPE_SATURATING (type)
 478                  ? usmsub_widen_optab : umsub_widen_optab)
 479               : (TYPE_SATURATING (type)
 480                  ? ssmsub_widen_optab : smsub_widen_optab));
 481
 482     case FMA_EXPR:
 483       return fma_optab;
 484
 485     case REDUC_MAX_EXPR:
 486       return TYPE_UNSIGNED (type)
 487              ? reduc_umax_scal_optab : reduc_smax_scal_optab;
 488
 489     case REDUC_MIN_EXPR:
 490       return TYPE_UNSIGNED (type)
 491              ? reduc_umin_scal_optab : reduc_smin_scal_optab;
 492
 493     case REDUC_PLUS_EXPR:
 494       return reduc_plus_scal_optab;
 495
 496     case VEC_RSHIFT_EXPR:
 497       return vec_shr_optab;
 498
 499     case VEC_WIDEN_MULT_HI_EXPR:
 500       return TYPE_UNSIGNED (type) ?
 501         vec_widen_umult_hi_optab : vec_widen_smult_hi_optab;
 502
 503     case VEC_WIDEN_MULT_LO_EXPR:
 504       return TYPE_UNSIGNED (type) ?
 505         vec_widen_umult_lo_optab : vec_widen_smult_lo_optab;
 506
 507     case VEC_WIDEN_MULT_EVEN_EXPR:
 508       return TYPE_UNSIGNED (type) ?
 509         vec_widen_umult_even_optab : vec_widen_smult_even_optab;
 510
 511     case VEC_WIDEN_MULT_ODD_EXPR:
 512       return TYPE_UNSIGNED (type) ?
 513         vec_widen_umult_odd_optab : vec_widen_smult_odd_optab;
 514
 515     case VEC_WIDEN_LSHIFT_HI_EXPR:
 516       return TYPE_UNSIGNED (type) ?
 517         vec_widen_ushiftl_hi_optab : vec_widen_sshiftl_hi_optab;
 518
 519     case VEC_WIDEN_LSHIFT_LO_EXPR:
 520       return TYPE_UNSIGNED (type) ?
 521         vec_widen_ushiftl_lo_optab : vec_widen_sshiftl_lo_optab;
 522
 523     case VEC_UNPACK_HI_EXPR:
 524       return TYPE_UNSIGNED (type) ?
 525         vec_unpacku_hi_optab : vec_unpacks_hi_optab;
 526
 527     case VEC_UNPACK_LO_EXPR:
 528       return TYPE_UNSIGNED (type) ?
 529         vec_unpacku_lo_optab : vec_unpacks_lo_optab;
 530
 531     case VEC_UNPACK_FLOAT_HI_EXPR:
 532       /* The signedness is determined from input operand.  */
 533       return TYPE_UNSIGNED (type) ?
 534         vec_unpacku_float_hi_optab : vec_unpacks_float_hi_optab;
 535
 536     case VEC_UNPACK_FLOAT_LO_EXPR:
 537       /* The signedness is determined from input operand.  */
 538       return TYPE_UNSIGNED (type) ?
 539         vec_unpacku_float_lo_optab : vec_unpacks_float_lo_optab;
 540
 541     case VEC_PACK_TRUNC_EXPR:
 542       return vec_pack_trunc_optab;
 543
 544     case VEC_PACK_SAT_EXPR:
 545       return TYPE_UNSIGNED (type) ? vec_pack_usat_optab : vec_pack_ssat_optab;
 546
 547     case VEC_PACK_FIX_TRUNC_EXPR:
 548       /* The signedness is determined from output operand.  */
 549       return TYPE_UNSIGNED (type) ?
 550         vec_pack_ufix_trunc_optab : vec_pack_sfix_trunc_optab;
 551
 552     default:
 553       break;
 554     }
 555
 556   trapv = INTEGRAL_TYPE_P (type) && TYPE_OVERFLOW_TRAPS (type);
 557   switch (code)
 558     {
 559     case POINTER_PLUS_EXPR:
 560     case PLUS_EXPR:
 561       if (TYPE_SATURATING (type))
 562         return TYPE_UNSIGNED (type) ? usadd_optab : ssadd_optab;
 563       return trapv ? addv_optab : add_optab;
 564
 565     case MINUS_EXPR:
 566       if (TYPE_SATURATING (type))
 567         return TYPE_UNSIGNED (type) ? ussub_optab : sssub_optab;
 568       return trapv ? subv_optab : sub_optab;
 569
 570     case MULT_EXPR:
 571       if (TYPE_SATURATING (type))
 572         return TYPE_UNSIGNED (type) ? usmul_optab : ssmul_optab;
 573       return trapv ? smulv_optab : smul_optab;
 574
 575     case NEGATE_EXPR:
 576       if (TYPE_SATURATING (type))
 577         return TYPE_UNSIGNED (type) ? usneg_optab : ssneg_optab;
 578       return trapv ? negv_optab : neg_optab;
 579
 580     case ABS_EXPR:
 581       return trapv ? absv_optab : abs_optab;
 582
 583     default:
 584       return unknown_optab;
 585     }
 586 }
 587
 588 /* Given optab UNOPTAB that reduces a vector to a scalar, find instead the old
 589    optab that produces a vector with the reduction result in one element,
 590    for a tree with type TYPE.  */
 591
 592 optab
 593 scalar_reduc_to_vector (optab unoptab, const_tree type)
 594 {
 595   switch (unoptab)
 596     {
 597     case reduc_plus_scal_optab:
 598       return TYPE_UNSIGNED (type) ? reduc_uplus_optab : reduc_splus_optab;
 599
 600     case reduc_smin_scal_optab: return reduc_smin_optab;
 601     case reduc_umin_scal_optab: return reduc_umin_optab;
 602     case reduc_smax_scal_optab: return reduc_smax_optab;
 603     case reduc_umax_scal_optab: return reduc_umax_optab;
 604     default: return unknown_optab;
 605     }
 606 }
 607
 608 /* Expand vector widening operations.
 609
 610    There are two different classes of operations handled here:
 611    1) Operations whose result is wider than all the arguments to the operation.
 612       Examples: VEC_UNPACK_HI/LO_EXPR, VEC_WIDEN_MULT_HI/LO_EXPR
 613       In this case OP0 and optionally OP1 would be initialized,
 614       but WIDE_OP wouldn't (not relevant for this case).
 615    2) Operations whose result is of the same size as the last argument to the
 616       operation, but wider than all the other arguments to the operation.
 617       Examples: WIDEN_SUM_EXPR, VEC_DOT_PROD_EXPR.
 618       In the case WIDE_OP, OP0 and optionally OP1 would be initialized.
 619
 620    E.g, when called to expand the following operations, this is how
 621    the arguments will be initialized:
 622                                 nops    OP0     OP1     WIDE_OP
 623    widening-sum                 2       oprnd0  -       oprnd1
 624    widening-dot-product         3       oprnd0  oprnd1  oprnd2
 625    widening-mult                2       oprnd0  oprnd1  -
 626    type-promotion (vec-unpack)  1       oprnd0  -       -  */
 627
 628 rtx
 629 expand_widen_pattern_expr (sepops ops, rtx op0, rtx op1, rtx wide_op,
 630                            rtx target, int unsignedp)
 631 {
 632   struct expand_operand eops[4];
 633   tree oprnd0, oprnd1, oprnd2;
 634   enum machine_mode wmode = VOIDmode, tmode0, tmode1 = VOIDmode;
 635   optab widen_pattern_optab;
 636   enum insn_code icode;
 637   int nops = TREE_CODE_LENGTH (ops->code);
 638   int op;
 639
 640   oprnd0 = ops->op0;
 641   tmode0 = TYPE_MODE (TREE_TYPE (oprnd0));
 642   widen_pattern_optab =
 643     optab_for_tree_code (ops->code, TREE_TYPE (oprnd0), optab_default);
 644   if (ops->code == WIDEN_MULT_PLUS_EXPR
 645       || ops->code == WIDEN_MULT_MINUS_EXPR)
 646     icode = find_widening_optab_handler (widen_pattern_optab,
 647                                          TYPE_MODE (TREE_TYPE (ops->op2)),
 648                                          tmode0, 0);
 649   else
 650     icode = optab_handler (widen_pattern_optab, tmode0);
 651   gcc_assert (icode != CODE_FOR_nothing);
 652
 653   if (nops >= 2)
 654     {
 655       oprnd1 = ops->op1;
 656       tmode1 = TYPE_MODE (TREE_TYPE (oprnd1));
 657     }
 658
 659   /* The last operand is of a wider mode than the rest of the operands.  */
 660   if (nops == 2)
 661     wmode = tmode1;
 662   else if (nops == 3)
 663     {
 664       gcc_assert (tmode1 == tmode0);
 665       gcc_assert (op1);
 666       oprnd2 = ops->op2;
 667       wmode = TYPE_MODE (TREE_TYPE (oprnd2));
 668     }
 669
 670   op = 0;
 671   create_output_operand (&eops[op++], target, TYPE_MODE (ops->type));
 672   create_convert_operand_from (&eops[op++], op0, tmode0, unsignedp);
 673   if (op1)
 674     create_convert_operand_from (&eops[op++], op1, tmode1, unsignedp);
 675   if (wide_op)
 676     create_convert_operand_from (&eops[op++], wide_op, wmode, unsignedp);
 677   expand_insn (icode, op, eops);
 678   return eops[0].value;
 679 }
 680
 681 /* Generate code to perform an operation specified by TERNARY_OPTAB
 682    on operands OP0, OP1 and OP2, with result having machine-mode MODE.
 683
 684    UNSIGNEDP is for the case where we have to widen the operands
 685    to perform the operation.  It says to use zero-extension.
 686
 687    If TARGET is nonzero, the value
 688    is generated there, if it is convenient to do so.
 689    In all cases an rtx is returned for the locus of the value;
 690    this may or may not be TARGET.  */
 691
 692 rtx
 693 expand_ternary_op (enum machine_mode mode, optab ternary_optab, rtx op0,
 694                    rtx op1, rtx op2, rtx target, int unsignedp)
 695 {
 696   struct expand_operand ops[4];
 697   enum insn_code icode = optab_handler (ternary_optab, mode);
 698
 699   gcc_assert (optab_handler (ternary_optab, mode) != CODE_FOR_nothing);
 700
 701   create_output_operand (&ops[0], target, mode);
 702   create_convert_operand_from (&ops[1], op0, mode, unsignedp);
 703   create_convert_operand_from (&ops[2], op1, mode, unsignedp);
 704   create_convert_operand_from (&ops[3], op2, mode, unsignedp);
 705   expand_insn (icode, 4, ops);
 706   return ops[0].value;
 707 }
 708
 709
 710 /* Like expand_binop, but return a constant rtx if the result can be
 711    calculated at compile time.  The arguments and return value are
 712    otherwise the same as for expand_binop.  */
 713
 714 rtx
 715 simplify_expand_binop (enum machine_mode mode, optab binoptab,
 716                        rtx op0, rtx op1, rtx target, int unsignedp,
 717                        enum optab_methods methods)
 718 {
 719   if (CONSTANT_P (op0) && CONSTANT_P (op1))
 720     {
 721       rtx x = simplify_binary_operation (optab_to_code (binoptab),
 722                                          mode, op0, op1);
 723       if (x)
 724         return x;
 725     }
 726
 727   return expand_binop (mode, binoptab, op0, op1, target, unsignedp, methods);
 728 }
 729
 730 /* Like simplify_expand_binop, but always put the result in TARGET.
 731    Return true if the expansion succeeded.  */
 732
 733 bool
 734 force_expand_binop (enum machine_mode mode, optab binoptab,
 735                     rtx op0, rtx op1, rtx target, int unsignedp,
 736                     enum optab_methods methods)
 737 {
 738   rtx x = simplify_expand_binop (mode, binoptab, op0, op1,
 739                                  target, unsignedp, methods);
 740   if (x == 0)
 741     return false;
 742   if (x != target)
 743     emit_move_insn (target, x);
 744   return true;
 745 }
 746
 747 /* Generate insns for VEC_RSHIFT_EXPR.  */
 748
 749 rtx
 750 expand_vec_shift_expr (sepops ops, rtx target)
 751 {
 752   struct expand_operand eops[3];
 753   enum insn_code icode;
 754   rtx rtx_op1, rtx_op2;
 755   enum machine_mode mode = TYPE_MODE (ops->type);
 756   tree vec_oprnd = ops->op0;
 757   tree shift_oprnd = ops->op1;
 758
 759   gcc_assert (ops->code == VEC_RSHIFT_EXPR);
 760
 761   icode = optab_handler (vec_shr_optab, mode);
 762   gcc_assert (icode != CODE_FOR_nothing);
 763
 764   rtx_op1 = expand_normal (vec_oprnd);
 765   rtx_op2 = expand_normal (shift_oprnd);
 766
 767   create_output_operand (&eops[0], target, mode);
 768   create_input_operand (&eops[1], rtx_op1, GET_MODE (rtx_op1));
 769   create_convert_operand_from_type (&eops[2], rtx_op2, TREE_TYPE (shift_oprnd));
 770   expand_insn (icode, 3, eops);
 771
 772   return eops[0].value;
 773 }
 774
 775 /* Create a new vector value in VMODE with all elements set to OP.  The
 776    mode of OP must be the element mode of VMODE.  If OP is a constant,
 777    then the return value will be a constant.  */
 778
 779 static rtx
 780 expand_vector_broadcast (enum machine_mode vmode, rtx op)
 781 {
 782   enum insn_code icode;
 783   rtvec vec;
 784   rtx ret;
 785   int i, n;
 786
 787   gcc_checking_assert (VECTOR_MODE_P (vmode));
 788
 789   n = GET_MODE_NUNITS (vmode);
 790   vec = rtvec_alloc (n);
 791   for (i = 0; i < n; ++i)
 792     RTVEC_ELT (vec, i) = op;
 793
 794   if (CONSTANT_P (op))
 795     return gen_rtx_CONST_VECTOR (vmode, vec);
 796
 797   /* ??? If the target doesn't have a vec_init, then we have no easy way
 798      of performing this operation.  Most of this sort of generic support
 799      is hidden away in the vector lowering support in gimple.  */
 800   icode = optab_handler (vec_init_optab, vmode);
 801   if (icode == CODE_FOR_nothing)
 802     return NULL;
 803
 804   ret = gen_reg_rtx (vmode);
 805   emit_insn (GEN_FCN (icode) (ret, gen_rtx_PARALLEL (vmode, vec)));
 806
 807   return ret;
 808 }
 809
 810 /* This subroutine of expand_doubleword_shift handles the cases in which
 811    the effective shift value is >= BITS_PER_WORD.  The arguments and return
 812    value are the same as for the parent routine, except that SUPERWORD_OP1
 813    is the shift count to use when shifting OUTOF_INPUT into INTO_TARGET.
 814    INTO_TARGET may be null if the caller has decided to calculate it.  */
 815
 816 static bool
 817 expand_superword_shift (optab binoptab, rtx outof_input, rtx superword_op1,
 818                         rtx outof_target, rtx into_target,
 819                         int unsignedp, enum optab_methods methods)
 820 {
 821   if (into_target != 0)
 822     if (!force_expand_binop (word_mode, binoptab, outof_input, superword_op1,
 823                              into_target, unsignedp, methods))
 824       return false;
 825
 826   if (outof_target != 0)
 827     {
 828       /* For a signed right shift, we must fill OUTOF_TARGET with copies
 829          of the sign bit, otherwise we must fill it with zeros.  */
 830       if (binoptab != ashr_optab)
 831         emit_move_insn (outof_target, CONST0_RTX (word_mode));
 832       else
 833         if (!force_expand_binop (word_mode, binoptab,
 834                                  outof_input, GEN_INT (BITS_PER_WORD - 1),
 835                                  outof_target, unsignedp, methods))
 836           return false;
 837     }
 838   return true;
 839 }
 840
 841 /* This subroutine of expand_doubleword_shift handles the cases in which
 842    the effective shift value is < BITS_PER_WORD.  The arguments and return
 843    value are the same as for the parent routine.  */
 844
 845 static bool
 846 expand_subword_shift (enum machine_mode op1_mode, optab binoptab,
 847                       rtx outof_input, rtx into_input, rtx op1,
 848                       rtx outof_target, rtx into_target,
 849                       int unsignedp, enum optab_methods methods,
 850                       unsigned HOST_WIDE_INT shift_mask)
 851 {
 852   optab reverse_unsigned_shift, unsigned_shift;
 853   rtx tmp, carries;
 854
 855   reverse_unsigned_shift = (binoptab == ashl_optab ? lshr_optab : ashl_optab);
 856   unsigned_shift = (binoptab == ashl_optab ? ashl_optab : lshr_optab);
 857
 858   /* The low OP1 bits of INTO_TARGET come from the high bits of OUTOF_INPUT.
 859      We therefore need to shift OUTOF_INPUT by (BITS_PER_WORD - OP1) bits in
 860      the opposite direction to BINOPTAB.  */
 861   if (CONSTANT_P (op1) || shift_mask >= BITS_PER_WORD)
 862     {
 863       carries = outof_input;
 864       tmp = immed_double_const (BITS_PER_WORD, 0, op1_mode);
 865       tmp = simplify_expand_binop (op1_mode, sub_optab, tmp, op1,
 866                                    0, true, methods);
 867     }
 868   else
 869     {
 870       /* We must avoid shifting by BITS_PER_WORD bits since that is either
 871          the same as a zero shift (if shift_mask == BITS_PER_WORD - 1) or
 872          has unknown behavior.  Do a single shift first, then shift by the
 873          remainder.  It's OK to use ~OP1 as the remainder if shift counts
 874          are truncated to the mode size.  */
 875       carries = expand_binop (word_mode, reverse_unsigned_shift,
 876                               outof_input, const1_rtx, 0, unsignedp, methods);
 877       if (shift_mask == BITS_PER_WORD - 1)
 878         {
 879           tmp = immed_double_const (-1, -1, op1_mode);
 880           tmp = simplify_expand_binop (op1_mode, xor_optab, op1, tmp,
 881                                        0, true, methods);
 882         }
 883       else
 884         {
 885           tmp = immed_double_const (BITS_PER_WORD - 1, 0, op1_mode);
 886           tmp = simplify_expand_binop (op1_mode, sub_optab, tmp, op1,
 887                                        0, true, methods);
 888         }
 889     }
 890   if (tmp == 0 || carries == 0)
 891     return false;
 892   carries = expand_binop (word_mode, reverse_unsigned_shift,
 893                           carries, tmp, 0, unsignedp, methods);
 894   if (carries == 0)
 895     return false;
 896
 897   /* Shift INTO_INPUT logically by OP1.  This is the last use of INTO_INPUT
 898      so the result can go directly into INTO_TARGET if convenient.  */
 899   tmp = expand_binop (word_mode, unsigned_shift, into_input, op1,
 900                       into_target, unsignedp, methods);
 901   if (tmp == 0)
 902     return false;
 903
 904   /* Now OR in the bits carried over from OUTOF_INPUT.  */
 905   if (!force_expand_binop (word_mode, ior_optab, tmp, carries,
 906                            into_target, unsignedp, methods))
 907     return false;
 908
 909   /* Use a standard word_mode shift for the out-of half.  */
 910   if (outof_target != 0)
 911     if (!force_expand_binop (word_mode, binoptab, outof_input, op1,
 912                              outof_target, unsignedp, methods))
 913       return false;
 914
 915   return true;
 916 }
 917
 918
 919 #ifdef HAVE_conditional_move
 920 /* Try implementing expand_doubleword_shift using conditional moves.
 921    The shift is by < BITS_PER_WORD if (CMP_CODE CMP1 CMP2) is true,
 922    otherwise it is by >= BITS_PER_WORD.  SUBWORD_OP1 and SUPERWORD_OP1
 923    are the shift counts to use in the former and latter case.  All other
 924    arguments are the same as the parent routine.  */
 925
 926 static bool
 927 expand_doubleword_shift_condmove (enum machine_mode op1_mode, optab binoptab,
 928                                   enum rtx_code cmp_code, rtx cmp1, rtx cmp2,
 929                                   rtx outof_input, rtx into_input,
 930                                   rtx subword_op1, rtx superword_op1,
 931                                   rtx outof_target, rtx into_target,
 932                                   int unsignedp, enum optab_methods methods,
 933                                   unsigned HOST_WIDE_INT shift_mask)
 934 {
 935   rtx outof_superword, into_superword;
 936
 937   /* Put the superword version of the output into OUTOF_SUPERWORD and
 938      INTO_SUPERWORD.  */
 939   outof_superword = outof_target != 0 ? gen_reg_rtx (word_mode) : 0;
 940   if (outof_target != 0 && subword_op1 == superword_op1)
 941     {
 942       /* The value INTO_TARGET >> SUBWORD_OP1, which we later store in
 943          OUTOF_TARGET, is the same as the value of INTO_SUPERWORD.  */
 944       into_superword = outof_target;
 945       if (!expand_superword_shift (binoptab, outof_input, superword_op1,
 946                                    outof_superword, 0, unsignedp, methods))
 947         return false;
 948     }
 949   else
 950     {
 951       into_superword = gen_reg_rtx (word_mode);
 952       if (!expand_superword_shift (binoptab, outof_input, superword_op1,
 953                                    outof_superword, into_superword,
 954                                    unsignedp, methods))
 955         return false;
 956     }
 957
 958   /* Put the subword version directly in OUTOF_TARGET and INTO_TARGET.  */
 959   if (!expand_subword_shift (op1_mode, binoptab,
 960                              outof_input, into_input, subword_op1,
 961                              outof_target, into_target,
 962                              unsignedp, methods, shift_mask))
 963     return false;
 964
 965   /* Select between them.  Do the INTO half first because INTO_SUPERWORD
 966      might be the current value of OUTOF_TARGET.  */
 967   if (!emit_conditional_move (into_target, cmp_code, cmp1, cmp2, op1_mode,
 968                               into_target, into_superword, word_mode, false))
 969     return false;
 970
 971   if (outof_target != 0)
 972     if (!emit_conditional_move (outof_target, cmp_code, cmp1, cmp2, op1_mode,
 973                                 outof_target, outof_superword,
 974                                 word_mode, false))
 975       return false;
 976
 977   return true;
 978 }
 979 #endif
 980
 981 /* Expand a doubleword shift (ashl, ashr or lshr) using word-mode shifts.
 982    OUTOF_INPUT and INTO_INPUT are the two word-sized halves of the first
 983    input operand; the shift moves bits in the direction OUTOF_INPUT->
 984    INTO_TARGET.  OUTOF_TARGET and INTO_TARGET are the equivalent words
 985    of the target.  OP1 is the shift count and OP1_MODE is its mode.
 986    If OP1 is constant, it will have been truncated as appropriate
 987    and is known to be nonzero.
 988
 989    If SHIFT_MASK is zero, the result of word shifts is undefined when the
 990    shift count is outside the range [0, BITS_PER_WORD).  This routine must
 991    avoid generating such shifts for OP1s in the range [0, BITS_PER_WORD * 2).
 992
 993    If SHIFT_MASK is nonzero, all word-mode shift counts are effectively
 994    masked by it and shifts in the range [BITS_PER_WORD, SHIFT_MASK) will
 995    fill with zeros or sign bits as appropriate.
 996
 997    If SHIFT_MASK is BITS_PER_WORD - 1, this routine will synthesize
 998    a doubleword shift whose equivalent mask is BITS_PER_WORD * 2 - 1.
 999    Doing this preserves semantics required by SHIFT_COUNT_TRUNCATED.
1000    In all other cases, shifts by values outside [0, BITS_PER_UNIT * 2)
1001    are undefined.
1002
1003    BINOPTAB, UNSIGNEDP and METHODS are as for expand_binop.  This function
1004    may not use INTO_INPUT after modifying INTO_TARGET, and similarly for
1005    OUTOF_INPUT and OUTOF_TARGET.  OUTOF_TARGET can be null if the parent
1006    function wants to calculate it itself.
1007
1008    Return true if the shift could be successfully synthesized.  */
1009
1010 static bool
1011 expand_doubleword_shift (enum machine_mode op1_mode, optab binoptab,
1012                          rtx outof_input, rtx into_input, rtx op1,
1013                          rtx outof_target, rtx into_target,
1014                          int unsignedp, enum optab_methods methods,
1015                          unsigned HOST_WIDE_INT shift_mask)
1016 {
1017   rtx superword_op1, tmp, cmp1, cmp2;
1018   rtx subword_label, done_label;
1019   enum rtx_code cmp_code;
1020
1021   /* See if word-mode shifts by BITS_PER_WORD...BITS_PER_WORD * 2 - 1 will
1022      fill the result with sign or zero bits as appropriate.  If so, the value
1023      of OUTOF_TARGET will always be (SHIFT OUTOF_INPUT OP1).   Recursively call
1024      this routine to calculate INTO_TARGET (which depends on both OUTOF_INPUT
1025      and INTO_INPUT), then emit code to set up OUTOF_TARGET.
1026
1027      This isn't worthwhile for constant shifts since the optimizers will
1028      cope better with in-range shift counts.  */
1029   if (shift_mask >= BITS_PER_WORD
1030       && outof_target != 0
1031       && !CONSTANT_P (op1))
1032     {
1033       if (!expand_doubleword_shift (op1_mode, binoptab,
1034                                     outof_input, into_input, op1,
1035                                     0, into_target,
1036                                     unsignedp, methods, shift_mask))
1037         return false;
1038       if (!force_expand_binop (word_mode, binoptab, outof_input, op1,
1039                                outof_target, unsignedp, methods))
1040         return false;
1041       return true;
1042     }
1043
1044   /* Set CMP_CODE, CMP1 and CMP2 so that the rtx (CMP_CODE CMP1 CMP2)
1045      is true when the effective shift value is less than BITS_PER_WORD.
1046      Set SUPERWORD_OP1 to the shift count that should be used to shift
1047      OUTOF_INPUT into INTO_TARGET when the condition is false.  */
1048   tmp = immed_double_const (BITS_PER_WORD, 0, op1_mode);
1049   if (!CONSTANT_P (op1) && shift_mask == BITS_PER_WORD - 1)
1050     {
1051       /* Set CMP1 to OP1 & BITS_PER_WORD.  The result is zero iff OP1
1052          is a subword shift count.  */
1053       cmp1 = simplify_expand_binop (op1_mode, and_optab, op1, tmp,
1054                                     0, true, methods);
1055       cmp2 = CONST0_RTX (op1_mode);
1056       cmp_code = EQ;
1057       superword_op1 = op1;
1058     }
1059   else
1060     {
1061       /* Set CMP1 to OP1 - BITS_PER_WORD.  */
1062       cmp1 = simplify_expand_binop (op1_mode, sub_optab, op1, tmp,
1063                                     0, true, methods);
1064       cmp2 = CONST0_RTX (op1_mode);
1065       cmp_code = LT;
1066       superword_op1 = cmp1;
1067     }
1068   if (cmp1 == 0)
1069     return false;
1070
1071   /* If we can compute the condition at compile time, pick the
1072      appropriate subroutine.  */
1073   tmp = simplify_relational_operation (cmp_code, SImode, op1_mode, cmp1, cmp2);
1074   if (tmp != 0 && CONST_INT_P (tmp))
1075     {
1076       if (tmp == const0_rtx)
1077         return expand_superword_shift (binoptab, outof_input, superword_op1,
1078                                        outof_target, into_target,
1079                                        unsignedp, methods);
1080       else
1081         return expand_subword_shift (op1_mode, binoptab,
1082                                      outof_input, into_input, op1,
1083                                      outof_target, into_target,
1084                                      unsignedp, methods, shift_mask);
1085     }
1086
1087 #ifdef HAVE_conditional_move
1088   /* Try using conditional moves to generate straight-line code.  */
1089   {
1090     rtx start = get_last_insn ();
1091     if (expand_doubleword_shift_condmove (op1_mode, binoptab,
1092                                           cmp_code, cmp1, cmp2,
1093                                           outof_input, into_input,
1094                                           op1, superword_op1,
1095                                           outof_target, into_target,
1096                                           unsignedp, methods, shift_mask))
1097       return true;
1098     delete_insns_since (start);
1099   }
1100 #endif
1101
1102   /* As a last resort, use branches to select the correct alternative.  */
1103   subword_label = gen_label_rtx ();
1104   done_label = gen_label_rtx ();
1105
1106   NO_DEFER_POP;
1107   do_compare_rtx_and_jump (cmp1, cmp2, cmp_code, false, op1_mode,
1108                            0, 0, subword_label, -1);
1109   OK_DEFER_POP;
1110
1111   if (!expand_superword_shift (binoptab, outof_input, superword_op1,
1112                                outof_target, into_target,
1113                                unsignedp, methods))
1114     return false;
1115
1116   emit_jump_insn (gen_jump (done_label));
1117   emit_barrier ();
1118   emit_label (subword_label);
1119
1120   if (!expand_subword_shift (op1_mode, binoptab,
1121                              outof_input, into_input, op1,
1122                              outof_target, into_target,
1123                              unsignedp, methods, shift_mask))
1124     return false;
1125
1126   emit_label (done_label);
1127   return true;
1128 }
1129 \f
1130 /* Subroutine of expand_binop.  Perform a double word multiplication of
1131    operands OP0 and OP1 both of mode MODE, which is exactly twice as wide
1132    as the target's word_mode.  This function return NULL_RTX if anything
1133    goes wrong, in which case it may have already emitted instructions
1134    which need to be deleted.
1135
1136    If we want to multiply two two-word values and have normal and widening
1137    multiplies of single-word values, we can do this with three smaller
1138    multiplications.
1139
1140    The multiplication proceeds as follows:
1141                                  _______________________
1142                                 [__op0_high_|__op0_low__]
1143                                  _______________________
1144         *                       [__op1_high_|__op1_low__]
1145         _______________________________________________
1146                                  _______________________
1147     (1)                         [__op0_low__*__op1_low__]
1148                      _______________________
1149     (2a)            [__op0_low__*__op1_high_]
1150                      _______________________
1151     (2b)            [__op0_high_*__op1_low__]
1152          _______________________
1153     (3) [__op0_high_*__op1_high_]
1154
1155
1156   This gives a 4-word result.  Since we are only interested in the
1157   lower 2 words, partial result (3) and the upper words of (2a) and
1158   (2b) don't need to be calculated.  Hence (2a) and (2b) can be
1159   calculated using non-widening multiplication.
1160
1161   (1), however, needs to be calculated with an unsigned widening
1162   multiplication.  If this operation is not directly supported we
1163   try using a signed widening multiplication and adjust the result.
1164   This adjustment works as follows:
1165
1166       If both operands are positive then no adjustment is needed.
1167
1168       If the operands have different signs, for example op0_low < 0 and
1169       op1_low >= 0, the instruction treats the most significant bit of
1170       op0_low as a sign bit instead of a bit with significance
1171       2**(BITS_PER_WORD-1), i.e. the instruction multiplies op1_low
1172       with 2**BITS_PER_WORD - op0_low, and two's complements the
1173       result.  Conclusion: We need to add op1_low * 2**BITS_PER_WORD to
1174       the result.
1175
1176       Similarly, if both operands are negative, we need to add
1177       (op0_low + op1_low) * 2**BITS_PER_WORD.
1178
1179       We use a trick to adjust quickly.  We logically shift op0_low right
1180       (op1_low) BITS_PER_WORD-1 steps to get 0 or 1, and add this to
1181       op0_high (op1_high) before it is used to calculate 2b (2a).  If no
1182       logical shift exists, we do an arithmetic right shift and subtract
1183       the 0 or -1.  */
1184
1185 static rtx
1186 expand_doubleword_mult (enum machine_mode mode, rtx op0, rtx op1, rtx target,
1187                        bool umulp, enum optab_methods methods)
1188 {
1189   int low = (WORDS_BIG_ENDIAN ? 1 : 0);
1190   int high = (WORDS_BIG_ENDIAN ? 0 : 1);
1191   rtx wordm1 = umulp ? NULL_RTX : GEN_INT (BITS_PER_WORD - 1);
1192   rtx product, adjust, product_high, temp;
1193
1194   rtx op0_high = operand_subword_force (op0, high, mode);
1195   rtx op0_low = operand_subword_force (op0, low, mode);
1196   rtx op1_high = operand_subword_force (op1, high, mode);
1197   rtx op1_low = operand_subword_force (op1, low, mode);
1198
1199   /* If we're using an unsigned multiply to directly compute the product
1200      of the low-order words of the operands and perform any required
1201      adjustments of the operands, we begin by trying two more multiplications
1202      and then computing the appropriate sum.
1203
1204      We have checked above that the required addition is provided.
1205      Full-word addition will normally always succeed, especially if
1206      it is provided at all, so we don't worry about its failure.  The
1207      multiplication may well fail, however, so we do handle that.  */
1208
1209   if (!umulp)
1210     {
1211       /* ??? This could be done with emit_store_flag where available.  */
1212       temp = expand_binop (word_mode, lshr_optab, op0_low, wordm1,
1213                            NULL_RTX, 1, methods);
1214       if (temp)
1215         op0_high = expand_binop (word_mode, add_optab, op0_high, temp,
1216                                  NULL_RTX, 0, OPTAB_DIRECT);
1217       else
1218         {
1219           temp = expand_binop (word_mode, ashr_optab, op0_low, wordm1,
1220                                NULL_RTX, 0, methods);
1221           if (!temp)
1222             return NULL_RTX;
1223           op0_high = expand_binop (word_mode, sub_optab, op0_high, temp,
1224                                    NULL_RTX, 0, OPTAB_DIRECT);
1225         }
1226
1227       if (!op0_high)
1228         return NULL_RTX;
1229     }
1230
1231   adjust = expand_binop (word_mode, smul_optab, op0_high, op1_low,
1232                          NULL_RTX, 0, OPTAB_DIRECT);
1233   if (!adjust)
1234     return NULL_RTX;
1235
1236   /* OP0_HIGH should now be dead.  */
1237
1238   if (!umulp)
1239     {
1240       /* ??? This could be done with emit_store_flag where available.  */
1241       temp = expand_binop (word_mode, lshr_optab, op1_low, wordm1,
1242                            NULL_RTX, 1, methods);
1243       if (temp)
1244         op1_high = expand_binop (word_mode, add_optab, op1_high, temp,
1245                                  NULL_RTX, 0, OPTAB_DIRECT);
1246       else
1247         {
1248           temp = expand_binop (word_mode, ashr_optab, op1_low, wordm1,
1249                                NULL_RTX, 0, methods);
1250           if (!temp)
1251             return NULL_RTX;
1252           op1_high = expand_binop (word_mode, sub_optab, op1_high, temp,
1253                                    NULL_RTX, 0, OPTAB_DIRECT);
1254         }
1255
1256       if (!op1_high)
1257         return NULL_RTX;
1258     }
1259
1260   temp = expand_binop (word_mode, smul_optab, op1_high, op0_low,
1261                        NULL_RTX, 0, OPTAB_DIRECT);
1262   if (!temp)
1263     return NULL_RTX;
1264
1265   /* OP1_HIGH should now be dead.  */
1266
1267   adjust = expand_binop (word_mode, add_optab, adjust, temp,
1268                          NULL_RTX, 0, OPTAB_DIRECT);
1269
1270   if (target && !REG_P (target))
1271     target = NULL_RTX;
1272
1273   if (umulp)
1274     product = expand_binop (mode, umul_widen_optab, op0_low, op1_low,
1275                             target, 1, OPTAB_DIRECT);
1276   else
1277     product = expand_binop (mode, smul_widen_optab, op0_low, op1_low,
1278                             target, 1, OPTAB_DIRECT);
1279
1280   if (!product)
1281     return NULL_RTX;
1282
1283   product_high = operand_subword (product, high, 1, mode);
1284   adjust = expand_binop (word_mode, add_optab, product_high, adjust,
1285                          NULL_RTX, 0, OPTAB_DIRECT);
1286   emit_move_insn (product_high, adjust);
1287   return product;
1288 }
1289 \f
1290 /* Wrapper around expand_binop which takes an rtx code to specify
1291    the operation to perform, not an optab pointer.  All other
1292    arguments are the same.  */
1293 rtx
1294 expand_simple_binop (enum machine_mode mode, enum rtx_code code, rtx op0,
1295                      rtx op1, rtx target, int unsignedp,
1296                      enum optab_methods methods)
1297 {
1298   optab binop = code_to_optab (code);
1299   gcc_assert (binop);
1300
1301   return expand_binop (mode, binop, op0, op1, target, unsignedp, methods);
1302 }
1303
1304 /* Return whether OP0 and OP1 should be swapped when expanding a commutative
1305    binop.  Order them according to commutative_operand_precedence and, if
1306    possible, try to put TARGET or a pseudo first.  */
1307 static bool
1308 swap_commutative_operands_with_target (rtx target, rtx op0, rtx op1)
1309 {
1310   int op0_prec = commutative_operand_precedence (op0);
1311   int op1_prec = commutative_operand_precedence (op1);
1312
1313   if (op0_prec < op1_prec)
1314     return true;
1315
1316   if (op0_prec > op1_prec)
1317     return false;
1318
1319   /* With equal precedence, both orders are ok, but it is better if the
1320      first operand is TARGET, or if both TARGET and OP0 are pseudos.  */
1321   if (target == 0 || REG_P (target))
1322     return (REG_P (op1) && !REG_P (op0)) || target == op1;
1323   else
1324     return rtx_equal_p (op1, target);
1325 }
1326
1327 /* Return true if BINOPTAB implements a shift operation.  */
1328
1329 static bool
1330 shift_optab_p (optab binoptab)
1331 {
1332   switch (optab_to_code (binoptab))
1333     {
1334     case ASHIFT:
1335     case SS_ASHIFT:
1336     case US_ASHIFT:
1337     case ASHIFTRT:
1338     case LSHIFTRT:
1339     case ROTATE:
1340     case ROTATERT:
1341       return true;
1342
1343     default:
1344       return false;
1345     }
1346 }
1347
1348 /* Return true if BINOPTAB implements a commutative binary operation.  */
1349
1350 static bool
1351 commutative_optab_p (optab binoptab)
1352 {
1353   return (GET_RTX_CLASS (optab_to_code (binoptab)) == RTX_COMM_ARITH
1354           || binoptab == smul_widen_optab
1355           || binoptab == umul_widen_optab
1356           || binoptab == smul_highpart_optab
1357           || binoptab == umul_highpart_optab);
1358 }
1359
1360 /* X is to be used in mode MODE as operand OPN to BINOPTAB.  If we're
1361    optimizing, and if the operand is a constant that costs more than
1362    1 instruction, force the constant into a register and return that
1363    register.  Return X otherwise.  UNSIGNEDP says whether X is unsigned.  */
1364
1365 static rtx
1366 avoid_expensive_constant (enum machine_mode mode, optab binoptab,
1367                           int opn, rtx x, bool unsignedp)
1368 {
1369   bool speed = optimize_insn_for_speed_p ();
1370
1371   if (mode != VOIDmode
1372       && optimize
1373       && CONSTANT_P (x)
1374       && (rtx_cost (x, optab_to_code (binoptab), opn, speed)
1375           > set_src_cost (x, speed)))
1376     {
1377       if (CONST_INT_P (x))
1378         {
1379           HOST_WIDE_INT intval = trunc_int_for_mode (INTVAL (x), mode);
1380           if (intval != INTVAL (x))
1381             x = GEN_INT (intval);
1382         }
1383       else
1384         x = convert_modes (mode, VOIDmode, x, unsignedp);
1385       x = force_reg (mode, x);
1386     }
1387   return x;
1388 }
1389
1390 /* Helper function for expand_binop: handle the case where there
1391    is an insn that directly implements the indicated operation.
1392    Returns null if this is not possible.  */
1393 static rtx
1394 expand_binop_directly (enum machine_mode mode, optab binoptab,
1395                        rtx op0, rtx op1,
1396                        rtx target, int unsignedp, enum optab_methods methods,
1397                        rtx last)
1398 {
1399   enum machine_mode from_mode = widened_mode (mode, op0, op1);
1400   enum insn_code icode = find_widening_optab_handler (binoptab, mode,
1401                                                       from_mode, 1);
1402   enum machine_mode xmode0 = insn_data[(int) icode].operand[1].mode;
1403   enum machine_mode xmode1 = insn_data[(int) icode].operand[2].mode;
1404   enum machine_mode mode0, mode1, tmp_mode;
1405   struct expand_operand ops[3];
1406   bool commutative_p;
1407   rtx pat;
1408   rtx xop0 = op0, xop1 = op1;
1409   rtx swap;
1410
1411   /* If it is a commutative operator and the modes would match
1412      if we would swap the operands, we can save the conversions.  */
1413   commutative_p = commutative_optab_p (binoptab);
1414   if (commutative_p
1415       && GET_MODE (xop0) != xmode0 && GET_MODE (xop1) != xmode1
1416       && GET_MODE (xop0) == xmode1 && GET_MODE (xop1) == xmode1)
1417     {
1418       swap = xop0;
1419       xop0 = xop1;
1420       xop1 = swap;
1421     }
1422
1423   /* If we are optimizing, force expensive constants into a register.  */
1424   xop0 = avoid_expensive_constant (xmode0, binoptab, 0, xop0, unsignedp);
1425   if (!shift_optab_p (binoptab))
1426     xop1 = avoid_expensive_constant (xmode1, binoptab, 1, xop1, unsignedp);
1427
1428   /* In case the insn wants input operands in modes different from
1429      those of the actual operands, convert the operands.  It would
1430      seem that we don't need to convert CONST_INTs, but we do, so
1431      that they're properly zero-extended, sign-extended or truncated
1432      for their mode.  */
1433
1434   mode0 = GET_MODE (xop0) != VOIDmode ? GET_MODE (xop0) : mode;
1435   if (xmode0 != VOIDmode && xmode0 != mode0)
1436     {
1437       xop0 = convert_modes (xmode0, mode0, xop0, unsignedp);
1438       mode0 = xmode0;
1439     }
1440
1441   mode1 = GET_MODE (xop1) != VOIDmode ? GET_MODE (xop1) : mode;
1442   if (xmode1 != VOIDmode && xmode1 != mode1)
1443     {
1444       xop1 = convert_modes (xmode1, mode1, xop1, unsignedp);
1445       mode1 = xmode1;
1446     }
1447
1448   /* If operation is commutative,
1449      try to make the first operand a register.
1450      Even better, try to make it the same as the target.
1451      Also try to make the last operand a constant.  */
1452   if (commutative_p
1453       && swap_commutative_operands_with_target (target, xop0, xop1))
1454     {
1455       swap = xop1;
1456       xop1 = xop0;
1457       xop0 = swap;
1458     }
1459
1460   /* Now, if insn's predicates don't allow our operands, put them into
1461      pseudo regs.  */
1462
1463   if (binoptab == vec_pack_trunc_optab
1464       || binoptab == vec_pack_usat_optab
1465       || binoptab == vec_pack_ssat_optab
1466       || binoptab == vec_pack_ufix_trunc_optab
1467       || binoptab == vec_pack_sfix_trunc_optab)
1468     {
1469       /* The mode of the result is different then the mode of the
1470          arguments.  */
1471       tmp_mode = insn_data[(int) icode].operand[0].mode;
1472       if (GET_MODE_NUNITS (tmp_mode) != 2 * GET_MODE_NUNITS (mode))
1473         {
1474           delete_insns_since (last);
1475           return NULL_RTX;
1476         }
1477     }
1478   else
1479     tmp_mode = mode;
1480
1481   create_output_operand (&ops[0], target, tmp_mode);
1482   create_input_operand (&ops[1], xop0, mode0);
1483   create_input_operand (&ops[2], xop1, mode1);
1484   pat = maybe_gen_insn (icode, 3, ops);
1485   if (pat)
1486     {
1487       /* If PAT is composed of more than one insn, try to add an appropriate
1488          REG_EQUAL note to it.  If we can't because TEMP conflicts with an
1489          operand, call expand_binop again, this time without a target.  */
1490       if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
1491           && ! add_equal_note (pat, ops[0].value, optab_to_code (binoptab),
1492                                ops[1].value, ops[2].value))
1493         {
1494           delete_insns_since (last);
1495           return expand_binop (mode, binoptab, op0, op1, NULL_RTX,
1496                                unsignedp, methods);
1497         }
1498
1499       emit_insn (pat);
1500       return ops[0].value;
1501     }
1502   delete_insns_since (last);
1503   return NULL_RTX;
1504 }
1505
1506 /* Generate code to perform an operation specified by BINOPTAB
1507    on operands OP0 and OP1, with result having machine-mode MODE.
1508
1509    UNSIGNEDP is for the case where we have to widen the operands
1510    to perform the operation.  It says to use zero-extension.
1511
1512    If TARGET is nonzero, the value
1513    is generated there, if it is convenient to do so.
1514    In all cases an rtx is returned for the locus of the value;
1515    this may or may not be TARGET.  */
1516
1517 rtx
1518 expand_binop (enum machine_mode mode, optab binoptab, rtx op0, rtx op1,
1519               rtx target, int unsignedp, enum optab_methods methods)
1520 {
1521   enum optab_methods next_methods
1522     = (methods == OPTAB_LIB || methods == OPTAB_LIB_WIDEN
1523        ? OPTAB_WIDEN : methods);
1524   enum mode_class mclass;
1525   enum machine_mode wider_mode;
1526   rtx libfunc;
1527   rtx temp;
1528   rtx entry_last = get_last_insn ();
1529   rtx last;
1530
1531   mclass = GET_MODE_CLASS (mode);
1532
1533   /* If subtracting an integer constant, convert this into an addition of
1534      the negated constant.  */
1535
1536   if (binoptab == sub_optab && CONST_INT_P (op1))
1537     {
1538       op1 = negate_rtx (mode, op1);
1539       binoptab = add_optab;
1540     }
1541
1542   /* Record where to delete back to if we backtrack.  */
1543   last = get_last_insn ();
1544
1545   /* If we can do it with a three-operand insn, do so.  */
1546
1547   if (methods != OPTAB_MUST_WIDEN
1548       && find_widening_optab_handler (binoptab, mode,
1549                                       widened_mode (mode, op0, op1), 1)
1550             != CODE_FOR_nothing)
1551     {
1552       temp = expand_binop_directly (mode, binoptab, op0, op1, target,
1553                                     unsignedp, methods, last);
1554       if (temp)
1555         return temp;
1556     }
1557
1558   /* If we were trying to rotate, and that didn't work, try rotating
1559      the other direction before falling back to shifts and bitwise-or.  */
1560   if (((binoptab == rotl_optab
1561         && optab_handler (rotr_optab, mode) != CODE_FOR_nothing)
1562        || (binoptab == rotr_optab
1563            && optab_handler (rotl_optab, mode) != CODE_FOR_nothing))
1564       && mclass == MODE_INT)
1565     {
1566       optab otheroptab = (binoptab == rotl_optab ? rotr_optab : rotl_optab);
1567       rtx newop1;
1568       unsigned int bits = GET_MODE_PRECISION (mode);
1569
1570       if (CONST_INT_P (op1))
1571         newop1 = GEN_INT (bits - INTVAL (op1));
1572       else if (targetm.shift_truncation_mask (mode) == bits - 1)
1573         newop1 = negate_rtx (GET_MODE (op1), op1);
1574       else
1575         newop1 = expand_binop (GET_MODE (op1), sub_optab,
1576                                gen_int_mode (bits, GET_MODE (op1)), op1,
1577                                NULL_RTX, unsignedp, OPTAB_DIRECT);
1578
1579       temp = expand_binop_directly (mode, otheroptab, op0, newop1,
1580                                     target, unsignedp, methods, last);
1581       if (temp)
1582         return temp;
1583     }
1584
1585   /* If this is a multiply, see if we can do a widening operation that
1586      takes operands of this mode and makes a wider mode.  */
1587
1588   if (binoptab == smul_optab
1589       && GET_MODE_2XWIDER_MODE (mode) != VOIDmode
1590       && (widening_optab_handler ((unsignedp ? umul_widen_optab
1591                                              : smul_widen_optab),
1592                                   GET_MODE_2XWIDER_MODE (mode), mode)
1593           != CODE_FOR_nothing))
1594     {
1595       temp = expand_binop (GET_MODE_2XWIDER_MODE (mode),
1596                            unsignedp ? umul_widen_optab : smul_widen_optab,
1597                            op0, op1, NULL_RTX, unsignedp, OPTAB_DIRECT);
1598
1599       if (temp != 0)
1600         {
1601           if (GET_MODE_CLASS (mode) == MODE_INT
1602               && TRULY_NOOP_TRUNCATION_MODES_P (mode, GET_MODE (temp)))
1603             return gen_lowpart (mode, temp);
1604           else
1605             return convert_to_mode (mode, temp, unsignedp);
1606         }
1607     }
1608
1609   /* If this is a vector shift by a scalar, see if we can do a vector
1610      shift by a vector.  If so, broadcast the scalar into a vector.  */
1611   if (mclass == MODE_VECTOR_INT)
1612     {
1613       optab otheroptab = unknown_optab;
1614
1615       if (binoptab == ashl_optab)
1616         otheroptab = vashl_optab;
1617       else if (binoptab == ashr_optab)
1618         otheroptab = vashr_optab;
1619       else if (binoptab == lshr_optab)
1620         otheroptab = vlshr_optab;
1621       else if (binoptab == rotl_optab)
1622         otheroptab = vrotl_optab;
1623       else if (binoptab == rotr_optab)
1624         otheroptab = vrotr_optab;
1625
1626       if (otheroptab && optab_handler (otheroptab, mode) != CODE_FOR_nothing)
1627         {
1628           rtx vop1 = expand_vector_broadcast (mode, op1);
1629           if (vop1)
1630             {
1631               temp = expand_binop_directly (mode, otheroptab, op0, vop1,
1632                                             target, unsignedp, methods, last);
1633               if (temp)
1634                 return temp;
1635             }
1636         }
1637     }
1638
1639   /* Look for a wider mode of the same class for which we think we
1640      can open-code the operation.  Check for a widening multiply at the
1641      wider mode as well.  */
1642
1643   if (CLASS_HAS_WIDER_MODES_P (mclass)
1644       && methods != OPTAB_DIRECT && methods != OPTAB_LIB)
1645     for (wider_mode = GET_MODE_WIDER_MODE (mode);
1646          wider_mode != VOIDmode;
1647          wider_mode = GET_MODE_WIDER_MODE (wider_mode))
1648       {
1649         if (optab_handler (binoptab, wider_mode) != CODE_FOR_nothing
1650             || (binoptab == smul_optab
1651                 && GET_MODE_WIDER_MODE (wider_mode) != VOIDmode
1652                 && (find_widening_optab_handler ((unsignedp
1653                                                   ? umul_widen_optab
1654                                                   : smul_widen_optab),
1655                                                  GET_MODE_WIDER_MODE (wider_mode),
1656                                                  mode, 0)
1657                     != CODE_FOR_nothing)))
1658           {
1659             rtx xop0 = op0, xop1 = op1;
1660             int no_extend = 0;
1661
1662             /* For certain integer operations, we need not actually extend
1663                the narrow operands, as long as we will truncate
1664                the results to the same narrowness.  */
1665
1666             if ((binoptab == ior_optab || binoptab == and_optab
1667                  || binoptab == xor_optab
1668                  || binoptab == add_optab || binoptab == sub_optab
1669                  || binoptab == smul_optab || binoptab == ashl_optab)
1670                 && mclass == MODE_INT)
1671               {
1672                 no_extend = 1;
1673                 xop0 = avoid_expensive_constant (mode, binoptab, 0,
1674                                                  xop0, unsignedp);
1675                 if (binoptab != ashl_optab)
1676                   xop1 = avoid_expensive_constant (mode, binoptab, 1,
1677                                                    xop1, unsignedp);
1678               }
1679
1680             xop0 = widen_operand (xop0, wider_mode, mode, unsignedp, no_extend);
1681
1682             /* The second operand of a shift must always be extended.  */
1683             xop1 = widen_operand (xop1, wider_mode, mode, unsignedp,
1684                                   no_extend && binoptab != ashl_optab);
1685
1686             temp = expand_binop (wider_mode, binoptab, xop0, xop1, NULL_RTX,
1687                                  unsignedp, OPTAB_DIRECT);
1688             if (temp)
1689               {
1690                 if (mclass != MODE_INT
1691                     || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
1692                   {
1693                     if (target == 0)
1694                       target = gen_reg_rtx (mode);
1695                     convert_move (target, temp, 0);
1696                     return target;
1697                   }
1698                 else
1699                   return gen_lowpart (mode, temp);
1700               }
1701             else
1702               delete_insns_since (last);
1703           }
1704       }
1705
1706   /* If operation is commutative,
1707      try to make the first operand a register.
1708      Even better, try to make it the same as the target.
1709      Also try to make the last operand a constant.  */
1710   if (commutative_optab_p (binoptab)
1711       && swap_commutative_operands_with_target (target, op0, op1))
1712     {
1713       temp = op1;
1714       op1 = op0;
1715       op0 = temp;
1716     }
1717
1718   /* These can be done a word at a time.  */
1719   if ((binoptab == and_optab || binoptab == ior_optab || binoptab == xor_optab)
1720       && mclass == MODE_INT
1721       && GET_MODE_SIZE (mode) > UNITS_PER_WORD
1722       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing)
1723     {
1724       int i;
1725       rtx insns;
1726
1727       /* If TARGET is the same as one of the operands, the REG_EQUAL note
1728          won't be accurate, so use a new target.  */
1729       if (target == 0
1730           || target == op0
1731           || target == op1
1732           || !valid_multiword_target_p (target))
1733         target = gen_reg_rtx (mode);
1734
1735       start_sequence ();
1736
1737       /* Do the actual arithmetic.  */
1738       for (i = 0; i < GET_MODE_BITSIZE (mode) / BITS_PER_WORD; i++)
1739         {
1740           rtx target_piece = operand_subword (target, i, 1, mode);
1741           rtx x = expand_binop (word_mode, binoptab,
1742                                 operand_subword_force (op0, i, mode),
1743                                 operand_subword_force (op1, i, mode),
1744                                 target_piece, unsignedp, next_methods);
1745
1746           if (x == 0)
1747             break;
1748
1749           if (target_piece != x)
1750             emit_move_insn (target_piece, x);
1751         }
1752
1753       insns = get_insns ();
1754       end_sequence ();
1755
1756       if (i == GET_MODE_BITSIZE (mode) / BITS_PER_WORD)
1757         {
1758           emit_insn (insns);
1759           return target;
1760         }
1761     }
1762
1763   /* Synthesize double word shifts from single word shifts.  */
1764   if ((binoptab == lshr_optab || binoptab == ashl_optab
1765        || binoptab == ashr_optab)
1766       && mclass == MODE_INT
1767       && (CONST_INT_P (op1) || optimize_insn_for_speed_p ())
1768       && GET_MODE_SIZE (mode) == 2 * UNITS_PER_WORD
1769       && GET_MODE_PRECISION (mode) == GET_MODE_BITSIZE (mode)
1770       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing
1771       && optab_handler (ashl_optab, word_mode) != CODE_FOR_nothing
1772       && optab_handler (lshr_optab, word_mode) != CODE_FOR_nothing)
1773     {
1774       unsigned HOST_WIDE_INT shift_mask, double_shift_mask;
1775       enum machine_mode op1_mode;
1776
1777       double_shift_mask = targetm.shift_truncation_mask (mode);
1778       shift_mask = targetm.shift_truncation_mask (word_mode);
1779       op1_mode = GET_MODE (op1) != VOIDmode ? GET_MODE (op1) : word_mode;
1780
1781       /* Apply the truncation to constant shifts.  */
1782       if (double_shift_mask > 0 && CONST_INT_P (op1))
1783         op1 = GEN_INT (INTVAL (op1) & double_shift_mask);
1784
1785       if (op1 == CONST0_RTX (op1_mode))
1786         return op0;
1787
1788       /* Make sure that this is a combination that expand_doubleword_shift
1789          can handle.  See the comments there for details.  */
1790       if (double_shift_mask == 0
1791           || (shift_mask == BITS_PER_WORD - 1
1792               && double_shift_mask == BITS_PER_WORD * 2 - 1))
1793         {
1794           rtx insns;
1795           rtx into_target, outof_target;
1796           rtx into_input, outof_input;
1797           int left_shift, outof_word;
1798
1799           /* If TARGET is the same as one of the operands, the REG_EQUAL note
1800              won't be accurate, so use a new target.  */
1801           if (target == 0
1802               || target == op0
1803               || target == op1
1804               || !valid_multiword_target_p (target))
1805             target = gen_reg_rtx (mode);
1806
1807           start_sequence ();
1808
1809           /* OUTOF_* is the word we are shifting bits away from, and
1810              INTO_* is the word that we are shifting bits towards, thus
1811              they differ depending on the direction of the shift and
1812              WORDS_BIG_ENDIAN.  */
1813
1814           left_shift = binoptab == ashl_optab;
1815           outof_word = left_shift ^ ! WORDS_BIG_ENDIAN;
1816
1817           outof_target = operand_subword (target, outof_word, 1, mode);
1818           into_target = operand_subword (target, 1 - outof_word, 1, mode);
1819
1820           outof_input = operand_subword_force (op0, outof_word, mode);
1821           into_input = operand_subword_force (op0, 1 - outof_word, mode);
1822
1823           if (expand_doubleword_shift (op1_mode, binoptab,
1824                                        outof_input, into_input, op1,
1825                                        outof_target, into_target,
1826                                        unsignedp, next_methods, shift_mask))
1827             {
1828               insns = get_insns ();
1829               end_sequence ();
1830
1831               emit_insn (insns);
1832               return target;
1833             }
1834           end_sequence ();
1835         }
1836     }
1837
1838   /* Synthesize double word rotates from single word shifts.  */
1839   if ((binoptab == rotl_optab || binoptab == rotr_optab)
1840       && mclass == MODE_INT
1841       && CONST_INT_P (op1)
1842       && GET_MODE_PRECISION (mode) == 2 * BITS_PER_WORD
1843       && optab_handler (ashl_optab, word_mode) != CODE_FOR_nothing
1844       && optab_handler (lshr_optab, word_mode) != CODE_FOR_nothing)
1845     {
1846       rtx insns;
1847       rtx into_target, outof_target;
1848       rtx into_input, outof_input;
1849       rtx inter;
1850       int shift_count, left_shift, outof_word;
1851
1852       /* If TARGET is the same as one of the operands, the REG_EQUAL note
1853          won't be accurate, so use a new target. Do this also if target is not
1854          a REG, first because having a register instead may open optimization
1855          opportunities, and second because if target and op0 happen to be MEMs
1856          designating the same location, we would risk clobbering it too early
1857          in the code sequence we generate below.  */
1858       if (target == 0
1859           || target == op0
1860           || target == op1
1861           || !REG_P (target)
1862           || !valid_multiword_target_p (target))
1863         target = gen_reg_rtx (mode);
1864
1865       start_sequence ();
1866
1867       shift_count = INTVAL (op1);
1868
1869       /* OUTOF_* is the word we are shifting bits away from, and
1870          INTO_* is the word that we are shifting bits towards, thus
1871          they differ depending on the direction of the shift and
1872          WORDS_BIG_ENDIAN.  */
1873
1874       left_shift = (binoptab == rotl_optab);
1875       outof_word = left_shift ^ ! WORDS_BIG_ENDIAN;
1876
1877       outof_target = operand_subword (target, outof_word, 1, mode);
1878       into_target = operand_subword (target, 1 - outof_word, 1, mode);
1879
1880       outof_input = operand_subword_force (op0, outof_word, mode);
1881       into_input = operand_subword_force (op0, 1 - outof_word, mode);
1882
1883       if (shift_count == BITS_PER_WORD)
1884         {
1885           /* This is just a word swap.  */
1886           emit_move_insn (outof_target, into_input);
1887           emit_move_insn (into_target, outof_input);
1888           inter = const0_rtx;
1889         }
1890       else
1891         {
1892           rtx into_temp1, into_temp2, outof_temp1, outof_temp2;
1893           rtx first_shift_count, second_shift_count;
1894           optab reverse_unsigned_shift, unsigned_shift;
1895
1896           reverse_unsigned_shift = (left_shift ^ (shift_count < BITS_PER_WORD)
1897                                     ? lshr_optab : ashl_optab);
1898
1899           unsigned_shift = (left_shift ^ (shift_count < BITS_PER_WORD)
1900                             ? ashl_optab : lshr_optab);
1901
1902           if (shift_count > BITS_PER_WORD)
1903             {
1904               first_shift_count = GEN_INT (shift_count - BITS_PER_WORD);
1905               second_shift_count = GEN_INT (2 * BITS_PER_WORD - shift_count);
1906             }
1907           else
1908             {
1909               first_shift_count = GEN_INT (BITS_PER_WORD - shift_count);
1910               second_shift_count = GEN_INT (shift_count);
1911             }
1912
1913           into_temp1 = expand_binop (word_mode, unsigned_shift,
1914                                      outof_input, first_shift_count,
1915                                      NULL_RTX, unsignedp, next_methods);
1916           into_temp2 = expand_binop (word_mode, reverse_unsigned_shift,
1917                                      into_input, second_shift_count,
1918                                      NULL_RTX, unsignedp, next_methods);
1919
1920           if (into_temp1 != 0 && into_temp2 != 0)
1921             inter = expand_binop (word_mode, ior_optab, into_temp1, into_temp2,
1922                                   into_target, unsignedp, next_methods);
1923           else
1924             inter = 0;
1925
1926           if (inter != 0 && inter != into_target)
1927             emit_move_insn (into_target, inter);
1928
1929           outof_temp1 = expand_binop (word_mode, unsigned_shift,
1930                                       into_input, first_shift_count,
1931                                       NULL_RTX, unsignedp, next_methods);
1932           outof_temp2 = expand_binop (word_mode, reverse_unsigned_shift,
1933                                       outof_input, second_shift_count,
1934                                       NULL_RTX, unsignedp, next_methods);
1935
1936           if (inter != 0 && outof_temp1 != 0 && outof_temp2 != 0)
1937             inter = expand_binop (word_mode, ior_optab,
1938                                   outof_temp1, outof_temp2,
1939                                   outof_target, unsignedp, next_methods);
1940
1941           if (inter != 0 && inter != outof_target)
1942             emit_move_insn (outof_target, inter);
1943         }
1944
1945       insns = get_insns ();
1946       end_sequence ();
1947
1948       if (inter != 0)
1949         {
1950           emit_insn (insns);
1951           return target;
1952         }
1953     }
1954
1955   /* These can be done a word at a time by propagating carries.  */
1956   if ((binoptab == add_optab || binoptab == sub_optab)
1957       && mclass == MODE_INT
1958       && GET_MODE_SIZE (mode) >= 2 * UNITS_PER_WORD
1959       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing)
1960     {
1961       unsigned int i;
1962       optab otheroptab = binoptab == add_optab ? sub_optab : add_optab;
1963       const unsigned int nwords = GET_MODE_BITSIZE (mode) / BITS_PER_WORD;
1964       rtx carry_in = NULL_RTX, carry_out = NULL_RTX;
1965       rtx xop0, xop1, xtarget;
1966
1967       /* We can handle either a 1 or -1 value for the carry.  If STORE_FLAG
1968          value is one of those, use it.  Otherwise, use 1 since it is the
1969          one easiest to get.  */
1970 #if STORE_FLAG_VALUE == 1 || STORE_FLAG_VALUE == -1
1971       int normalizep = STORE_FLAG_VALUE;
1972 #else
1973       int normalizep = 1;
1974 #endif
1975
1976       /* Prepare the operands.  */
1977       xop0 = force_reg (mode, op0);
1978       xop1 = force_reg (mode, op1);
1979
1980       xtarget = gen_reg_rtx (mode);
1981
1982       if (target == 0 || !REG_P (target) || !valid_multiword_target_p (target))
1983         target = xtarget;
1984
1985       /* Indicate for flow that the entire target reg is being set.  */
1986       if (REG_P (target))
1987         emit_clobber (xtarget);
1988
1989       /* Do the actual arithmetic.  */
1990       for (i = 0; i < nwords; i++)
1991         {
1992           int index = (WORDS_BIG_ENDIAN ? nwords - i - 1 : i);
1993           rtx target_piece = operand_subword (xtarget, index, 1, mode);
1994           rtx op0_piece = operand_subword_force (xop0, index, mode);
1995           rtx op1_piece = operand_subword_force (xop1, index, mode);
1996           rtx x;
1997
1998           /* Main add/subtract of the input operands.  */
1999           x = expand_binop (word_mode, binoptab,
2000                             op0_piece, op1_piece,
2001                             target_piece, unsignedp, next_methods);
2002           if (x == 0)
2003             break;
2004
2005           if (i + 1 < nwords)
2006             {
2007               /* Store carry from main add/subtract.  */
2008               carry_out = gen_reg_rtx (word_mode);
2009               carry_out = emit_store_flag_force (carry_out,
2010                                                  (binoptab == add_optab
2011                                                   ? LT : GT),
2012                                                  x, op0_piece,
2013                                                  word_mode, 1, normalizep);
2014             }
2015
2016           if (i > 0)
2017             {
2018               rtx newx;
2019
2020               /* Add/subtract previous carry to main result.  */
2021               newx = expand_binop (word_mode,
2022                                    normalizep == 1 ? binoptab : otheroptab,
2023                                    x, carry_in,
2024                                    NULL_RTX, 1, next_methods);
2025
2026               if (i + 1 < nwords)
2027                 {
2028                   /* Get out carry from adding/subtracting carry in.  */
2029                   rtx carry_tmp = gen_reg_rtx (word_mode);
2030                   carry_tmp = emit_store_flag_force (carry_tmp,
2031                                                      (binoptab == add_optab
2032                                                       ? LT : GT),
2033                                                      newx, x,
2034                                                      word_mode, 1, normalizep);
2035
2036                   /* Logical-ior the two poss. carry together.  */
2037                   carry_out = expand_binop (word_mode, ior_optab,
2038                                             carry_out, carry_tmp,
2039                                             carry_out, 0, next_methods);
2040                   if (carry_out == 0)
2041                     break;
2042                 }
2043               emit_move_insn (target_piece, newx);
2044             }
2045           else
2046             {
2047               if (x != target_piece)
2048                 emit_move_insn (target_piece, x);
2049             }
2050
2051           carry_in = carry_out;
2052         }
2053
2054       if (i == GET_MODE_BITSIZE (mode) / (unsigned) BITS_PER_WORD)
2055         {
2056           if (optab_handler (mov_optab, mode) != CODE_FOR_nothing
2057               || ! rtx_equal_p (target, xtarget))
2058             {
2059               rtx temp = emit_move_insn (target, xtarget);
2060
2061               set_dst_reg_note (temp, REG_EQUAL,
2062                                 gen_rtx_fmt_ee (optab_to_code (binoptab),
2063                                                 mode, copy_rtx (xop0),
2064                                                 copy_rtx (xop1)),
2065                                 target);
2066             }
2067           else
2068             target = xtarget;
2069
2070           return target;
2071         }
2072
2073       else
2074         delete_insns_since (last);
2075     }
2076
2077   /* Attempt to synthesize double word multiplies using a sequence of word
2078      mode multiplications.  We first attempt to generate a sequence using a
2079      more efficient unsigned widening multiply, and if that fails we then
2080      try using a signed widening multiply.  */
2081
2082   if (binoptab == smul_optab
2083       && mclass == MODE_INT
2084       && GET_MODE_SIZE (mode) == 2 * UNITS_PER_WORD
2085       && optab_handler (smul_optab, word_mode) != CODE_FOR_nothing
2086       && optab_handler (add_optab, word_mode) != CODE_FOR_nothing)
2087     {
2088       rtx product = NULL_RTX;
2089       if (widening_optab_handler (umul_widen_optab, mode, word_mode)
2090             != CODE_FOR_nothing)
2091         {
2092           product = expand_doubleword_mult (mode, op0, op1, target,
2093                                             true, methods);
2094           if (!product)
2095             delete_insns_since (last);
2096         }
2097
2098       if (product == NULL_RTX
2099           && widening_optab_handler (smul_widen_optab, mode, word_mode)
2100                 != CODE_FOR_nothing)
2101         {
2102           product = expand_doubleword_mult (mode, op0, op1, target,
2103                                             false, methods);
2104           if (!product)
2105             delete_insns_since (last);
2106         }
2107
2108       if (product != NULL_RTX)
2109         {
2110           if (optab_handler (mov_optab, mode) != CODE_FOR_nothing)
2111             {
2112               temp = emit_move_insn (target ? target : product, product);
2113               set_dst_reg_note (temp,
2114                                 REG_EQUAL,
2115                                 gen_rtx_fmt_ee (MULT, mode,
2116                                                 copy_rtx (op0),
2117                                                 copy_rtx (op1)),
2118                                 target ? target : product);
2119             }
2120           return product;
2121         }
2122     }
2123
2124   /* It can't be open-coded in this mode.
2125      Use a library call if one is available and caller says that's ok.  */
2126
2127   libfunc = optab_libfunc (binoptab, mode);
2128   if (libfunc
2129       && (methods == OPTAB_LIB || methods == OPTAB_LIB_WIDEN))
2130     {
2131       rtx insns;
2132       rtx op1x = op1;
2133       enum machine_mode op1_mode = mode;
2134       rtx value;
2135
2136       start_sequence ();
2137
2138       if (shift_optab_p (binoptab))
2139         {
2140           op1_mode = targetm.libgcc_shift_count_mode ();
2141           /* Specify unsigned here,
2142              since negative shift counts are meaningless.  */
2143           op1x = convert_to_mode (op1_mode, op1, 1);
2144         }
2145
2146       if (GET_MODE (op0) != VOIDmode
2147           && GET_MODE (op0) != mode)
2148         op0 = convert_to_mode (mode, op0, unsignedp);
2149
2150       /* Pass 1 for NO_QUEUE so we don't lose any increments
2151          if the libcall is cse'd or moved.  */
2152       value = emit_library_call_value (libfunc,
2153                                        NULL_RTX, LCT_CONST, mode, 2,
2154                                        op0, mode, op1x, op1_mode);
2155
2156       insns = get_insns ();
2157       end_sequence ();
2158
2159       target = gen_reg_rtx (mode);
2160       emit_libcall_block_1 (insns, target, value,
2161                             gen_rtx_fmt_ee (optab_to_code (binoptab),
2162                                             mode, op0, op1),
2163                             trapv_binoptab_p (binoptab));
2164
2165       return target;
2166     }
2167
2168   delete_insns_since (last);
2169
2170   /* It can't be done in this mode.  Can we do it in a wider mode?  */
2171
2172   if (! (methods == OPTAB_WIDEN || methods == OPTAB_LIB_WIDEN
2173          || methods == OPTAB_MUST_WIDEN))
2174     {
2175       /* Caller says, don't even try.  */
2176       delete_insns_since (entry_last);
2177       return 0;
2178     }
2179
2180   /* Compute the value of METHODS to pass to recursive calls.
2181      Don't allow widening to be tried recursively.  */
2182
2183   methods = (methods == OPTAB_LIB_WIDEN ? OPTAB_LIB : OPTAB_DIRECT);
2184
2185   /* Look for a wider mode of the same class for which it appears we can do
2186      the operation.  */
2187
2188   if (CLASS_HAS_WIDER_MODES_P (mclass))
2189     {
2190       for (wider_mode = GET_MODE_WIDER_MODE (mode);
2191            wider_mode != VOIDmode;
2192            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2193         {
2194           if (find_widening_optab_handler (binoptab, wider_mode, mode, 1)
2195                   != CODE_FOR_nothing
2196               || (methods == OPTAB_LIB
2197                   && optab_libfunc (binoptab, wider_mode)))
2198             {
2199               rtx xop0 = op0, xop1 = op1;
2200               int no_extend = 0;
2201
2202               /* For certain integer operations, we need not actually extend
2203                  the narrow operands, as long as we will truncate
2204                  the results to the same narrowness.  */
2205
2206               if ((binoptab == ior_optab || binoptab == and_optab
2207                    || binoptab == xor_optab
2208                    || binoptab == add_optab || binoptab == sub_optab
2209                    || binoptab == smul_optab || binoptab == ashl_optab)
2210                   && mclass == MODE_INT)
2211                 no_extend = 1;
2212
2213               xop0 = widen_operand (xop0, wider_mode, mode,
2214                                     unsignedp, no_extend);
2215
2216               /* The second operand of a shift must always be extended.  */
2217               xop1 = widen_operand (xop1, wider_mode, mode, unsignedp,
2218                                     no_extend && binoptab != ashl_optab);
2219
2220               temp = expand_binop (wider_mode, binoptab, xop0, xop1, NULL_RTX,
2221                                    unsignedp, methods);
2222               if (temp)
2223                 {
2224                   if (mclass != MODE_INT
2225                       || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
2226                     {
2227                       if (target == 0)
2228                         target = gen_reg_rtx (mode);
2229                       convert_move (target, temp, 0);
2230                       return target;
2231                     }
2232                   else
2233                     return gen_lowpart (mode, temp);
2234                 }
2235               else
2236                 delete_insns_since (last);
2237             }
2238         }
2239     }
2240
2241   delete_insns_since (entry_last);
2242   return 0;
2243 }
2244 \f
2245 /* Expand a binary operator which has both signed and unsigned forms.
2246    UOPTAB is the optab for unsigned operations, and SOPTAB is for
2247    signed operations.
2248
2249    If we widen unsigned operands, we may use a signed wider operation instead
2250    of an unsigned wider operation, since the result would be the same.  */
2251
2252 rtx
2253 sign_expand_binop (enum machine_mode mode, optab uoptab, optab soptab,
2254                    rtx op0, rtx op1, rtx target, int unsignedp,
2255                    enum optab_methods methods)
2256 {
2257   rtx temp;
2258   optab direct_optab = unsignedp ? uoptab : soptab;
2259   bool save_enable;
2260
2261   /* Do it without widening, if possible.  */
2262   temp = expand_binop (mode, direct_optab, op0, op1, target,
2263                        unsignedp, OPTAB_DIRECT);
2264   if (temp || methods == OPTAB_DIRECT)
2265     return temp;
2266
2267   /* Try widening to a signed int.  Disable any direct use of any
2268      signed insn in the current mode.  */
2269   save_enable = swap_optab_enable (soptab, mode, false);
2270
2271   temp = expand_binop (mode, soptab, op0, op1, target,
2272                        unsignedp, OPTAB_WIDEN);
2273
2274   /* For unsigned operands, try widening to an unsigned int.  */
2275   if (!temp && unsignedp)
2276     temp = expand_binop (mode, uoptab, op0, op1, target,
2277                          unsignedp, OPTAB_WIDEN);
2278   if (temp || methods == OPTAB_WIDEN)
2279     goto egress;
2280
2281   /* Use the right width libcall if that exists.  */
2282   temp = expand_binop (mode, direct_optab, op0, op1, target,
2283                        unsignedp, OPTAB_LIB);
2284   if (temp || methods == OPTAB_LIB)
2285     goto egress;
2286
2287   /* Must widen and use a libcall, use either signed or unsigned.  */
2288   temp = expand_binop (mode, soptab, op0, op1, target,
2289                        unsignedp, methods);
2290   if (!temp && unsignedp)
2291     temp = expand_binop (mode, uoptab, op0, op1, target,
2292                          unsignedp, methods);
2293
2294  egress:
2295   /* Undo the fiddling above.  */
2296   if (save_enable)
2297     swap_optab_enable (soptab, mode, true);
2298   return temp;
2299 }
2300 \f
2301 /* Generate code to perform an operation specified by UNOPPTAB
2302    on operand OP0, with two results to TARG0 and TARG1.
2303    We assume that the order of the operands for the instruction
2304    is TARG0, TARG1, OP0.
2305
2306    Either TARG0 or TARG1 may be zero, but what that means is that
2307    the result is not actually wanted.  We will generate it into
2308    a dummy pseudo-reg and discard it.  They may not both be zero.
2309
2310    Returns 1 if this operation can be performed; 0 if not.  */
2311
2312 int
2313 expand_twoval_unop (optab unoptab, rtx op0, rtx targ0, rtx targ1,
2314                     int unsignedp)
2315 {
2316   enum machine_mode mode = GET_MODE (targ0 ? targ0 : targ1);
2317   enum mode_class mclass;
2318   enum machine_mode wider_mode;
2319   rtx entry_last = get_last_insn ();
2320   rtx last;
2321
2322   mclass = GET_MODE_CLASS (mode);
2323
2324   if (!targ0)
2325     targ0 = gen_reg_rtx (mode);
2326   if (!targ1)
2327     targ1 = gen_reg_rtx (mode);
2328
2329   /* Record where to go back to if we fail.  */
2330   last = get_last_insn ();
2331
2332   if (optab_handler (unoptab, mode) != CODE_FOR_nothing)
2333     {
2334       struct expand_operand ops[3];
2335       enum insn_code icode = optab_handler (unoptab, mode);
2336
2337       create_fixed_operand (&ops[0], targ0);
2338       create_fixed_operand (&ops[1], targ1);
2339       create_convert_operand_from (&ops[2], op0, mode, unsignedp);
2340       if (maybe_expand_insn (icode, 3, ops))
2341         return 1;
2342     }
2343
2344   /* It can't be done in this mode.  Can we do it in a wider mode?  */
2345
2346   if (CLASS_HAS_WIDER_MODES_P (mclass))
2347     {
2348       for (wider_mode = GET_MODE_WIDER_MODE (mode);
2349            wider_mode != VOIDmode;
2350            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2351         {
2352           if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
2353             {
2354               rtx t0 = gen_reg_rtx (wider_mode);
2355               rtx t1 = gen_reg_rtx (wider_mode);
2356               rtx cop0 = convert_modes (wider_mode, mode, op0, unsignedp);
2357
2358               if (expand_twoval_unop (unoptab, cop0, t0, t1, unsignedp))
2359                 {
2360                   convert_move (targ0, t0, unsignedp);
2361                   convert_move (targ1, t1, unsignedp);
2362                   return 1;
2363                 }
2364               else
2365                 delete_insns_since (last);
2366             }
2367         }
2368     }
2369
2370   delete_insns_since (entry_last);
2371   return 0;
2372 }
2373 \f
2374 /* Generate code to perform an operation specified by BINOPTAB
2375    on operands OP0 and OP1, with two results to TARG1 and TARG2.
2376    We assume that the order of the operands for the instruction
2377    is TARG0, OP0, OP1, TARG1, which would fit a pattern like
2378    [(set TARG0 (operate OP0 OP1)) (set TARG1 (operate ...))].
2379
2380    Either TARG0 or TARG1 may be zero, but what that means is that
2381    the result is not actually wanted.  We will generate it into
2382    a dummy pseudo-reg and discard it.  They may not both be zero.
2383
2384    Returns 1 if this operation can be performed; 0 if not.  */
2385
2386 int
2387 expand_twoval_binop (optab binoptab, rtx op0, rtx op1, rtx targ0, rtx targ1,
2388                      int unsignedp)
2389 {
2390   enum machine_mode mode = GET_MODE (targ0 ? targ0 : targ1);
2391   enum mode_class mclass;
2392   enum machine_mode wider_mode;
2393   rtx entry_last = get_last_insn ();
2394   rtx last;
2395
2396   mclass = GET_MODE_CLASS (mode);
2397
2398   if (!targ0)
2399     targ0 = gen_reg_rtx (mode);
2400   if (!targ1)
2401     targ1 = gen_reg_rtx (mode);
2402
2403   /* Record where to go back to if we fail.  */
2404   last = get_last_insn ();
2405
2406   if (optab_handler (binoptab, mode) != CODE_FOR_nothing)
2407     {
2408       struct expand_operand ops[4];
2409       enum insn_code icode = optab_handler (binoptab, mode);
2410       enum machine_mode mode0 = insn_data[icode].operand[1].mode;
2411       enum machine_mode mode1 = insn_data[icode].operand[2].mode;
2412       rtx xop0 = op0, xop1 = op1;
2413
2414       /* If we are optimizing, force expensive constants into a register.  */
2415       xop0 = avoid_expensive_constant (mode0, binoptab, 0, xop0, unsignedp);
2416       xop1 = avoid_expensive_constant (mode1, binoptab, 1, xop1, unsignedp);
2417
2418       create_fixed_operand (&ops[0], targ0);
2419       create_convert_operand_from (&ops[1], op0, mode, unsignedp);
2420       create_convert_operand_from (&ops[2], op1, mode, unsignedp);
2421       create_fixed_operand (&ops[3], targ1);
2422       if (maybe_expand_insn (icode, 4, ops))
2423         return 1;
2424       delete_insns_since (last);
2425     }
2426
2427   /* It can't be done in this mode.  Can we do it in a wider mode?  */
2428
2429   if (CLASS_HAS_WIDER_MODES_P (mclass))
2430     {
2431       for (wider_mode = GET_MODE_WIDER_MODE (mode);
2432            wider_mode != VOIDmode;
2433            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2434         {
2435           if (optab_handler (binoptab, wider_mode) != CODE_FOR_nothing)
2436             {
2437               rtx t0 = gen_reg_rtx (wider_mode);
2438               rtx t1 = gen_reg_rtx (wider_mode);
2439               rtx cop0 = convert_modes (wider_mode, mode, op0, unsignedp);
2440               rtx cop1 = convert_modes (wider_mode, mode, op1, unsignedp);
2441
2442               if (expand_twoval_binop (binoptab, cop0, cop1,
2443                                        t0, t1, unsignedp))
2444                 {
2445                   convert_move (targ0, t0, unsignedp);
2446                   convert_move (targ1, t1, unsignedp);
2447                   return 1;
2448                 }
2449               else
2450                 delete_insns_since (last);
2451             }
2452         }
2453     }
2454
2455   delete_insns_since (entry_last);
2456   return 0;
2457 }
2458
2459 /* Expand the two-valued library call indicated by BINOPTAB, but
2460    preserve only one of the values.  If TARG0 is non-NULL, the first
2461    value is placed into TARG0; otherwise the second value is placed
2462    into TARG1.  Exactly one of TARG0 and TARG1 must be non-NULL.  The
2463    value stored into TARG0 or TARG1 is equivalent to (CODE OP0 OP1).
2464    This routine assumes that the value returned by the library call is
2465    as if the return value was of an integral mode twice as wide as the
2466    mode of OP0.  Returns 1 if the call was successful.  */
2467
2468 bool
2469 expand_twoval_binop_libfunc (optab binoptab, rtx op0, rtx op1,
2470                              rtx targ0, rtx targ1, enum rtx_code code)
2471 {
2472   enum machine_mode mode;
2473   enum machine_mode libval_mode;
2474   rtx libval;
2475   rtx insns;
2476   rtx libfunc;
2477
2478   /* Exactly one of TARG0 or TARG1 should be non-NULL.  */
2479   gcc_assert (!targ0 != !targ1);
2480
2481   mode = GET_MODE (op0);
2482   libfunc = optab_libfunc (binoptab, mode);
2483   if (!libfunc)
2484     return false;
2485
2486   /* The value returned by the library function will have twice as
2487      many bits as the nominal MODE.  */
2488   libval_mode = smallest_mode_for_size (2 * GET_MODE_BITSIZE (mode),
2489                                         MODE_INT);
2490   start_sequence ();
2491   libval = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
2492                                     libval_mode, 2,
2493                                     op0, mode,
2494                                     op1, mode);
2495   /* Get the part of VAL containing the value that we want.  */
2496   libval = simplify_gen_subreg (mode, libval, libval_mode,
2497                                 targ0 ? 0 : GET_MODE_SIZE (mode));
2498   insns = get_insns ();
2499   end_sequence ();
2500   /* Move the into the desired location.  */
2501   emit_libcall_block (insns, targ0 ? targ0 : targ1, libval,
2502                       gen_rtx_fmt_ee (code, mode, op0, op1));
2503
2504   return true;
2505 }
2506
2507 \f
2508 /* Wrapper around expand_unop which takes an rtx code to specify
2509    the operation to perform, not an optab pointer.  All other
2510    arguments are the same.  */
2511 rtx
2512 expand_simple_unop (enum machine_mode mode, enum rtx_code code, rtx op0,
2513                     rtx target, int unsignedp)
2514 {
2515   optab unop = code_to_optab (code);
2516   gcc_assert (unop);
2517
2518   return expand_unop (mode, unop, op0, target, unsignedp);
2519 }
2520
2521 /* Try calculating
2522         (clz:narrow x)
2523    as
2524         (clz:wide (zero_extend:wide x)) - ((width wide) - (width narrow)).
2525
2526    A similar operation can be used for clrsb.  UNOPTAB says which operation
2527    we are trying to expand.  */
2528 static rtx
2529 widen_leading (enum machine_mode mode, rtx op0, rtx target, optab unoptab)
2530 {
2531   enum mode_class mclass = GET_MODE_CLASS (mode);
2532   if (CLASS_HAS_WIDER_MODES_P (mclass))
2533     {
2534       enum machine_mode wider_mode;
2535       for (wider_mode = GET_MODE_WIDER_MODE (mode);
2536            wider_mode != VOIDmode;
2537            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2538         {
2539           if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
2540             {
2541               rtx xop0, temp, last;
2542
2543               last = get_last_insn ();
2544
2545               if (target == 0)
2546                 target = gen_reg_rtx (mode);
2547               xop0 = widen_operand (op0, wider_mode, mode,
2548                                     unoptab != clrsb_optab, false);
2549               temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
2550                                   unoptab != clrsb_optab);
2551               if (temp != 0)
2552                 temp = expand_binop
2553                   (wider_mode, sub_optab, temp,
2554                    gen_int_mode (GET_MODE_PRECISION (wider_mode)
2555                                  - GET_MODE_PRECISION (mode),
2556                                  wider_mode),
2557                    target, true, OPTAB_DIRECT);
2558               if (temp == 0)
2559                 delete_insns_since (last);
2560
2561               return temp;
2562             }
2563         }
2564     }
2565   return 0;
2566 }
2567
2568 /* Try calculating clz of a double-word quantity as two clz's of word-sized
2569    quantities, choosing which based on whether the high word is nonzero.  */
2570 static rtx
2571 expand_doubleword_clz (enum machine_mode mode, rtx op0, rtx target)
2572 {
2573   rtx xop0 = force_reg (mode, op0);
2574   rtx subhi = gen_highpart (word_mode, xop0);
2575   rtx sublo = gen_lowpart (word_mode, xop0);
2576   rtx hi0_label = gen_label_rtx ();
2577   rtx after_label = gen_label_rtx ();
2578   rtx seq, temp, result;
2579
2580   /* If we were not given a target, use a word_mode register, not a
2581      'mode' register.  The result will fit, and nobody is expecting
2582      anything bigger (the return type of __builtin_clz* is int).  */
2583   if (!target)
2584     target = gen_reg_rtx (word_mode);
2585
2586   /* In any case, write to a word_mode scratch in both branches of the
2587      conditional, so we can ensure there is a single move insn setting
2588      'target' to tag a REG_EQUAL note on.  */
2589   result = gen_reg_rtx (word_mode);
2590
2591   start_sequence ();
2592
2593   /* If the high word is not equal to zero,
2594      then clz of the full value is clz of the high word.  */
2595   emit_cmp_and_jump_insns (subhi, CONST0_RTX (word_mode), EQ, 0,
2596                            word_mode, true, hi0_label);
2597
2598   temp = expand_unop_direct (word_mode, clz_optab, subhi, result, true);
2599   if (!temp)
2600     goto fail;
2601
2602   if (temp != result)
2603     convert_move (result, temp, true);
2604
2605   emit_jump_insn (gen_jump (after_label));
2606   emit_barrier ();
2607
2608   /* Else clz of the full value is clz of the low word plus the number
2609      of bits in the high word.  */
2610   emit_label (hi0_label);
2611
2612   temp = expand_unop_direct (word_mode, clz_optab, sublo, 0, true);
2613   if (!temp)
2614     goto fail;
2615   temp = expand_binop (word_mode, add_optab, temp,
2616                        gen_int_mode (GET_MODE_BITSIZE (word_mode), word_mode),
2617                        result, true, OPTAB_DIRECT);
2618   if (!temp)
2619     goto fail;
2620   if (temp != result)
2621     convert_move (result, temp, true);
2622
2623   emit_label (after_label);
2624   convert_move (target, result, true);
2625
2626   seq = get_insns ();
2627   end_sequence ();
2628
2629   add_equal_note (seq, target, CLZ, xop0, 0);
2630   emit_insn (seq);
2631   return target;
2632
2633  fail:
2634   end_sequence ();
2635   return 0;
2636 }
2637
2638 /* Try calculating
2639         (bswap:narrow x)
2640    as
2641         (lshiftrt:wide (bswap:wide x) ((width wide) - (width narrow))).  */
2642 static rtx
2643 widen_bswap (enum machine_mode mode, rtx op0, rtx target)
2644 {
2645   enum mode_class mclass = GET_MODE_CLASS (mode);
2646   enum machine_mode wider_mode;
2647   rtx x, last;
2648
2649   if (!CLASS_HAS_WIDER_MODES_P (mclass))
2650     return NULL_RTX;
2651
2652   for (wider_mode = GET_MODE_WIDER_MODE (mode);
2653        wider_mode != VOIDmode;
2654        wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2655     if (optab_handler (bswap_optab, wider_mode) != CODE_FOR_nothing)
2656       goto found;
2657   return NULL_RTX;
2658
2659  found:
2660   last = get_last_insn ();
2661
2662   x = widen_operand (op0, wider_mode, mode, true, true);
2663   x = expand_unop (wider_mode, bswap_optab, x, NULL_RTX, true);
2664
2665   gcc_assert (GET_MODE_PRECISION (wider_mode) == GET_MODE_BITSIZE (wider_mode)
2666               && GET_MODE_PRECISION (mode) == GET_MODE_BITSIZE (mode));
2667   if (x != 0)
2668     x = expand_shift (RSHIFT_EXPR, wider_mode, x,
2669                       GET_MODE_BITSIZE (wider_mode)
2670                       - GET_MODE_BITSIZE (mode),
2671                       NULL_RTX, true);
2672
2673   if (x != 0)
2674     {
2675       if (target == 0)
2676         target = gen_reg_rtx (mode);
2677       emit_move_insn (target, gen_lowpart (mode, x));
2678     }
2679   else
2680     delete_insns_since (last);
2681
2682   return target;
2683 }
2684
2685 /* Try calculating bswap as two bswaps of two word-sized operands.  */
2686
2687 static rtx
2688 expand_doubleword_bswap (enum machine_mode mode, rtx op, rtx target)
2689 {
2690   rtx t0, t1;
2691
2692   t1 = expand_unop (word_mode, bswap_optab,
2693                     operand_subword_force (op, 0, mode), NULL_RTX, true);
2694   t0 = expand_unop (word_mode, bswap_optab,
2695                     operand_subword_force (op, 1, mode), NULL_RTX, true);
2696
2697   if (target == 0 || !valid_multiword_target_p (target))
2698     target = gen_reg_rtx (mode);
2699   if (REG_P (target))
2700     emit_clobber (target);
2701   emit_move_insn (operand_subword (target, 0, 1, mode), t0);
2702   emit_move_insn (operand_subword (target, 1, 1, mode), t1);
2703
2704   return target;
2705 }
2706
2707 /* Try calculating (parity x) as (and (popcount x) 1), where
2708    popcount can also be done in a wider mode.  */
2709 static rtx
2710 expand_parity (enum machine_mode mode, rtx op0, rtx target)
2711 {
2712   enum mode_class mclass = GET_MODE_CLASS (mode);
2713   if (CLASS_HAS_WIDER_MODES_P (mclass))
2714     {
2715       enum machine_mode wider_mode;
2716       for (wider_mode = mode; wider_mode != VOIDmode;
2717            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2718         {
2719           if (optab_handler (popcount_optab, wider_mode) != CODE_FOR_nothing)
2720             {
2721               rtx xop0, temp, last;
2722
2723               last = get_last_insn ();
2724
2725               if (target == 0)
2726                 target = gen_reg_rtx (mode);
2727               xop0 = widen_operand (op0, wider_mode, mode, true, false);
2728               temp = expand_unop (wider_mode, popcount_optab, xop0, NULL_RTX,
2729                                   true);
2730               if (temp != 0)
2731                 temp = expand_binop (wider_mode, and_optab, temp, const1_rtx,
2732                                      target, true, OPTAB_DIRECT);
2733               if (temp == 0)
2734                 delete_insns_since (last);
2735
2736               return temp;
2737             }
2738         }
2739     }
2740   return 0;
2741 }
2742
2743 /* Try calculating ctz(x) as K - clz(x & -x) ,
2744    where K is GET_MODE_PRECISION(mode) - 1.
2745
2746    Both __builtin_ctz and __builtin_clz are undefined at zero, so we
2747    don't have to worry about what the hardware does in that case.  (If
2748    the clz instruction produces the usual value at 0, which is K, the
2749    result of this code sequence will be -1; expand_ffs, below, relies
2750    on this.  It might be nice to have it be K instead, for consistency
2751    with the (very few) processors that provide a ctz with a defined
2752    value, but that would take one more instruction, and it would be
2753    less convenient for expand_ffs anyway.  */
2754
2755 static rtx
2756 expand_ctz (enum machine_mode mode, rtx op0, rtx target)
2757 {
2758   rtx seq, temp;
2759
2760   if (optab_handler (clz_optab, mode) == CODE_FOR_nothing)
2761     return 0;
2762
2763   start_sequence ();
2764
2765   temp = expand_unop_direct (mode, neg_optab, op0, NULL_RTX, true);
2766   if (temp)
2767     temp = expand_binop (mode, and_optab, op0, temp, NULL_RTX,
2768                          true, OPTAB_DIRECT);
2769   if (temp)
2770     temp = expand_unop_direct (mode, clz_optab, temp, NULL_RTX, true);
2771   if (temp)
2772     temp = expand_binop (mode, sub_optab,
2773                          gen_int_mode (GET_MODE_PRECISION (mode) - 1, mode),
2774                          temp, target,
2775                          true, OPTAB_DIRECT);
2776   if (temp == 0)
2777     {
2778       end_sequence ();
2779       return 0;
2780     }
2781
2782   seq = get_insns ();
2783   end_sequence ();
2784
2785   add_equal_note (seq, temp, CTZ, op0, 0);
2786   emit_insn (seq);
2787   return temp;
2788 }
2789
2790
2791 /* Try calculating ffs(x) using ctz(x) if we have that instruction, or
2792    else with the sequence used by expand_clz.
2793
2794    The ffs builtin promises to return zero for a zero value and ctz/clz
2795    may have an undefined value in that case.  If they do not give us a
2796    convenient value, we have to generate a test and branch.  */
2797 static rtx
2798 expand_ffs (enum machine_mode mode, rtx op0, rtx target)
2799 {
2800   HOST_WIDE_INT val = 0;
2801   bool defined_at_zero = false;
2802   rtx temp, seq;
2803
2804   if (optab_handler (ctz_optab, mode) != CODE_FOR_nothing)
2805     {
2806       start_sequence ();
2807
2808       temp = expand_unop_direct (mode, ctz_optab, op0, 0, true);
2809       if (!temp)
2810         goto fail;
2811
2812       defined_at_zero = (CTZ_DEFINED_VALUE_AT_ZERO (mode, val) == 2);
2813     }
2814   else if (optab_handler (clz_optab, mode) != CODE_FOR_nothing)
2815     {
2816       start_sequence ();
2817       temp = expand_ctz (mode, op0, 0);
2818       if (!temp)
2819         goto fail;
2820
2821       if (CLZ_DEFINED_VALUE_AT_ZERO (mode, val) == 2)
2822         {
2823           defined_at_zero = true;
2824           val = (GET_MODE_PRECISION (mode) - 1) - val;
2825         }
2826     }
2827   else
2828     return 0;
2829
2830   if (defined_at_zero && val == -1)
2831     /* No correction needed at zero.  */;
2832   else
2833     {
2834       /* We don't try to do anything clever with the situation found
2835          on some processors (eg Alpha) where ctz(0:mode) ==
2836          bitsize(mode).  If someone can think of a way to send N to -1
2837          and leave alone all values in the range 0..N-1 (where N is a
2838          power of two), cheaper than this test-and-branch, please add it.
2839
2840          The test-and-branch is done after the operation itself, in case
2841          the operation sets condition codes that can be recycled for this.
2842          (This is true on i386, for instance.)  */
2843
2844       rtx nonzero_label = gen_label_rtx ();
2845       emit_cmp_and_jump_insns (op0, CONST0_RTX (mode), NE, 0,
2846                                mode, true, nonzero_label);
2847
2848       convert_move (temp, GEN_INT (-1), false);
2849       emit_label (nonzero_label);
2850     }
2851
2852   /* temp now has a value in the range -1..bitsize-1.  ffs is supposed
2853      to produce a value in the range 0..bitsize.  */
2854   temp = expand_binop (mode, add_optab, temp, gen_int_mode (1, mode),
2855                        target, false, OPTAB_DIRECT);
2856   if (!temp)
2857     goto fail;
2858
2859   seq = get_insns ();
2860   end_sequence ();
2861
2862   add_equal_note (seq, temp, FFS, op0, 0);
2863   emit_insn (seq);
2864   return temp;
2865
2866  fail:
2867   end_sequence ();
2868   return 0;
2869 }
2870
2871 /* Extract the OMODE lowpart from VAL, which has IMODE.  Under certain
2872    conditions, VAL may already be a SUBREG against which we cannot generate
2873    a further SUBREG.  In this case, we expect forcing the value into a
2874    register will work around the situation.  */
2875
2876 static rtx
2877 lowpart_subreg_maybe_copy (enum machine_mode omode, rtx val,
2878                            enum machine_mode imode)
2879 {
2880   rtx ret;
2881   ret = lowpart_subreg (omode, val, imode);
2882   if (ret == NULL)
2883     {
2884       val = force_reg (imode, val);
2885       ret = lowpart_subreg (omode, val, imode);
2886       gcc_assert (ret != NULL);
2887     }
2888   return ret;
2889 }
2890
2891 /* Expand a floating point absolute value or negation operation via a
2892    logical operation on the sign bit.  */
2893
2894 static rtx
2895 expand_absneg_bit (enum rtx_code code, enum machine_mode mode,
2896                    rtx op0, rtx target)
2897 {
2898   const struct real_format *fmt;
2899   int bitpos, word, nwords, i;
2900   enum machine_mode imode;
2901   double_int mask;
2902   rtx temp, insns;
2903
2904   /* The format has to have a simple sign bit.  */
2905   fmt = REAL_MODE_FORMAT (mode);
2906   if (fmt == NULL)
2907     return NULL_RTX;
2908
2909   bitpos = fmt->signbit_rw;
2910   if (bitpos < 0)
2911     return NULL_RTX;
2912
2913   /* Don't create negative zeros if the format doesn't support them.  */
2914   if (code == NEG && !fmt->has_signed_zero)
2915     return NULL_RTX;
2916
2917   if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
2918     {
2919       imode = int_mode_for_mode (mode);
2920       if (imode == BLKmode)
2921         return NULL_RTX;
2922       word = 0;
2923       nwords = 1;
2924     }
2925   else
2926     {
2927       imode = word_mode;
2928
2929       if (FLOAT_WORDS_BIG_ENDIAN)
2930         word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
2931       else
2932         word = bitpos / BITS_PER_WORD;
2933       bitpos = bitpos % BITS_PER_WORD;
2934       nwords = (GET_MODE_BITSIZE (mode) + BITS_PER_WORD - 1) / BITS_PER_WORD;
2935     }
2936
2937   mask = double_int_zero.set_bit (bitpos);
2938   if (code == ABS)
2939     mask = ~mask;
2940
2941   if (target == 0
2942       || target == op0
2943       || (nwords > 1 && !valid_multiword_target_p (target)))
2944     target = gen_reg_rtx (mode);
2945
2946   if (nwords > 1)
2947     {
2948       start_sequence ();
2949
2950       for (i = 0; i < nwords; ++i)
2951         {
2952           rtx targ_piece = operand_subword (target, i, 1, mode);
2953           rtx op0_piece = operand_subword_force (op0, i, mode);
2954
2955           if (i == word)
2956             {
2957               temp = expand_binop (imode, code == ABS ? and_optab : xor_optab,
2958                                    op0_piece,
2959                                    immed_double_int_const (mask, imode),
2960                                    targ_piece, 1, OPTAB_LIB_WIDEN);
2961               if (temp != targ_piece)
2962                 emit_move_insn (targ_piece, temp);
2963             }
2964           else
2965             emit_move_insn (targ_piece, op0_piece);
2966         }
2967
2968       insns = get_insns ();
2969       end_sequence ();
2970
2971       emit_insn (insns);
2972     }
2973   else
2974     {
2975       temp = expand_binop (imode, code == ABS ? and_optab : xor_optab,
2976                            gen_lowpart (imode, op0),
2977                            immed_double_int_const (mask, imode),
2978                            gen_lowpart (imode, target), 1, OPTAB_LIB_WIDEN);
2979       target = lowpart_subreg_maybe_copy (mode, temp, imode);
2980
2981       set_dst_reg_note (get_last_insn (), REG_EQUAL,
2982                         gen_rtx_fmt_e (code, mode, copy_rtx (op0)),
2983                         target);
2984     }
2985
2986   return target;
2987 }
2988
2989 /* As expand_unop, but will fail rather than attempt the operation in a
2990    different mode or with a libcall.  */
2991 static rtx
2992 expand_unop_direct (enum machine_mode mode, optab unoptab, rtx op0, rtx target,
2993              int unsignedp)
2994 {
2995   if (optab_handler (unoptab, mode) != CODE_FOR_nothing)
2996     {
2997       struct expand_operand ops[2];
2998       enum insn_code icode = optab_handler (unoptab, mode);
2999       rtx last = get_last_insn ();
3000       rtx pat;
3001
3002       create_output_operand (&ops[0], target, mode);
3003       create_convert_operand_from (&ops[1], op0, mode, unsignedp);
3004       pat = maybe_gen_insn (icode, 2, ops);
3005       if (pat)
3006         {
3007           if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
3008               && ! add_equal_note (pat, ops[0].value, optab_to_code (unoptab),
3009                                    ops[1].value, NULL_RTX))
3010             {
3011               delete_insns_since (last);
3012               return expand_unop (mode, unoptab, op0, NULL_RTX, unsignedp);
3013             }
3014
3015           emit_insn (pat);
3016
3017           return ops[0].value;
3018         }
3019     }
3020   return 0;
3021 }
3022
3023 /* Generate code to perform an operation specified by UNOPTAB
3024    on operand OP0, with result having machine-mode MODE.
3025
3026    UNSIGNEDP is for the case where we have to widen the operands
3027    to perform the operation.  It says to use zero-extension.
3028
3029    If TARGET is nonzero, the value
3030    is generated there, if it is convenient to do so.
3031    In all cases an rtx is returned for the locus of the value;
3032    this may or may not be TARGET.  */
3033
3034 rtx
3035 expand_unop (enum machine_mode mode, optab unoptab, rtx op0, rtx target,
3036              int unsignedp)
3037 {
3038   enum mode_class mclass = GET_MODE_CLASS (mode);
3039   enum machine_mode wider_mode;
3040   rtx temp;
3041   rtx libfunc;
3042
3043   temp = expand_unop_direct (mode, unoptab, op0, target, unsignedp);
3044   if (temp)
3045     return temp;
3046
3047   /* It can't be done in this mode.  Can we open-code it in a wider mode?  */
3048
3049   /* Widening (or narrowing) clz needs special treatment.  */
3050   if (unoptab == clz_optab)
3051     {
3052       temp = widen_leading (mode, op0, target, unoptab);
3053       if (temp)
3054         return temp;
3055
3056       if (GET_MODE_SIZE (mode) == 2 * UNITS_PER_WORD
3057           && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
3058         {
3059           temp = expand_doubleword_clz (mode, op0, target);
3060           if (temp)
3061             return temp;
3062         }
3063
3064       goto try_libcall;
3065     }
3066
3067   if (unoptab == clrsb_optab)
3068     {
3069       temp = widen_leading (mode, op0, target, unoptab);
3070       if (temp)
3071         return temp;
3072       goto try_libcall;
3073     }
3074
3075   /* Widening (or narrowing) bswap needs special treatment.  */
3076   if (unoptab == bswap_optab)
3077     {
3078       /* HImode is special because in this mode BSWAP is equivalent to ROTATE
3079          or ROTATERT.  First try these directly; if this fails, then try the
3080          obvious pair of shifts with allowed widening, as this will probably
3081          be always more efficient than the other fallback methods.  */
3082       if (mode == HImode)
3083         {
3084           rtx last, temp1, temp2;
3085
3086           if (optab_handler (rotl_optab, mode) != CODE_FOR_nothing)
3087             {
3088               temp = expand_binop (mode, rotl_optab, op0, GEN_INT (8), target,
3089                                    unsignedp, OPTAB_DIRECT);
3090               if (temp)
3091                 return temp;
3092              }
3093
3094           if (optab_handler (rotr_optab, mode) != CODE_FOR_nothing)
3095             {
3096               temp = expand_binop (mode, rotr_optab, op0, GEN_INT (8), target,
3097                                    unsignedp, OPTAB_DIRECT);
3098               if (temp)
3099                 return temp;
3100             }
3101
3102           last = get_last_insn ();
3103
3104           temp1 = expand_binop (mode, ashl_optab, op0, GEN_INT (8), NULL_RTX,
3105                                 unsignedp, OPTAB_WIDEN);
3106           temp2 = expand_binop (mode, lshr_optab, op0, GEN_INT (8), NULL_RTX,
3107                                 unsignedp, OPTAB_WIDEN);
3108           if (temp1 && temp2)
3109             {
3110               temp = expand_binop (mode, ior_optab, temp1, temp2, target,
3111                                    unsignedp, OPTAB_WIDEN);
3112               if (temp)
3113                 return temp;
3114             }
3115
3116           delete_insns_since (last);
3117         }
3118
3119       temp = widen_bswap (mode, op0, target);
3120       if (temp)
3121         return temp;
3122
3123       if (GET_MODE_SIZE (mode) == 2 * UNITS_PER_WORD
3124           && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
3125         {
3126           temp = expand_doubleword_bswap (mode, op0, target);
3127           if (temp)
3128             return temp;
3129         }
3130
3131       goto try_libcall;
3132     }
3133
3134   if (CLASS_HAS_WIDER_MODES_P (mclass))
3135     for (wider_mode = GET_MODE_WIDER_MODE (mode);
3136          wider_mode != VOIDmode;
3137          wider_mode = GET_MODE_WIDER_MODE (wider_mode))
3138       {
3139         if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
3140           {
3141             rtx xop0 = op0;
3142             rtx last = get_last_insn ();
3143
3144             /* For certain operations, we need not actually extend
3145                the narrow operand, as long as we will truncate the
3146                results to the same narrowness.  */
3147
3148             xop0 = widen_operand (xop0, wider_mode, mode, unsignedp,
3149                                   (unoptab == neg_optab
3150                                    || unoptab == one_cmpl_optab)
3151                                   && mclass == MODE_INT);
3152
3153             temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
3154                                 unsignedp);
3155
3156             if (temp)
3157               {
3158                 if (mclass != MODE_INT
3159                     || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
3160                   {
3161                     if (target == 0)
3162                       target = gen_reg_rtx (mode);
3163                     convert_move (target, temp, 0);
3164                     return target;
3165                   }
3166                 else
3167                   return gen_lowpart (mode, temp);
3168               }
3169             else
3170               delete_insns_since (last);
3171           }
3172       }
3173
3174   /* These can be done a word at a time.  */
3175   if (unoptab == one_cmpl_optab
3176       && mclass == MODE_INT
3177       && GET_MODE_SIZE (mode) > UNITS_PER_WORD
3178       && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
3179     {
3180       int i;
3181       rtx insns;
3182
3183       if (target == 0 || target == op0 || !valid_multiword_target_p (target))
3184         target = gen_reg_rtx (mode);
3185
3186       start_sequence ();
3187
3188       /* Do the actual arithmetic.  */
3189       for (i = 0; i < GET_MODE_BITSIZE (mode) / BITS_PER_WORD; i++)
3190         {
3191           rtx target_piece = operand_subword (target, i, 1, mode);
3192           rtx x = expand_unop (word_mode, unoptab,
3193                                operand_subword_force (op0, i, mode),
3194                                target_piece, unsignedp);
3195
3196           if (target_piece != x)
3197             emit_move_insn (target_piece, x);
3198         }
3199
3200       insns = get_insns ();
3201       end_sequence ();
3202
3203       emit_insn (insns);
3204       return target;
3205     }
3206
3207   if (optab_to_code (unoptab) == NEG)
3208     {
3209       /* Try negating floating point values by flipping the sign bit.  */
3210       if (SCALAR_FLOAT_MODE_P (mode))
3211         {
3212           temp = expand_absneg_bit (NEG, mode, op0, target);
3213           if (temp)
3214             return temp;
3215         }
3216
3217       /* If there is no negation pattern, and we have no negative zero,
3218          try subtracting from zero.  */
3219       if (!HONOR_SIGNED_ZEROS (mode))
3220         {
3221           temp = expand_binop (mode, (unoptab == negv_optab
3222                                       ? subv_optab : sub_optab),
3223                                CONST0_RTX (mode), op0, target,
3224                                unsignedp, OPTAB_DIRECT);
3225           if (temp)
3226             return temp;
3227         }
3228     }
3229
3230   /* Try calculating parity (x) as popcount (x) % 2.  */
3231   if (unoptab == parity_optab)
3232     {
3233       temp = expand_parity (mode, op0, target);
3234       if (temp)
3235         return temp;
3236     }
3237
3238   /* Try implementing ffs (x) in terms of clz (x).  */
3239   if (unoptab == ffs_optab)
3240     {
3241       temp = expand_ffs (mode, op0, target);
3242       if (temp)
3243         return temp;
3244     }
3245
3246   /* Try implementing ctz (x) in terms of clz (x).  */
3247   if (unoptab == ctz_optab)
3248     {
3249       temp = expand_ctz (mode, op0, target);
3250       if (temp)
3251         return temp;
3252     }
3253
3254  try_libcall:
3255   /* Now try a library call in this mode.  */
3256   libfunc = optab_libfunc (unoptab, mode);
3257   if (libfunc)
3258     {
3259       rtx insns;
3260       rtx value;
3261       rtx eq_value;
3262       enum machine_mode outmode = mode;
3263
3264       /* All of these functions return small values.  Thus we choose to
3265          have them return something that isn't a double-word.  */
3266       if (unoptab == ffs_optab || unoptab == clz_optab || unoptab == ctz_optab
3267           || unoptab == clrsb_optab || unoptab == popcount_optab
3268           || unoptab == parity_optab)
3269         outmode
3270           = GET_MODE (hard_libcall_value (TYPE_MODE (integer_type_node),
3271                                           optab_libfunc (unoptab, mode)));
3272
3273       start_sequence ();
3274
3275       /* Pass 1 for NO_QUEUE so we don't lose any increments
3276          if the libcall is cse'd or moved.  */
3277       value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST, outmode,
3278                                        1, op0, mode);
3279       insns = get_insns ();
3280       end_sequence ();
3281
3282       target = gen_reg_rtx (outmode);
3283       eq_value = gen_rtx_fmt_e (optab_to_code (unoptab), mode, op0);
3284       if (GET_MODE_SIZE (outmode) < GET_MODE_SIZE (mode))
3285         eq_value = simplify_gen_unary (TRUNCATE, outmode, eq_value, mode);
3286       else if (GET_MODE_SIZE (outmode) > GET_MODE_SIZE (mode))
3287         eq_value = simplify_gen_unary (ZERO_EXTEND, outmode, eq_value, mode);
3288       emit_libcall_block_1 (insns, target, value, eq_value,
3289                             trapv_unoptab_p (unoptab));
3290
3291       return target;
3292     }
3293
3294   /* It can't be done in this mode.  Can we do it in a wider mode?  */
3295
3296   if (CLASS_HAS_WIDER_MODES_P (mclass))
3297     {
3298       for (wider_mode = GET_MODE_WIDER_MODE (mode);
3299            wider_mode != VOIDmode;
3300            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
3301         {
3302           if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing
3303               || optab_libfunc (unoptab, wider_mode))
3304             {
3305               rtx xop0 = op0;
3306               rtx last = get_last_insn ();
3307
3308               /* For certain operations, we need not actually extend
3309                  the narrow operand, as long as we will truncate the
3310                  results to the same narrowness.  */
3311               xop0 = widen_operand (xop0, wider_mode, mode, unsignedp,
3312                                     (unoptab == neg_optab
3313                                      || unoptab == one_cmpl_optab
3314                                      || unoptab == bswap_optab)
3315                                     && mclass == MODE_INT);
3316
3317               temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
3318                                   unsignedp);
3319
3320               /* If we are generating clz using wider mode, adjust the
3321                  result.  Similarly for clrsb.  */
3322               if ((unoptab == clz_optab || unoptab == clrsb_optab)
3323                   && temp != 0)
3324                 temp = expand_binop
3325                   (wider_mode, sub_optab, temp,
3326                    gen_int_mode (GET_MODE_PRECISION (wider_mode)
3327                                  - GET_MODE_PRECISION (mode),
3328                                  wider_mode),
3329                    target, true, OPTAB_DIRECT);
3330
3331               /* Likewise for bswap.  */
3332               if (unoptab == bswap_optab && temp != 0)
3333                 {
3334                   gcc_assert (GET_MODE_PRECISION (wider_mode)
3335                               == GET_MODE_BITSIZE (wider_mode)
3336                               && GET_MODE_PRECISION (mode)
3337                                  == GET_MODE_BITSIZE (mode));
3338
3339                   temp = expand_shift (RSHIFT_EXPR, wider_mode, temp,
3340                                        GET_MODE_BITSIZE (wider_mode)
3341                                        - GET_MODE_BITSIZE (mode),
3342                                        NULL_RTX, true);
3343                 }
3344
3345               if (temp)
3346                 {
3347                   if (mclass != MODE_INT)
3348                     {
3349                       if (target == 0)
3350                         target = gen_reg_rtx (mode);
3351                       convert_move (target, temp, 0);
3352                       return target;
3353                     }
3354                   else
3355                     return gen_lowpart (mode, temp);
3356                 }
3357               else
3358                 delete_insns_since (last);
3359             }
3360         }
3361     }
3362
3363   /* One final attempt at implementing negation via subtraction,
3364      this time allowing widening of the operand.  */
3365   if (optab_to_code (unoptab) == NEG && !HONOR_SIGNED_ZEROS (mode))
3366     {
3367       rtx temp;
3368       temp = expand_binop (mode,
3369                            unoptab == negv_optab ? subv_optab : sub_optab,
3370                            CONST0_RTX (mode), op0,
3371                            target, unsignedp, OPTAB_LIB_WIDEN);
3372       if (temp)
3373         return temp;
3374     }
3375
3376   return 0;
3377 }
3378 \f
3379 /* Emit code to compute the absolute value of OP0, with result to
3380    TARGET if convenient.  (TARGET may be 0.)  The return value says
3381    where the result actually is to be found.
3382
3383    MODE is the mode of the operand; the mode of the result is
3384    different but can be deduced from MODE.
3385
3386  */
3387
3388 rtx
3389 expand_abs_nojump (enum machine_mode mode, rtx op0, rtx target,
3390                    int result_unsignedp)
3391 {
3392   rtx temp;
3393
3394   if (GET_MODE_CLASS (mode) != MODE_INT
3395       || ! flag_trapv)
3396     result_unsignedp = 1;
3397
3398   /* First try to do it with a special abs instruction.  */
3399   temp = expand_unop (mode, result_unsignedp ? abs_optab : absv_optab,
3400                       op0, target, 0);
3401   if (temp != 0)
3402     return temp;
3403
3404   /* For floating point modes, try clearing the sign bit.  */
3405   if (SCALAR_FLOAT_MODE_P (mode))
3406     {
3407       temp = expand_absneg_bit (ABS, mode, op0, target);
3408       if (temp)
3409         return temp;
3410     }
3411
3412   /* If we have a MAX insn, we can do this as MAX (x, -x).  */
3413   if (optab_handler (smax_optab, mode) != CODE_FOR_nothing
3414       && !HONOR_SIGNED_ZEROS (mode))
3415     {
3416       rtx last = get_last_insn ();
3417
3418       temp = expand_unop (mode, result_unsignedp ? neg_optab : negv_optab,
3419                           op0, NULL_RTX, 0);
3420       if (temp != 0)
3421         temp = expand_binop (mode, smax_optab, op0, temp, target, 0,
3422                              OPTAB_WIDEN);
3423
3424       if (temp != 0)
3425         return temp;
3426
3427       delete_insns_since (last);
3428     }
3429
3430   /* If this machine has expensive jumps, we can do integer absolute
3431      value of X as (((signed) x >> (W-1)) ^ x) - ((signed) x >> (W-1)),
3432      where W is the width of MODE.  */
3433
3434   if (GET_MODE_CLASS (mode) == MODE_INT
3435       && BRANCH_COST (optimize_insn_for_speed_p (),
3436                       false) >= 2)
3437     {
3438       rtx extended = expand_shift (RSHIFT_EXPR, mode, op0,
3439                                    GET_MODE_PRECISION (mode) - 1,
3440                                    NULL_RTX, 0);
3441
3442       temp = expand_binop (mode, xor_optab, extended, op0, target, 0,
3443                            OPTAB_LIB_WIDEN);
3444       if (temp != 0)
3445         temp = expand_binop (mode, result_unsignedp ? sub_optab : subv_optab,
3446                              temp, extended, target, 0, OPTAB_LIB_WIDEN);
3447
3448       if (temp != 0)
3449         return temp;
3450     }
3451
3452   return NULL_RTX;
3453 }
3454
3455 rtx
3456 expand_abs (enum machine_mode mode, rtx op0, rtx target,
3457             int result_unsignedp, int safe)
3458 {
3459   rtx temp, op1;
3460
3461   if (GET_MODE_CLASS (mode) != MODE_INT
3462       || ! flag_trapv)
3463     result_unsignedp = 1;
3464
3465   temp = expand_abs_nojump (mode, op0, target, result_unsignedp);
3466   if (temp != 0)
3467     return temp;
3468
3469   /* If that does not win, use conditional jump and negate.  */
3470
3471   /* It is safe to use the target if it is the same
3472      as the source if this is also a pseudo register */
3473   if (op0 == target && REG_P (op0)
3474       && REGNO (op0) >= FIRST_PSEUDO_REGISTER)
3475     safe = 1;
3476
3477   op1 = gen_label_rtx ();
3478   if (target == 0 || ! safe
3479       || GET_MODE (target) != mode
3480       || (MEM_P (target) && MEM_VOLATILE_P (target))
3481       || (REG_P (target)
3482           && REGNO (target) < FIRST_PSEUDO_REGISTER))
3483     target = gen_reg_rtx (mode);
3484
3485   emit_move_insn (target, op0);
3486   NO_DEFER_POP;
3487
3488   do_compare_rtx_and_jump (target, CONST0_RTX (mode), GE, 0, mode,
3489                            NULL_RTX, NULL_RTX, op1, -1);
3490
3491   op0 = expand_unop (mode, result_unsignedp ? neg_optab : negv_optab,
3492                      target, target, 0);
3493   if (op0 != target)
3494     emit_move_insn (target, op0);
3495   emit_label (op1);
3496   OK_DEFER_POP;
3497   return target;
3498 }
3499
3500 /* Emit code to compute the one's complement absolute value of OP0
3501    (if (OP0 < 0) OP0 = ~OP0), with result to TARGET if convenient.
3502    (TARGET may be NULL_RTX.)  The return value says where the result
3503    actually is to be found.
3504
3505    MODE is the mode of the operand; the mode of the result is
3506    different but can be deduced from MODE.  */
3507
3508 rtx
3509 expand_one_cmpl_abs_nojump (enum machine_mode mode, rtx op0, rtx target)
3510 {
3511   rtx temp;
3512
3513   /* Not applicable for floating point modes.  */
3514   if (FLOAT_MODE_P (mode))
3515     return NULL_RTX;
3516
3517   /* If we have a MAX insn, we can do this as MAX (x, ~x).  */
3518   if (optab_handler (smax_optab, mode) != CODE_FOR_nothing)
3519     {
3520       rtx last = get_last_insn ();
3521
3522       temp = expand_unop (mode, one_cmpl_optab, op0, NULL_RTX, 0);
3523       if (temp != 0)
3524         temp = expand_binop (mode, smax_optab, op0, temp, target, 0,
3525                              OPTAB_WIDEN);
3526
3527       if (temp != 0)
3528         return temp;
3529
3530       delete_insns_since (last);
3531     }
3532
3533   /* If this machine has expensive jumps, we can do one's complement
3534      absolute value of X as (((signed) x >> (W-1)) ^ x).  */
3535
3536   if (GET_MODE_CLASS (mode) == MODE_INT
3537       && BRANCH_COST (optimize_insn_for_speed_p (),
3538                      false) >= 2)
3539     {
3540       rtx extended = expand_shift (RSHIFT_EXPR, mode, op0,
3541                                    GET_MODE_PRECISION (mode) - 1,
3542                                    NULL_RTX, 0);
3543
3544       temp = expand_binop (mode, xor_optab, extended, op0, target, 0,
3545                            OPTAB_LIB_WIDEN);
3546
3547       if (temp != 0)
3548         return temp;
3549     }
3550
3551   return NULL_RTX;
3552 }
3553
3554 /* A subroutine of expand_copysign, perform the copysign operation using the
3555    abs and neg primitives advertised to exist on the target.  The assumption
3556    is that we have a split register file, and leaving op0 in fp registers,
3557    and not playing with subregs so much, will help the register allocator.  */
3558
3559 static rtx
3560 expand_copysign_absneg (enum machine_mode mode, rtx op0, rtx op1, rtx target,
3561                         int bitpos, bool op0_is_abs)
3562 {
3563   enum machine_mode imode;
3564   enum insn_code icode;
3565   rtx sign, label;
3566
3567   if (target == op1)
3568     target = NULL_RTX;
3569
3570   /* Check if the back end provides an insn that handles signbit for the
3571      argument's mode. */
3572   icode = optab_handler (signbit_optab, mode);
3573   if (icode != CODE_FOR_nothing)
3574     {
3575       imode = insn_data[(int) icode].operand[0].mode;
3576       sign = gen_reg_rtx (imode);
3577       emit_unop_insn (icode, sign, op1, UNKNOWN);
3578     }
3579   else
3580     {
3581       double_int mask;
3582
3583       if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
3584         {
3585           imode = int_mode_for_mode (mode);
3586           if (imode == BLKmode)
3587             return NULL_RTX;
3588           op1 = gen_lowpart (imode, op1);
3589         }
3590       else
3591         {
3592           int word;
3593
3594           imode = word_mode;
3595           if (FLOAT_WORDS_BIG_ENDIAN)
3596             word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
3597           else
3598             word = bitpos / BITS_PER_WORD;
3599           bitpos = bitpos % BITS_PER_WORD;
3600           op1 = operand_subword_force (op1, word, mode);
3601         }
3602
3603       mask = double_int_zero.set_bit (bitpos);
3604
3605       sign = expand_binop (imode, and_optab, op1,
3606                            immed_double_int_const (mask, imode),
3607                            NULL_RTX, 1, OPTAB_LIB_WIDEN);
3608     }
3609
3610   if (!op0_is_abs)
3611     {
3612       op0 = expand_unop (mode, abs_optab, op0, target, 0);
3613       if (op0 == NULL)
3614         return NULL_RTX;
3615       target = op0;
3616     }
3617   else
3618     {
3619       if (target == NULL_RTX)
3620         target = copy_to_reg (op0);
3621       else
3622         emit_move_insn (target, op0);
3623     }
3624
3625   label = gen_label_rtx ();
3626   emit_cmp_and_jump_insns (sign, const0_rtx, EQ, NULL_RTX, imode, 1, label);
3627
3628   if (CONST_DOUBLE_AS_FLOAT_P (op0))
3629     op0 = simplify_unary_operation (NEG, mode, op0, mode);
3630   else
3631     op0 = expand_unop (mode, neg_optab, op0, target, 0);
3632   if (op0 != target)
3633     emit_move_insn (target, op0);
3634
3635   emit_label (label);
3636
3637   return target;
3638 }
3639
3640
3641 /* A subroutine of expand_copysign, perform the entire copysign operation
3642    with integer bitmasks.  BITPOS is the position of the sign bit; OP0_IS_ABS
3643    is true if op0 is known to have its sign bit clear.  */
3644
3645 static rtx
3646 expand_copysign_bit (enum machine_mode mode, rtx op0, rtx op1, rtx target,
3647                      int bitpos, bool op0_is_abs)
3648 {
3649   enum machine_mode imode;
3650   double_int mask;
3651   int word, nwords, i;
3652   rtx temp, insns;
3653
3654   if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
3655     {
3656       imode = int_mode_for_mode (mode);
3657       if (imode == BLKmode)
3658         return NULL_RTX;
3659       word = 0;
3660       nwords = 1;
3661     }
3662   else
3663     {
3664       imode = word_mode;
3665
3666       if (FLOAT_WORDS_BIG_ENDIAN)
3667         word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
3668       else
3669         word = bitpos / BITS_PER_WORD;
3670       bitpos = bitpos % BITS_PER_WORD;
3671       nwords = (GET_MODE_BITSIZE (mode) + BITS_PER_WORD - 1) / BITS_PER_WORD;
3672     }
3673
3674   mask = double_int_zero.set_bit (bitpos);
3675
3676   if (target == 0
3677       || target == op0
3678       || target == op1
3679       || (nwords > 1 && !valid_multiword_target_p (target)))
3680     target = gen_reg_rtx (mode);
3681
3682   if (nwords > 1)
3683     {
3684       start_sequence ();
3685
3686       for (i = 0; i < nwords; ++i)
3687         {
3688           rtx targ_piece = operand_subword (target, i, 1, mode);
3689           rtx op0_piece = operand_subword_force (op0, i, mode);
3690
3691           if (i == word)
3692             {
3693               if (!op0_is_abs)
3694                 op0_piece
3695                   = expand_binop (imode, and_optab, op0_piece,
3696                                   immed_double_int_const (~mask, imode),
3697                                   NULL_RTX, 1, OPTAB_LIB_WIDEN);
3698
3699               op1 = expand_binop (imode, and_optab,
3700                                   operand_subword_force (op1, i, mode),
3701                                   immed_double_int_const (mask, imode),
3702                                   NULL_RTX, 1, OPTAB_LIB_WIDEN);
3703
3704               temp = expand_binop (imode, ior_optab, op0_piece, op1,
3705                                    targ_piece, 1, OPTAB_LIB_WIDEN);
3706               if (temp != targ_piece)
3707                 emit_move_insn (targ_piece, temp);
3708             }
3709           else
3710             emit_move_insn (targ_piece, op0_piece);
3711         }
3712
3713       insns = get_insns ();
3714       end_sequence ();
3715
3716       emit_insn (insns);
3717     }
3718   else
3719     {
3720       op1 = expand_binop (imode, and_optab, gen_lowpart (imode, op1),
3721                           immed_double_int_const (mask, imode),
3722                           NULL_RTX, 1, OPTAB_LIB_WIDEN);
3723
3724       op0 = gen_lowpart (imode, op0);
3725       if (!op0_is_abs)
3726         op0 = expand_binop (imode, and_optab, op0,
3727                             immed_double_int_const (~mask, imode),
3728                             NULL_RTX, 1, OPTAB_LIB_WIDEN);
3729
3730       temp = expand_binop (imode, ior_optab, op0, op1,
3731                            gen_lowpart (imode, target), 1, OPTAB_LIB_WIDEN);
3732       target = lowpart_subreg_maybe_copy (mode, temp, imode);
3733     }
3734
3735   return target;
3736 }
3737
3738 /* Expand the C99 copysign operation.  OP0 and OP1 must be the same
3739    scalar floating point mode.  Return NULL if we do not know how to
3740    expand the operation inline.  */
3741
3742 rtx
3743 expand_copysign (rtx op0, rtx op1, rtx target)
3744 {
3745   enum machine_mode mode = GET_MODE (op0);
3746   const struct real_format *fmt;
3747   bool op0_is_abs;
3748   rtx temp;
3749
3750   gcc_assert (SCALAR_FLOAT_MODE_P (mode));
3751   gcc_assert (GET_MODE (op1) == mode);
3752
3753   /* First try to do it with a special instruction.  */
3754   temp = expand_binop (mode, copysign_optab, op0, op1,
3755                        target, 0, OPTAB_DIRECT);
3756   if (temp)
3757     return temp;
3758
3759   fmt = REAL_MODE_FORMAT (mode);
3760   if (fmt == NULL || !fmt->has_signed_zero)
3761     return NULL_RTX;
3762
3763   op0_is_abs = false;
3764   if (CONST_DOUBLE_AS_FLOAT_P (op0))
3765     {
3766       if (real_isneg (CONST_DOUBLE_REAL_VALUE (op0)))
3767         op0 = simplify_unary_operation (ABS, mode, op0, mode);
3768       op0_is_abs = true;
3769     }
3770
3771   if (fmt->signbit_ro >= 0
3772       && (CONST_DOUBLE_AS_FLOAT_P (op0)
3773           || (optab_handler (neg_optab, mode) != CODE_FOR_nothing
3774               && optab_handler (abs_optab, mode) != CODE_FOR_nothing)))
3775     {
3776       temp = expand_copysign_absneg (mode, op0, op1, target,
3777                                      fmt->signbit_ro, op0_is_abs);
3778       if (temp)
3779         return temp;
3780     }
3781
3782   if (fmt->signbit_rw < 0)
3783     return NULL_RTX;
3784   return expand_copysign_bit (mode, op0, op1, target,
3785                               fmt->signbit_rw, op0_is_abs);
3786 }
3787 \f
3788 /* Generate an instruction whose insn-code is INSN_CODE,
3789    with two operands: an output TARGET and an input OP0.
3790    TARGET *must* be nonzero, and the output is always stored there.
3791    CODE is an rtx code such that (CODE OP0) is an rtx that describes
3792    the value that is stored into TARGET.
3793
3794    Return false if expansion failed.  */
3795
3796 bool
3797 maybe_emit_unop_insn (enum insn_code icode, rtx target, rtx op0,
3798                       enum rtx_code code)
3799 {
3800   struct expand_operand ops[2];
3801   rtx pat;
3802
3803   create_output_operand (&ops[0], target, GET_MODE (target));
3804   create_input_operand (&ops[1], op0, GET_MODE (op0));
3805   pat = maybe_gen_insn (icode, 2, ops);
3806   if (!pat)
3807     return false;
3808
3809   if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX && code != UNKNOWN)
3810     add_equal_note (pat, ops[0].value, code, ops[1].value, NULL_RTX);
3811
3812   emit_insn (pat);
3813
3814   if (ops[0].value != target)
3815     emit_move_insn (target, ops[0].value);
3816   return true;
3817 }
3818 /* Generate an instruction whose insn-code is INSN_CODE,
3819    with two operands: an output TARGET and an input OP0.
3820    TARGET *must* be nonzero, and the output is always stored there.
3821    CODE is an rtx code such that (CODE OP0) is an rtx that describes
3822    the value that is stored into TARGET.  */
3823
3824 void
3825 emit_unop_insn (enum insn_code icode, rtx target, rtx op0, enum rtx_code code)
3826 {
3827   bool ok = maybe_emit_unop_insn (icode, target, op0, code);
3828   gcc_assert (ok);
3829 }
3830 \f
3831 struct no_conflict_data
3832 {
3833   rtx target, first, insn;
3834   bool must_stay;
3835 };
3836
3837 /* Called via note_stores by emit_libcall_block.  Set P->must_stay if
3838    the currently examined clobber / store has to stay in the list of
3839    insns that constitute the actual libcall block.  */
3840 static void
3841 no_conflict_move_test (rtx dest, const_rtx set, void *p0)
3842 {
3843   struct no_conflict_data *p= (struct no_conflict_data *) p0;
3844
3845   /* If this inns directly contributes to setting the target, it must stay.  */
3846   if (reg_overlap_mentioned_p (p->target, dest))
3847     p->must_stay = true;
3848   /* If we haven't committed to keeping any other insns in the list yet,
3849      there is nothing more to check.  */
3850   else if (p->insn == p->first)
3851     return;
3852   /* If this insn sets / clobbers a register that feeds one of the insns
3853      already in the list, this insn has to stay too.  */
3854   else if (reg_overlap_mentioned_p (dest, PATTERN (p->first))
3855            || (CALL_P (p->first) && (find_reg_fusage (p->first, USE, dest)))
3856            || reg_used_between_p (dest, p->first, p->insn)
3857            /* Likewise if this insn depends on a register set by a previous
3858               insn in the list, or if it sets a result (presumably a hard
3859               register) that is set or clobbered by a previous insn.
3860               N.B. the modified_*_p (SET_DEST...) tests applied to a MEM
3861               SET_DEST perform the former check on the address, and the latter
3862               check on the MEM.  */
3863            || (GET_CODE (set) == SET
3864                && (modified_in_p (SET_SRC (set), p->first)
3865                    || modified_in_p (SET_DEST (set), p->first)
3866                    || modified_between_p (SET_SRC (set), p->first, p->insn)
3867                    || modified_between_p (SET_DEST (set), p->first, p->insn))))
3868     p->must_stay = true;
3869 }
3870
3871 \f
3872 /* Emit code to make a call to a constant function or a library call.
3873
3874    INSNS is a list containing all insns emitted in the call.
3875    These insns leave the result in RESULT.  Our block is to copy RESULT
3876    to TARGET, which is logically equivalent to EQUIV.
3877
3878    We first emit any insns that set a pseudo on the assumption that these are
3879    loading constants into registers; doing so allows them to be safely cse'ed
3880    between blocks.  Then we emit all the other insns in the block, followed by
3881    an insn to move RESULT to TARGET.  This last insn will have a REQ_EQUAL
3882    note with an operand of EQUIV.  */
3883
3884 static void
3885 emit_libcall_block_1 (rtx insns, rtx target, rtx result, rtx equiv,
3886                       bool equiv_may_trap)
3887 {
3888   rtx final_dest = target;
3889   rtx next, last, insn;
3890
3891   /* If this is a reg with REG_USERVAR_P set, then it could possibly turn
3892      into a MEM later.  Protect the libcall block from this change.  */
3893   if (! REG_P (target) || REG_USERVAR_P (target))
3894     target = gen_reg_rtx (GET_MODE (target));
3895
3896   /* If we're using non-call exceptions, a libcall corresponding to an
3897      operation that may trap may also trap.  */
3898   /* ??? See the comment in front of make_reg_eh_region_note.  */
3899   if (cfun->can_throw_non_call_exceptions
3900       && (equiv_may_trap || may_trap_p (equiv)))
3901     {
3902       for (insn = insns; insn; insn = NEXT_INSN (insn))
3903         if (CALL_P (insn))
3904           {
3905             rtx note = find_reg_note (insn, REG_EH_REGION, NULL_RTX);
3906             if (note)
3907               {
3908                 int lp_nr = INTVAL (XEXP (note, 0));
3909                 if (lp_nr == 0 || lp_nr == INT_MIN)
3910                   remove_note (insn, note);
3911               }
3912           }
3913     }
3914   else
3915     {
3916       /* Look for any CALL_INSNs in this sequence, and attach a REG_EH_REGION
3917          reg note to indicate that this call cannot throw or execute a nonlocal
3918          goto (unless there is already a REG_EH_REGION note, in which case
3919          we update it).  */
3920       for (insn = insns; insn; insn = NEXT_INSN (insn))
3921         if (CALL_P (insn))
3922           make_reg_eh_region_note_nothrow_nononlocal (insn);
3923     }
3924
3925   /* First emit all insns that set pseudos.  Remove them from the list as
3926      we go.  Avoid insns that set pseudos which were referenced in previous
3927      insns.  These can be generated by move_by_pieces, for example,
3928      to update an address.  Similarly, avoid insns that reference things
3929      set in previous insns.  */
3930
3931   for (insn = insns; insn; insn = next)
3932     {
3933       rtx set = single_set (insn);
3934
3935       next = NEXT_INSN (insn);
3936
3937       if (set != 0 && REG_P (SET_DEST (set))
3938           && REGNO (SET_DEST (set)) >= FIRST_PSEUDO_REGISTER)
3939         {
3940           struct no_conflict_data data;
3941
3942           data.target = const0_rtx;
3943           data.first = insns;
3944           data.insn = insn;
3945           data.must_stay = 0;
3946           note_stores (PATTERN (insn), no_conflict_move_test, &data);
3947           if (! data.must_stay)
3948             {
3949               if (PREV_INSN (insn))
3950                 NEXT_INSN (PREV_INSN (insn)) = next;
3951               else
3952                 insns = next;
3953
3954               if (next)
3955                 PREV_INSN (next) = PREV_INSN (insn);
3956
3957               add_insn (insn);
3958             }
3959         }
3960
3961       /* Some ports use a loop to copy large arguments onto the stack.
3962          Don't move anything outside such a loop.  */
3963       if (LABEL_P (insn))
3964         break;
3965     }
3966
3967   /* Write the remaining insns followed by the final copy.  */
3968   for (insn = insns; insn; insn = next)
3969     {
3970       next = NEXT_INSN (insn);
3971
3972       add_insn (insn);
3973     }
3974
3975   last = emit_move_insn (target, result);
3976   set_dst_reg_note (last, REG_EQUAL, copy_rtx (equiv), target);
3977
3978   if (final_dest != target)
3979     emit_move_insn (final_dest, target);
3980 }
3981
3982 void
3983 emit_libcall_block (rtx insns, rtx target, rtx result, rtx equiv)
3984 {
3985   emit_libcall_block_1 (insns, target, result, equiv, false);
3986 }
3987 \f
3988 /* Nonzero if we can perform a comparison of mode MODE straightforwardly.
3989    PURPOSE describes how this comparison will be used.  CODE is the rtx
3990    comparison code we will be using.
3991
3992    ??? Actually, CODE is slightly weaker than that.  A target is still
3993    required to implement all of the normal bcc operations, but not
3994    required to implement all (or any) of the unordered bcc operations.  */
3995
3996 int
3997 can_compare_p (enum rtx_code code, enum machine_mode mode,
3998                enum can_compare_purpose purpose)
3999 {
4000   rtx test;
4001   test = gen_rtx_fmt_ee (code, mode, const0_rtx, const0_rtx);
4002   do
4003     {
4004       enum insn_code icode;
4005
4006       if (purpose == ccp_jump
4007           && (icode = optab_handler (cbranch_optab, mode)) != CODE_FOR_nothing
4008           && insn_operand_matches (icode, 0, test))
4009         return 1;
4010       if (purpose == ccp_store_flag
4011           && (icode = optab_handler (cstore_optab, mode)) != CODE_FOR_nothing
4012           && insn_operand_matches (icode, 1, test))
4013         return 1;
4014       if (purpose == ccp_cmov
4015           && optab_handler (cmov_optab, mode) != CODE_FOR_nothing)
4016         return 1;
4017
4018       mode = GET_MODE_WIDER_MODE (mode);
4019       PUT_MODE (test, mode);
4020     }
4021   while (mode != VOIDmode);
4022
4023   return 0;
4024 }
4025
4026 /* This function is called when we are going to emit a compare instruction that
4027    compares the values found in *PX and *PY, using the rtl operator COMPARISON.
4028
4029    *PMODE is the mode of the inputs (in case they are const_int).
4030    *PUNSIGNEDP nonzero says that the operands are unsigned;
4031    this matters if they need to be widened (as given by METHODS).
4032
4033    If they have mode BLKmode, then SIZE specifies the size of both operands.
4034
4035    This function performs all the setup necessary so that the caller only has
4036    to emit a single comparison insn.  This setup can involve doing a BLKmode
4037    comparison or emitting a library call to perform the comparison if no insn
4038    is available to handle it.
4039    The values which are passed in through pointers can be modified; the caller
4040    should perform the comparison on the modified values.  Constant
4041    comparisons must have already been folded.  */
4042
4043 static void
4044 prepare_cmp_insn (rtx x, rtx y, enum rtx_code comparison, rtx size,
4045                   int unsignedp, enum optab_methods methods,
4046                   rtx *ptest, enum machine_mode *pmode)
4047 {
4048   enum machine_mode mode = *pmode;
4049   rtx libfunc, test;
4050   enum machine_mode cmp_mode;
4051   enum mode_class mclass;
4052
4053   /* The other methods are not needed.  */
4054   gcc_assert (methods == OPTAB_DIRECT || methods == OPTAB_WIDEN
4055               || methods == OPTAB_LIB_WIDEN);
4056
4057   /* If we are optimizing, force expensive constants into a register.  */
4058   if (CONSTANT_P (x) && optimize
4059       && (rtx_cost (x, COMPARE, 0, optimize_insn_for_speed_p ())
4060           > COSTS_N_INSNS (1)))
4061     x = force_reg (mode, x);
4062
4063   if (CONSTANT_P (y) && optimize
4064       && (rtx_cost (y, COMPARE, 1, optimize_insn_for_speed_p ())
4065           > COSTS_N_INSNS (1)))
4066     y = force_reg (mode, y);
4067
4068 #ifdef HAVE_cc0
4069   /* Make sure if we have a canonical comparison.  The RTL
4070      documentation states that canonical comparisons are required only
4071      for targets which have cc0.  */
4072   gcc_assert (!CONSTANT_P (x) || CONSTANT_P (y));
4073 #endif
4074
4075   /* Don't let both operands fail to indicate the mode.  */
4076   if (GET_MODE (x) == VOIDmode && GET_MODE (y) == VOIDmode)
4077     x = force_reg (mode, x);
4078   if (mode == VOIDmode)
4079     mode = GET_MODE (x) != VOIDmode ? GET_MODE (x) : GET_MODE (y);
4080
4081   /* Handle all BLKmode compares.  */
4082
4083   if (mode == BLKmode)
4084     {
4085       enum machine_mode result_mode;
4086       enum insn_code cmp_code;
4087       tree length_type;
4088       rtx libfunc;
4089       rtx result;
4090       rtx opalign
4091         = GEN_INT (MIN (MEM_ALIGN (x), MEM_ALIGN (y)) / BITS_PER_UNIT);
4092
4093       gcc_assert (size);
4094
4095       /* Try to use a memory block compare insn - either cmpstr
4096          or cmpmem will do.  */
4097       for (cmp_mode = GET_CLASS_NARROWEST_MODE (MODE_INT);
4098            cmp_mode != VOIDmode;
4099            cmp_mode = GET_MODE_WIDER_MODE (cmp_mode))
4100         {
4101           cmp_code = direct_optab_handler (cmpmem_optab, cmp_mode);
4102           if (cmp_code == CODE_FOR_nothing)
4103             cmp_code = direct_optab_handler (cmpstr_optab, cmp_mode);
4104           if (cmp_code == CODE_FOR_nothing)
4105             cmp_code = direct_optab_handler (cmpstrn_optab, cmp_mode);
4106           if (cmp_code == CODE_FOR_nothing)
4107             continue;
4108
4109           /* Must make sure the size fits the insn's mode.  */
4110           if ((CONST_INT_P (size)
4111                && INTVAL (size) >= (1 << GET_MODE_BITSIZE (cmp_mode)))
4112               || (GET_MODE_BITSIZE (GET_MODE (size))
4113                   > GET_MODE_BITSIZE (cmp_mode)))
4114             continue;
4115
4116           result_mode = insn_data[cmp_code].operand[0].mode;
4117           result = gen_reg_rtx (result_mode);
4118           size = convert_to_mode (cmp_mode, size, 1);
4119           emit_insn (GEN_FCN (cmp_code) (result, x, y, size, opalign));
4120
4121           *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, result, const0_rtx);
4122           *pmode = result_mode;
4123           return;
4124         }
4125
4126       if (methods != OPTAB_LIB && methods != OPTAB_LIB_WIDEN)
4127         goto fail;
4128
4129       /* Otherwise call a library function, memcmp.  */
4130       libfunc = memcmp_libfunc;
4131       length_type = sizetype;
4132       result_mode = TYPE_MODE (integer_type_node);
4133       cmp_mode = TYPE_MODE (length_type);
4134       size = convert_to_mode (TYPE_MODE (length_type), size,
4135                               TYPE_UNSIGNED (length_type));
4136
4137       result = emit_library_call_value (libfunc, 0, LCT_PURE,
4138                                         result_mode, 3,
4139                                         XEXP (x, 0), Pmode,
4140                                         XEXP (y, 0), Pmode,
4141                                         size, cmp_mode);
4142       x = result;
4143       y = const0_rtx;
4144       mode = result_mode;
4145       methods = OPTAB_LIB_WIDEN;
4146       unsignedp = false;
4147     }
4148
4149   /* Don't allow operands to the compare to trap, as that can put the
4150      compare and branch in different basic blocks.  */
4151   if (cfun->can_throw_non_call_exceptions)
4152     {
4153       if (may_trap_p (x))
4154         x = force_reg (mode, x);
4155       if (may_trap_p (y))
4156         y = force_reg (mode, y);
4157     }
4158
4159   if (GET_MODE_CLASS (mode) == MODE_CC)
4160     {
4161       gcc_assert (can_compare_p (comparison, CCmode, ccp_jump));
4162       *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, x, y);
4163       return;
4164     }
4165
4166   mclass = GET_MODE_CLASS (mode);
4167   test = gen_rtx_fmt_ee (comparison, VOIDmode, x, y);
4168   cmp_mode = mode;
4169   do
4170    {
4171       enum insn_code icode;
4172       icode = optab_handler (cbranch_optab, cmp_mode);
4173       if (icode != CODE_FOR_nothing
4174           && insn_operand_matches (icode, 0, test))
4175         {
4176           rtx last = get_last_insn ();
4177           rtx op0 = prepare_operand (icode, x, 1, mode, cmp_mode, unsignedp);
4178           rtx op1 = prepare_operand (icode, y, 2, mode, cmp_mode, unsignedp);
4179           if (op0 && op1
4180               && insn_operand_matches (icode, 1, op0)
4181               && insn_operand_matches (icode, 2, op1))
4182             {
4183               XEXP (test, 0) = op0;
4184               XEXP (test, 1) = op1;
4185               *ptest = test;
4186               *pmode = cmp_mode;
4187               return;
4188             }
4189           delete_insns_since (last);
4190         }
4191
4192       if (methods == OPTAB_DIRECT || !CLASS_HAS_WIDER_MODES_P (mclass))
4193         break;
4194       cmp_mode = GET_MODE_WIDER_MODE (cmp_mode);
4195     }
4196   while (cmp_mode != VOIDmode);
4197
4198   if (methods != OPTAB_LIB_WIDEN)
4199     goto fail;
4200
4201   if (!SCALAR_FLOAT_MODE_P (mode))
4202     {
4203       rtx result;
4204       enum machine_mode ret_mode;
4205
4206       /* Handle a libcall just for the mode we are using.  */
4207       libfunc = optab_libfunc (cmp_optab, mode);
4208       gcc_assert (libfunc);
4209
4210       /* If we want unsigned, and this mode has a distinct unsigned
4211          comparison routine, use that.  */
4212       if (unsignedp)
4213         {
4214           rtx ulibfunc = optab_libfunc (ucmp_optab, mode);
4215           if (ulibfunc)
4216             libfunc = ulibfunc;
4217         }
4218
4219       ret_mode = targetm.libgcc_cmp_return_mode ();
4220       result = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
4221                                         ret_mode, 2, x, mode, y, mode);
4222
4223       /* There are two kinds of comparison routines. Biased routines
4224          return 0/1/2, and unbiased routines return -1/0/1. Other parts
4225          of gcc expect that the comparison operation is equivalent
4226          to the modified comparison. For signed comparisons compare the
4227          result against 1 in the biased case, and zero in the unbiased
4228          case. For unsigned comparisons always compare against 1 after
4229          biasing the unbiased result by adding 1. This gives us a way to
4230          represent LTU.
4231          The comparisons in the fixed-point helper library are always
4232          biased.  */
4233       x = result;
4234       y = const1_rtx;
4235
4236       if (!TARGET_LIB_INT_CMP_BIASED && !ALL_FIXED_POINT_MODE_P (mode))
4237         {
4238           if (unsignedp)
4239             x = plus_constant (ret_mode, result, 1);
4240           else
4241             y = const0_rtx;
4242         }
4243
4244       *pmode = ret_mode;
4245       prepare_cmp_insn (x, y, comparison, NULL_RTX, unsignedp, methods,
4246                         ptest, pmode);
4247     }
4248   else
4249     prepare_float_lib_cmp (x, y, comparison, ptest, pmode);
4250
4251   return;
4252
4253  fail:
4254   *ptest = NULL_RTX;
4255 }
4256
4257 /* Before emitting an insn with code ICODE, make sure that X, which is going
4258    to be used for operand OPNUM of the insn, is converted from mode MODE to
4259    WIDER_MODE (UNSIGNEDP determines whether it is an unsigned conversion), and
4260    that it is accepted by the operand predicate.  Return the new value.  */
4261
4262 rtx
4263 prepare_operand (enum insn_code icode, rtx x, int opnum, enum machine_mode mode,
4264                  enum machine_mode wider_mode, int unsignedp)
4265 {
4266   if (mode != wider_mode)
4267     x = convert_modes (wider_mode, mode, x, unsignedp);
4268
4269   if (!insn_operand_matches (icode, opnum, x))
4270     {
4271       if (reload_completed)
4272         return NULL_RTX;
4273       x = copy_to_mode_reg (insn_data[(int) icode].operand[opnum].mode, x);
4274     }
4275
4276   return x;
4277 }
4278
4279 /* Subroutine of emit_cmp_and_jump_insns; this function is called when we know
4280    we can do the branch.  */
4281
4282 static void
4283 emit_cmp_and_jump_insn_1 (rtx test, enum machine_mode mode, rtx label, int prob)
4284 {
4285   enum machine_mode optab_mode;
4286   enum mode_class mclass;
4287   enum insn_code icode;
4288   rtx insn;
4289
4290   mclass = GET_MODE_CLASS (mode);
4291   optab_mode = (mclass == MODE_CC) ? CCmode : mode;
4292   icode = optab_handler (cbranch_optab, optab_mode);
4293
4294   gcc_assert (icode != CODE_FOR_nothing);
4295   gcc_assert (insn_operand_matches (icode, 0, test));
4296   insn = emit_jump_insn (GEN_FCN (icode) (test, XEXP (test, 0),
4297                                           XEXP (test, 1), label));
4298   if (prob != -1
4299       && profile_status_for_fn (cfun) != PROFILE_ABSENT
4300       && insn
4301       && JUMP_P (insn)
4302       && any_condjump_p (insn)
4303       && !find_reg_note (insn, REG_BR_PROB, 0))
4304     add_int_reg_note (insn, REG_BR_PROB, prob);
4305 }
4306
4307 /* Generate code to compare X with Y so that the condition codes are
4308    set and to jump to LABEL if the condition is true.  If X is a
4309    constant and Y is not a constant, then the comparison is swapped to
4310    ensure that the comparison RTL has the canonical form.
4311
4312    UNSIGNEDP nonzero says that X and Y are unsigned; this matters if they
4313    need to be widened.  UNSIGNEDP is also used to select the proper
4314    branch condition code.
4315
4316    If X and Y have mode BLKmode, then SIZE specifies the size of both X and Y.
4317
4318    MODE is the mode of the inputs (in case they are const_int).
4319
4320    COMPARISON is the rtl operator to compare with (EQ, NE, GT, etc.).
4321    It will be potentially converted into an unsigned variant based on
4322    UNSIGNEDP to select a proper jump instruction.
4323
4324    PROB is the probability of jumping to LABEL.  */
4325
4326 void
4327 emit_cmp_and_jump_insns (rtx x, rtx y, enum rtx_code comparison, rtx size,
4328                          enum machine_mode mode, int unsignedp, rtx label,
4329                          int prob)
4330 {
4331   rtx op0 = x, op1 = y;
4332   rtx test;
4333
4334   /* Swap operands and condition to ensure canonical RTL.  */
4335   if (swap_commutative_operands_p (x, y)
4336       && can_compare_p (swap_condition (comparison), mode, ccp_jump))
4337     {
4338       op0 = y, op1 = x;
4339       comparison = swap_condition (comparison);
4340     }
4341
4342   /* If OP0 is still a constant, then both X and Y must be constants
4343      or the opposite comparison is not supported.  Force X into a register
4344      to create canonical RTL.  */
4345   if (CONSTANT_P (op0))
4346     op0 = force_reg (mode, op0);
4347
4348   if (unsignedp)
4349     comparison = unsigned_condition (comparison);
4350
4351   prepare_cmp_insn (op0, op1, comparison, size, unsignedp, OPTAB_LIB_WIDEN,
4352                     &test, &mode);
4353   emit_cmp_and_jump_insn_1 (test, mode, label, prob);
4354 }
4355
4356 \f
4357 /* Emit a library call comparison between floating point X and Y.
4358    COMPARISON is the rtl operator to compare with (EQ, NE, GT, etc.).  */
4359
4360 static void
4361 prepare_float_lib_cmp (rtx x, rtx y, enum rtx_code comparison,
4362                        rtx *ptest, enum machine_mode *pmode)
4363 {
4364   enum rtx_code swapped = swap_condition (comparison);
4365   enum rtx_code reversed = reverse_condition_maybe_unordered (comparison);
4366   enum machine_mode orig_mode = GET_MODE (x);
4367   enum machine_mode mode, cmp_mode;
4368   rtx true_rtx, false_rtx;
4369   rtx value, target, insns, equiv;
4370   rtx libfunc = 0;
4371   bool reversed_p = false;
4372   cmp_mode = targetm.libgcc_cmp_return_mode ();
4373
4374   for (mode = orig_mode;
4375        mode != VOIDmode;
4376        mode = GET_MODE_WIDER_MODE (mode))
4377     {
4378       if (code_to_optab (comparison)
4379           && (libfunc = optab_libfunc (code_to_optab (comparison), mode)))
4380         break;
4381
4382       if (code_to_optab (swapped)
4383           && (libfunc = optab_libfunc (code_to_optab (swapped), mode)))
4384         {
4385           rtx tmp;
4386           tmp = x; x = y; y = tmp;
4387           comparison = swapped;
4388           break;
4389         }
4390
4391       if (code_to_optab (reversed)
4392           && (libfunc = optab_libfunc (code_to_optab (reversed), mode)))
4393         {
4394           comparison = reversed;
4395           reversed_p = true;
4396           break;
4397         }
4398     }
4399
4400   gcc_assert (mode != VOIDmode);
4401
4402   if (mode != orig_mode)
4403     {
4404       x = convert_to_mode (mode, x, 0);
4405       y = convert_to_mode (mode, y, 0);
4406     }
4407
4408   /* Attach a REG_EQUAL note describing the semantics of the libcall to
4409      the RTL.  The allows the RTL optimizers to delete the libcall if the
4410      condition can be determined at compile-time.  */
4411   if (comparison == UNORDERED
4412       || FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison))
4413     {
4414       true_rtx = const_true_rtx;
4415       false_rtx = const0_rtx;
4416     }
4417   else
4418     {
4419       switch (comparison)
4420         {
4421         case EQ:
4422           true_rtx = const0_rtx;
4423           false_rtx = const_true_rtx;
4424           break;
4425
4426         case NE:
4427           true_rtx = const_true_rtx;
4428           false_rtx = const0_rtx;
4429           break;
4430
4431         case GT:
4432           true_rtx = const1_rtx;
4433           false_rtx = const0_rtx;
4434           break;
4435
4436         case GE:
4437           true_rtx = const0_rtx;
4438           false_rtx = constm1_rtx;
4439           break;
4440
4441         case LT:
4442           true_rtx = constm1_rtx;
4443           false_rtx = const0_rtx;
4444           break;
4445
4446         case LE:
4447           true_rtx = const0_rtx;
4448           false_rtx = const1_rtx;
4449           break;
4450
4451         default:
4452           gcc_unreachable ();
4453         }
4454     }
4455
4456   if (comparison == UNORDERED)
4457     {
4458       rtx temp = simplify_gen_relational (NE, cmp_mode, mode, x, x);
4459       equiv = simplify_gen_relational (NE, cmp_mode, mode, y, y);
4460       equiv = simplify_gen_ternary (IF_THEN_ELSE, cmp_mode, cmp_mode,
4461                                     temp, const_true_rtx, equiv);
4462     }
4463   else
4464     {
4465       equiv = simplify_gen_relational (comparison, cmp_mode, mode, x, y);
4466       if (! FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison))
4467         equiv = simplify_gen_ternary (IF_THEN_ELSE, cmp_mode, cmp_mode,
4468                                       equiv, true_rtx, false_rtx);
4469     }
4470
4471   start_sequence ();
4472   value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
4473                                    cmp_mode, 2, x, mode, y, mode);
4474   insns = get_insns ();
4475   end_sequence ();
4476
4477   target = gen_reg_rtx (cmp_mode);
4478   emit_libcall_block (insns, target, value, equiv);
4479
4480   if (comparison == UNORDERED
4481       || FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison)
4482       || reversed_p)
4483     *ptest = gen_rtx_fmt_ee (reversed_p ? EQ : NE, VOIDmode, target, false_rtx);
4484   else
4485     *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, target, const0_rtx);
4486
4487   *pmode = cmp_mode;
4488 }
4489 \f
4490 /* Generate code to indirectly jump to a location given in the rtx LOC.  */
4491
4492 void
4493 emit_indirect_jump (rtx loc)
4494 {
4495   struct expand_operand ops[1];
4496
4497   create_address_operand (&ops[0], loc);
4498   expand_jump_insn (CODE_FOR_indirect_jump, 1, ops);
4499   emit_barrier ();
4500 }
4501 \f
4502 #ifdef HAVE_conditional_move
4503
4504 /* Emit a conditional move instruction if the machine supports one for that
4505    condition and machine mode.
4506
4507    OP0 and OP1 are the operands that should be compared using CODE.  CMODE is
4508    the mode to use should they be constants.  If it is VOIDmode, they cannot
4509    both be constants.
4510
4511    OP2 should be stored in TARGET if the comparison is true, otherwise OP3
4512    should be stored there.  MODE is the mode to use should they be constants.
4513    If it is VOIDmode, they cannot both be constants.
4514
4515    The result is either TARGET (perhaps modified) or NULL_RTX if the operation
4516    is not supported.  */
4517
4518 rtx
4519 emit_conditional_move (rtx target, enum rtx_code code, rtx op0, rtx op1,
4520                        enum machine_mode cmode, rtx op2, rtx op3,
4521                        enum machine_mode mode, int unsignedp)
4522 {
4523   rtx tem, comparison, last;
4524   enum insn_code icode;
4525   enum rtx_code reversed;
4526
4527   /* If one operand is constant, make it the second one.  Only do this
4528      if the other operand is not constant as well.  */
4529
4530   if (swap_commutative_operands_p (op0, op1))
4531     {
4532       tem = op0;
4533       op0 = op1;
4534       op1 = tem;
4535       code = swap_condition (code);
4536     }
4537
4538   /* get_condition will prefer to generate LT and GT even if the old
4539      comparison was against zero, so undo that canonicalization here since
4540      comparisons against zero are cheaper.  */
4541   if (code == LT && op1 == const1_rtx)
4542     code = LE, op1 = const0_rtx;
4543   else if (code == GT && op1 == constm1_rtx)
4544     code = GE, op1 = const0_rtx;
4545
4546   if (cmode == VOIDmode)
4547     cmode = GET_MODE (op0);
4548
4549   if (swap_commutative_operands_p (op2, op3)
4550       && ((reversed = reversed_comparison_code_parts (code, op0, op1, NULL))
4551           != UNKNOWN))
4552     {
4553       tem = op2;
4554       op2 = op3;
4555       op3 = tem;
4556       code = reversed;
4557     }
4558
4559   if (mode == VOIDmode)
4560     mode = GET_MODE (op2);
4561
4562   icode = direct_optab_handler (movcc_optab, mode);
4563
4564   if (icode == CODE_FOR_nothing)
4565     return 0;
4566
4567   if (!target)
4568     target = gen_reg_rtx (mode);
4569
4570   code = unsignedp ? unsigned_condition (code) : code;
4571   comparison = simplify_gen_relational (code, VOIDmode, cmode, op0, op1);
4572
4573   /* We can get const0_rtx or const_true_rtx in some circumstances.  Just
4574      return NULL and let the caller figure out how best to deal with this
4575      situation.  */
4576   if (!COMPARISON_P (comparison))
4577     return NULL_RTX;
4578
4579   saved_pending_stack_adjust save;
4580   save_pending_stack_adjust (&save);
4581   last = get_last_insn ();
4582   do_pending_stack_adjust ();
4583   prepare_cmp_insn (XEXP (comparison, 0), XEXP (comparison, 1),
4584                     GET_CODE (comparison), NULL_RTX, unsignedp, OPTAB_WIDEN,
4585                     &comparison, &cmode);
4586   if (comparison)
4587     {
4588       struct expand_operand ops[4];
4589
4590       create_output_operand (&ops[0], target, mode);
4591       create_fixed_operand (&ops[1], comparison);
4592       create_input_operand (&ops[2], op2, mode);
4593       create_input_operand (&ops[3], op3, mode);
4594       if (maybe_expand_insn (icode, 4, ops))
4595         {
4596           if (ops[0].value != target)
4597             convert_move (target, ops[0].value, false);
4598           return target;
4599         }
4600     }
4601   delete_insns_since (last);
4602   restore_pending_stack_adjust (&save);
4603   return NULL_RTX;
4604 }
4605
4606 /* Return nonzero if a conditional move of mode MODE is supported.
4607
4608    This function is for combine so it can tell whether an insn that looks
4609    like a conditional move is actually supported by the hardware.  If we
4610    guess wrong we lose a bit on optimization, but that's it.  */
4611 /* ??? sparc64 supports conditionally moving integers values based on fp
4612    comparisons, and vice versa.  How do we handle them?  */
4613
4614 int
4615 can_conditionally_move_p (enum machine_mode mode)
4616 {
4617   if (direct_optab_handler (movcc_optab, mode) != CODE_FOR_nothing)
4618     return 1;
4619
4620   return 0;
4621 }
4622
4623 #endif /* HAVE_conditional_move */
4624
4625 /* Emit a conditional addition instruction if the machine supports one for that
4626    condition and machine mode.
4627
4628    OP0 and OP1 are the operands that should be compared using CODE.  CMODE is
4629    the mode to use should they be constants.  If it is VOIDmode, they cannot
4630    both be constants.
4631
4632    OP2 should be stored in TARGET if the comparison is false, otherwise OP2+OP3
4633    should be stored there.  MODE is the mode to use should they be constants.
4634    If it is VOIDmode, they cannot both be constants.
4635
4636    The result is either TARGET (perhaps modified) or NULL_RTX if the operation
4637    is not supported.  */
4638
4639 rtx
4640 emit_conditional_add (rtx target, enum rtx_code code, rtx op0, rtx op1,
4641                       enum machine_mode cmode, rtx op2, rtx op3,
4642                       enum machine_mode mode, int unsignedp)
4643 {
4644   rtx tem, comparison, last;
4645   enum insn_code icode;
4646
4647   /* If one operand is constant, make it the second one.  Only do this
4648      if the other operand is not constant as well.  */
4649
4650   if (swap_commutative_operands_p (op0, op1))
4651     {
4652       tem = op0;
4653       op0 = op1;
4654       op1 = tem;
4655       code = swap_condition (code);
4656     }
4657
4658   /* get_condition will prefer to generate LT and GT even if the old
4659      comparison was against zero, so undo that canonicalization here since
4660      comparisons against zero are cheaper.  */
4661   if (code == LT && op1 == const1_rtx)
4662     code = LE, op1 = const0_rtx;
4663   else if (code == GT && op1 == constm1_rtx)
4664     code = GE, op1 = const0_rtx;
4665
4666   if (cmode == VOIDmode)
4667     cmode = GET_MODE (op0);
4668
4669   if (mode == VOIDmode)
4670     mode = GET_MODE (op2);
4671
4672   icode = optab_handler (addcc_optab, mode);
4673
4674   if (icode == CODE_FOR_nothing)
4675     return 0;
4676
4677   if (!target)
4678     target = gen_reg_rtx (mode);
4679
4680   code = unsignedp ? unsigned_condition (code) : code;
4681   comparison = simplify_gen_relational (code, VOIDmode, cmode, op0, op1);
4682
4683   /* We can get const0_rtx or const_true_rtx in some circumstances.  Just
4684      return NULL and let the caller figure out how best to deal with this
4685      situation.  */
4686   if (!COMPARISON_P (comparison))
4687     return NULL_RTX;
4688
4689   do_pending_stack_adjust ();
4690   last = get_last_insn ();
4691   prepare_cmp_insn (XEXP (comparison, 0), XEXP (comparison, 1),
4692                     GET_CODE (comparison), NULL_RTX, unsignedp, OPTAB_WIDEN,
4693                     &comparison, &cmode);
4694   if (comparison)
4695     {
4696       struct expand_operand ops[4];
4697
4698       create_output_operand (&ops[0], target, mode);
4699       create_fixed_operand (&ops[1], comparison);
4700       create_input_operand (&ops[2], op2, mode);
4701       create_input_operand (&ops[3], op3, mode);
4702       if (maybe_expand_insn (icode, 4, ops))
4703         {
4704           if (ops[0].value != target)
4705             convert_move (target, ops[0].value, false);
4706           return target;
4707         }
4708     }
4709   delete_insns_since (last);
4710   return NULL_RTX;
4711 }
4712 \f
4713 /* These functions attempt to generate an insn body, rather than
4714    emitting the insn, but if the gen function already emits them, we
4715    make no attempt to turn them back into naked patterns.  */
4716
4717 /* Generate and return an insn body to add Y to X.  */
4718
4719 rtx
4720 gen_add2_insn (rtx x, rtx y)
4721 {
4722   enum insn_code icode = optab_handler (add_optab, GET_MODE (x));
4723
4724   gcc_assert (insn_operand_matches (icode, 0, x));
4725   gcc_assert (insn_operand_matches (icode, 1, x));
4726   gcc_assert (insn_operand_matches (icode, 2, y));
4727
4728   return GEN_FCN (icode) (x, x, y);
4729 }
4730
4731 /* Generate and return an insn body to add r1 and c,
4732    storing the result in r0.  */
4733
4734 rtx
4735 gen_add3_insn (rtx r0, rtx r1, rtx c)
4736 {
4737   enum insn_code icode = optab_handler (add_optab, GET_MODE (r0));
4738
4739   if (icode == CODE_FOR_nothing
4740       || !insn_operand_matches (icode, 0, r0)
4741       || !insn_operand_matches (icode, 1, r1)
4742       || !insn_operand_matches (icode, 2, c))
4743     return NULL_RTX;
4744
4745   return GEN_FCN (icode) (r0, r1, c);
4746 }
4747
4748 int
4749 have_add2_insn (rtx x, rtx y)
4750 {
4751   enum insn_code icode;
4752
4753   gcc_assert (GET_MODE (x) != VOIDmode);
4754
4755   icode = optab_handler (add_optab, GET_MODE (x));
4756
4757   if (icode == CODE_FOR_nothing)
4758     return 0;
4759
4760   if (!insn_operand_matches (icode, 0, x)
4761       || !insn_operand_matches (icode, 1, x)
4762       || !insn_operand_matches (icode, 2, y))
4763     return 0;
4764
4765   return 1;
4766 }
4767
4768 /* Generate and return an insn body to add Y to X.  */
4769
4770 rtx
4771 gen_addptr3_insn (rtx x, rtx y, rtx z)
4772 {
4773   enum insn_code icode = optab_handler (addptr3_optab, GET_MODE (x));
4774
4775   gcc_assert (insn_operand_matches (icode, 0, x));
4776   gcc_assert (insn_operand_matches (icode, 1, y));
4777   gcc_assert (insn_operand_matches (icode, 2, z));
4778
4779   return GEN_FCN (icode) (x, y, z);
4780 }
4781
4782 /* Return true if the target implements an addptr pattern and X, Y,
4783    and Z are valid for the pattern predicates.  */
4784
4785 int
4786 have_addptr3_insn (rtx x, rtx y, rtx z)
4787 {
4788   enum insn_code icode;
4789
4790   gcc_assert (GET_MODE (x) != VOIDmode);
4791
4792   icode = optab_handler (addptr3_optab, GET_MODE (x));
4793
4794   if (icode == CODE_FOR_nothing)
4795     return 0;
4796
4797   if (!insn_operand_matches (icode, 0, x)
4798       || !insn_operand_matches (icode, 1, y)
4799       || !insn_operand_matches (icode, 2, z))
4800     return 0;
4801
4802   return 1;
4803 }
4804
4805 /* Generate and return an insn body to subtract Y from X.  */
4806
4807 rtx
4808 gen_sub2_insn (rtx x, rtx y)
4809 {
4810   enum insn_code icode = optab_handler (sub_optab, GET_MODE (x));
4811
4812   gcc_assert (insn_operand_matches (icode, 0, x));
4813   gcc_assert (insn_operand_matches (icode, 1, x));
4814   gcc_assert (insn_operand_matches (icode, 2, y));
4815
4816   return GEN_FCN (icode) (x, x, y);
4817 }
4818
4819 /* Generate and return an insn body to subtract r1 and c,
4820    storing the result in r0.  */
4821
4822 rtx
4823 gen_sub3_insn (rtx r0, rtx r1, rtx c)
4824 {
4825   enum insn_code icode = optab_handler (sub_optab, GET_MODE (r0));
4826
4827   if (icode == CODE_FOR_nothing
4828       || !insn_operand_matches (icode, 0, r0)
4829       || !insn_operand_matches (icode, 1, r1)
4830       || !insn_operand_matches (icode, 2, c))
4831     return NULL_RTX;
4832
4833   return GEN_FCN (icode) (r0, r1, c);
4834 }
4835
4836 int
4837 have_sub2_insn (rtx x, rtx y)
4838 {
4839   enum insn_code icode;
4840
4841   gcc_assert (GET_MODE (x) != VOIDmode);
4842
4843   icode = optab_handler (sub_optab, GET_MODE (x));
4844
4845   if (icode == CODE_FOR_nothing)
4846     return 0;
4847
4848   if (!insn_operand_matches (icode, 0, x)
4849       || !insn_operand_matches (icode, 1, x)
4850       || !insn_operand_matches (icode, 2, y))
4851     return 0;
4852
4853   return 1;
4854 }
4855
4856 /* Generate the body of an instruction to copy Y into X.
4857    It may be a list of insns, if one insn isn't enough.  */
4858
4859 rtx
4860 gen_move_insn (rtx x, rtx y)
4861 {
4862   rtx seq;
4863
4864   start_sequence ();
4865   emit_move_insn_1 (x, y);
4866   seq = get_insns ();
4867   end_sequence ();
4868   return seq;
4869 }
4870 \f
4871 /* Return the insn code used to extend FROM_MODE to TO_MODE.
4872    UNSIGNEDP specifies zero-extension instead of sign-extension.  If
4873    no such operation exists, CODE_FOR_nothing will be returned.  */
4874
4875 enum insn_code
4876 can_extend_p (enum machine_mode to_mode, enum machine_mode from_mode,
4877               int unsignedp)
4878 {
4879   convert_optab tab;
4880 #ifdef HAVE_ptr_extend
4881   if (unsignedp < 0)
4882     return CODE_FOR_ptr_extend;
4883 #endif
4884
4885   tab = unsignedp ? zext_optab : sext_optab;
4886   return convert_optab_handler (tab, to_mode, from_mode);
4887 }
4888
4889 /* Generate the body of an insn to extend Y (with mode MFROM)
4890    into X (with mode MTO).  Do zero-extension if UNSIGNEDP is nonzero.  */
4891
4892 rtx
4893 gen_extend_insn (rtx x, rtx y, enum machine_mode mto,
4894                  enum machine_mode mfrom, int unsignedp)
4895 {
4896   enum insn_code icode = can_extend_p (mto, mfrom, unsignedp);
4897   return GEN_FCN (icode) (x, y);
4898 }
4899 \f
4900 /* can_fix_p and can_float_p say whether the target machine
4901    can directly convert a given fixed point type to
4902    a given floating point type, or vice versa.
4903    The returned value is the CODE_FOR_... value to use,
4904    or CODE_FOR_nothing if these modes cannot be directly converted.
4905
4906    *TRUNCP_PTR is set to 1 if it is necessary to output
4907    an explicit FTRUNC insn before the fix insn; otherwise 0.  */
4908
4909 static enum insn_code
4910 can_fix_p (enum machine_mode fixmode, enum machine_mode fltmode,
4911            int unsignedp, int *truncp_ptr)
4912 {
4913   convert_optab tab;
4914   enum insn_code icode;
4915
4916   tab = unsignedp ? ufixtrunc_optab : sfixtrunc_optab;
4917   icode = convert_optab_handler (tab, fixmode, fltmode);
4918   if (icode != CODE_FOR_nothing)
4919     {
4920       *truncp_ptr = 0;
4921       return icode;
4922     }
4923
4924   /* FIXME: This requires a port to define both FIX and FTRUNC pattern
4925      for this to work. We need to rework the fix* and ftrunc* patterns
4926      and documentation.  */
4927   tab = unsignedp ? ufix_optab : sfix_optab;
4928   icode = convert_optab_handler (tab, fixmode, fltmode);
4929   if (icode != CODE_FOR_nothing
4930       && optab_handler (ftrunc_optab, fltmode) != CODE_FOR_nothing)
4931     {
4932       *truncp_ptr = 1;
4933       return icode;
4934     }
4935
4936   *truncp_ptr = 0;
4937   return CODE_FOR_nothing;
4938 }
4939
4940 enum insn_code
4941 can_float_p (enum machine_mode fltmode, enum machine_mode fixmode,
4942              int unsignedp)
4943 {
4944   convert_optab tab;
4945
4946   tab = unsignedp ? ufloat_optab : sfloat_optab;
4947   return convert_optab_handler (tab, fltmode, fixmode);
4948 }
4949
4950 /* Function supportable_convert_operation
4951
4952    Check whether an operation represented by the code CODE is a
4953    convert operation that is supported by the target platform in
4954    vector form (i.e., when operating on arguments of type VECTYPE_IN
4955    producing a result of type VECTYPE_OUT).
4956
4957    Convert operations we currently support directly are FIX_TRUNC and FLOAT.
4958    This function checks if these operations are supported
4959    by the target platform either directly (via vector tree-codes), or via
4960    target builtins.
4961
4962    Output:
4963    - CODE1 is code of vector operation to be used when
4964    vectorizing the operation, if available.
4965    - DECL is decl of target builtin functions to be used
4966    when vectorizing the operation, if available.  In this case,
4967    CODE1 is CALL_EXPR.  */
4968
4969 bool
4970 supportable_convert_operation (enum tree_code code,
4971                                     tree vectype_out, tree vectype_in,
4972                                     tree *decl, enum tree_code *code1)
4973 {
4974   enum machine_mode m1,m2;
4975   int truncp;
4976
4977   m1 = TYPE_MODE (vectype_out);
4978   m2 = TYPE_MODE (vectype_in);
4979
4980   /* First check if we can done conversion directly.  */
4981   if ((code == FIX_TRUNC_EXPR
4982        && can_fix_p (m1,m2,TYPE_UNSIGNED (vectype_out), &truncp)
4983           != CODE_FOR_nothing)
4984       || (code == FLOAT_EXPR
4985           && can_float_p (m1,m2,TYPE_UNSIGNED (vectype_in))
4986              != CODE_FOR_nothing))
4987     {
4988       *code1 = code;
4989       return true;
4990     }
4991
4992   /* Now check for builtin.  */
4993   if (targetm.vectorize.builtin_conversion
4994       && targetm.vectorize.builtin_conversion (code, vectype_out, vectype_in))
4995     {
4996       *code1 = CALL_EXPR;
4997       *decl = targetm.vectorize.builtin_conversion (code, vectype_out, vectype_in);
4998       return true;
4999     }
5000   return false;
5001 }
5002
5003 \f
5004 /* Generate code to convert FROM to floating point
5005    and store in TO.  FROM must be fixed point and not VOIDmode.
5006    UNSIGNEDP nonzero means regard FROM as unsigned.
5007    Normally this is done by correcting the final value
5008    if it is negative.  */
5009
5010 void
5011 expand_float (rtx to, rtx from, int unsignedp)
5012 {
5013   enum insn_code icode;
5014   rtx target = to;
5015   enum machine_mode fmode, imode;
5016   bool can_do_signed = false;
5017
5018   /* Crash now, because we won't be able to decide which mode to use.  */
5019   gcc_assert (GET_MODE (from) != VOIDmode);
5020
5021   /* Look for an insn to do the conversion.  Do it in the specified
5022      modes if possible; otherwise convert either input, output or both to
5023      wider mode.  If the integer mode is wider than the mode of FROM,
5024      we can do the conversion signed even if the input is unsigned.  */
5025
5026   for (fmode = GET_MODE (to); fmode != VOIDmode;
5027        fmode = GET_MODE_WIDER_MODE (fmode))
5028     for (imode = GET_MODE (from); imode != VOIDmode;
5029          imode = GET_MODE_WIDER_MODE (imode))
5030       {
5031         int doing_unsigned = unsignedp;
5032
5033         if (fmode != GET_MODE (to)
5034             && significand_size (fmode) < GET_MODE_PRECISION (GET_MODE (from)))
5035           continue;
5036
5037         icode = can_float_p (fmode, imode, unsignedp);
5038         if (icode == CODE_FOR_nothing && unsignedp)
5039           {
5040             enum insn_code scode = can_float_p (fmode, imode, 0);
5041             if (scode != CODE_FOR_nothing)
5042               can_do_signed = true;
5043             if (imode != GET_MODE (from))
5044               icode = scode, doing_unsigned = 0;
5045           }
5046
5047         if (icode != CODE_FOR_nothing)
5048           {
5049             if (imode != GET_MODE (from))
5050               from = convert_to_mode (imode, from, unsignedp);
5051
5052             if (fmode != GET_MODE (to))
5053               target = gen_reg_rtx (fmode);
5054
5055             emit_unop_insn (icode, target, from,
5056                             doing_unsigned ? UNSIGNED_FLOAT : FLOAT);
5057
5058             if (target != to)
5059               convert_move (to, target, 0);
5060             return;
5061           }
5062       }
5063
5064   /* Unsigned integer, and no way to convert directly.  Convert as signed,
5065      then unconditionally adjust the result.  */
5066   if (unsignedp && can_do_signed)
5067     {
5068       rtx label = gen_label_rtx ();
5069       rtx temp;
5070       REAL_VALUE_TYPE offset;
5071
5072       /* Look for a usable floating mode FMODE wider than the source and at
5073          least as wide as the target.  Using FMODE will avoid rounding woes
5074          with unsigned values greater than the signed maximum value.  */
5075
5076       for (fmode = GET_MODE (to);  fmode != VOIDmode;
5077            fmode = GET_MODE_WIDER_MODE (fmode))
5078         if (GET_MODE_PRECISION (GET_MODE (from)) < GET_MODE_BITSIZE (fmode)
5079             && can_float_p (fmode, GET_MODE (from), 0) != CODE_FOR_nothing)
5080           break;
5081
5082       if (fmode == VOIDmode)
5083         {
5084           /* There is no such mode.  Pretend the target is wide enough.  */
5085           fmode = GET_MODE (to);
5086
5087           /* Avoid double-rounding when TO is narrower than FROM.  */
5088           if ((significand_size (fmode) + 1)
5089               < GET_MODE_PRECISION (GET_MODE (from)))
5090             {
5091               rtx temp1;
5092               rtx neglabel = gen_label_rtx ();
5093
5094               /* Don't use TARGET if it isn't a register, is a hard register,
5095                  or is the wrong mode.  */
5096               if (!REG_P (target)
5097                   || REGNO (target) < FIRST_PSEUDO_REGISTER
5098                   || GET_MODE (target) != fmode)
5099                 target = gen_reg_rtx (fmode);
5100
5101               imode = GET_MODE (from);
5102               do_pending_stack_adjust ();
5103
5104               /* Test whether the sign bit is set.  */
5105               emit_cmp_and_jump_insns (from, const0_rtx, LT, NULL_RTX, imode,
5106                                        0, neglabel);
5107
5108               /* The sign bit is not set.  Convert as signed.  */
5109               expand_float (target, from, 0);
5110               emit_jump_insn (gen_jump (label));
5111               emit_barrier ();
5112
5113               /* The sign bit is set.
5114                  Convert to a usable (positive signed) value by shifting right
5115                  one bit, while remembering if a nonzero bit was shifted
5116                  out; i.e., compute  (from & 1) | (from >> 1).  */
5117
5118               emit_label (neglabel);
5119               temp = expand_binop (imode, and_optab, from, const1_rtx,
5120                                    NULL_RTX, 1, OPTAB_LIB_WIDEN);
5121               temp1 = expand_shift (RSHIFT_EXPR, imode, from, 1, NULL_RTX, 1);
5122               temp = expand_binop (imode, ior_optab, temp, temp1, temp, 1,
5123                                    OPTAB_LIB_WIDEN);
5124               expand_float (target, temp, 0);
5125
5126               /* Multiply by 2 to undo the shift above.  */
5127               temp = expand_binop (fmode, add_optab, target, target,
5128                                    target, 0, OPTAB_LIB_WIDEN);
5129               if (temp != target)
5130                 emit_move_insn (target, temp);
5131
5132               do_pending_stack_adjust ();
5133               emit_label (label);
5134               goto done;
5135             }
5136         }
5137
5138       /* If we are about to do some arithmetic to correct for an
5139          unsigned operand, do it in a pseudo-register.  */
5140
5141       if (GET_MODE (to) != fmode
5142           || !REG_P (to) || REGNO (to) < FIRST_PSEUDO_REGISTER)
5143         target = gen_reg_rtx (fmode);
5144
5145       /* Convert as signed integer to floating.  */
5146       expand_float (target, from, 0);
5147
5148       /* If FROM is negative (and therefore TO is negative),
5149          correct its value by 2**bitwidth.  */
5150
5151       do_pending_stack_adjust ();
5152       emit_cmp_and_jump_insns (from, const0_rtx, GE, NULL_RTX, GET_MODE (from),
5153                                0, label);
5154
5155
5156       real_2expN (&offset, GET_MODE_PRECISION (GET_MODE (from)), fmode);
5157       temp = expand_binop (fmode, add_optab, target,
5158                            CONST_DOUBLE_FROM_REAL_VALUE (offset, fmode),
5159                            target, 0, OPTAB_LIB_WIDEN);
5160       if (temp != target)
5161         emit_move_insn (target, temp);
5162
5163       do_pending_stack_adjust ();
5164       emit_label (label);
5165       goto done;
5166     }
5167
5168   /* No hardware instruction available; call a library routine.  */
5169     {
5170       rtx libfunc;
5171       rtx insns;
5172       rtx value;
5173       convert_optab tab = unsignedp ? ufloat_optab : sfloat_optab;
5174
5175       if (GET_MODE_SIZE (GET_MODE (from)) < GET_MODE_SIZE (SImode))
5176         from = convert_to_mode (SImode, from, unsignedp);
5177
5178       libfunc = convert_optab_libfunc (tab, GET_MODE (to), GET_MODE (from));
5179       gcc_assert (libfunc);
5180
5181       start_sequence ();
5182
5183       value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
5184                                        GET_MODE (to), 1, from,
5185                                        GET_MODE (from));
5186       insns = get_insns ();
5187       end_sequence ();
5188
5189       emit_libcall_block (insns, target, value,
5190                           gen_rtx_fmt_e (unsignedp ? UNSIGNED_FLOAT : FLOAT,
5191                                          GET_MODE (to), from));
5192     }
5193
5194  done:
5195
5196   /* Copy result to requested destination
5197      if we have been computing in a temp location.  */
5198
5199   if (target != to)
5200     {
5201       if (GET_MODE (target) == GET_MODE (to))
5202         emit_move_insn (to, target);
5203       else
5204         convert_move (to, target, 0);
5205     }
5206 }
5207 \f
5208 /* Generate code to convert FROM to fixed point and store in TO.  FROM
5209    must be floating point.  */
5210
5211 void
5212 expand_fix (rtx to, rtx from, int unsignedp)
5213 {
5214   enum insn_code icode;
5215   rtx target = to;
5216   enum machine_mode fmode, imode;
5217   int must_trunc = 0;
5218
5219   /* We first try to find a pair of modes, one real and one integer, at
5220      least as wide as FROM and TO, respectively, in which we can open-code
5221      this conversion.  If the integer mode is wider than the mode of TO,
5222      we can do the conversion either signed or unsigned.  */
5223
5224   for (fmode = GET_MODE (from); fmode != VOIDmode;
5225        fmode = GET_MODE_WIDER_MODE (fmode))
5226     for (imode = GET_MODE (to); imode != VOIDmode;
5227          imode = GET_MODE_WIDER_MODE (imode))
5228       {
5229         int doing_unsigned = unsignedp;
5230
5231         icode = can_fix_p (imode, fmode, unsignedp, &must_trunc);
5232         if (icode == CODE_FOR_nothing && imode != GET_MODE (to) && unsignedp)
5233           icode = can_fix_p (imode, fmode, 0, &must_trunc), doing_unsigned = 0;
5234
5235         if (icode != CODE_FOR_nothing)
5236           {
5237             rtx last = get_last_insn ();
5238             if (fmode != GET_MODE (from))
5239               from = convert_to_mode (fmode, from, 0);
5240
5241             if (must_trunc)
5242               {
5243                 rtx temp = gen_reg_rtx (GET_MODE (from));
5244                 from = expand_unop (GET_MODE (from), ftrunc_optab, from,
5245                                     temp, 0);
5246               }
5247
5248             if (imode != GET_MODE (to))
5249               target = gen_reg_rtx (imode);
5250
5251             if (maybe_emit_unop_insn (icode, target, from,
5252                                       doing_unsigned ? UNSIGNED_FIX : FIX))
5253               {
5254                 if (target != to)
5255                   convert_move (to, target, unsignedp);
5256                 return;
5257               }
5258             delete_insns_since (last);
5259           }
5260       }
5261
5262   /* For an unsigned conversion, there is one more way to do it.
5263      If we have a signed conversion, we generate code that compares
5264      the real value to the largest representable positive number.  If if
5265      is smaller, the conversion is done normally.  Otherwise, subtract
5266      one plus the highest signed number, convert, and add it back.
5267
5268      We only need to check all real modes, since we know we didn't find
5269      anything with a wider integer mode.
5270
5271      This code used to extend FP value into mode wider than the destination.
5272      This is needed for decimal float modes which cannot accurately
5273      represent one plus the highest signed number of the same size, but
5274      not for binary modes.  Consider, for instance conversion from SFmode
5275      into DImode.
5276
5277      The hot path through the code is dealing with inputs smaller than 2^63
5278      and doing just the conversion, so there is no bits to lose.
5279
5280      In the other path we know the value is positive in the range 2^63..2^64-1
5281      inclusive.  (as for other input overflow happens and result is undefined)
5282      So we know that the most important bit set in mantissa corresponds to
5283      2^63.  The subtraction of 2^63 should not generate any rounding as it
5284      simply clears out that bit.  The rest is trivial.  */
5285
5286   if (unsignedp && GET_MODE_PRECISION (GET_MODE (to)) <= HOST_BITS_PER_WIDE_INT)
5287     for (fmode = GET_MODE (from); fmode != VOIDmode;
5288          fmode = GET_MODE_WIDER_MODE (fmode))
5289       if (CODE_FOR_nothing != can_fix_p (GET_MODE (to), fmode, 0, &must_trunc)
5290           && (!DECIMAL_FLOAT_MODE_P (fmode)
5291               || GET_MODE_BITSIZE (fmode) > GET_MODE_PRECISION (GET_MODE (to))))
5292         {
5293           int bitsize;
5294           REAL_VALUE_TYPE offset;
5295           rtx limit, lab1, lab2, insn;
5296
5297           bitsize = GET_MODE_PRECISION (GET_MODE (to));
5298           real_2expN (&offset, bitsize - 1, fmode);
5299           limit = CONST_DOUBLE_FROM_REAL_VALUE (offset, fmode);
5300           lab1 = gen_label_rtx ();
5301           lab2 = gen_label_rtx ();
5302
5303           if (fmode != GET_MODE (from))
5304             from = convert_to_mode (fmode, from, 0);
5305
5306           /* See if we need to do the subtraction.  */
5307           do_pending_stack_adjust ();
5308           emit_cmp_and_jump_insns (from, limit, GE, NULL_RTX, GET_MODE (from),
5309                                    0, lab1);
5310
5311           /* If not, do the signed "fix" and branch around fixup code.  */
5312           expand_fix (to, from, 0);
5313           emit_jump_insn (gen_jump (lab2));
5314           emit_barrier ();
5315
5316           /* Otherwise, subtract 2**(N-1), convert to signed number,
5317              then add 2**(N-1).  Do the addition using XOR since this
5318              will often generate better code.  */
5319           emit_label (lab1);
5320           target = expand_binop (GET_MODE (from), sub_optab, from, limit,
5321                                  NULL_RTX, 0, OPTAB_LIB_WIDEN);
5322           expand_fix (to, target, 0);
5323           target = expand_binop (GET_MODE (to), xor_optab, to,
5324                                  gen_int_mode
5325                                  ((HOST_WIDE_INT) 1 << (bitsize - 1),
5326                                   GET_MODE (to)),
5327                                  to, 1, OPTAB_LIB_WIDEN);
5328
5329           if (target != to)
5330             emit_move_insn (to, target);
5331
5332           emit_label (lab2);
5333
5334           if (optab_handler (mov_optab, GET_MODE (to)) != CODE_FOR_nothing)
5335             {
5336               /* Make a place for a REG_NOTE and add it.  */
5337               insn = emit_move_insn (to, to);
5338               set_dst_reg_note (insn, REG_EQUAL,
5339                                 gen_rtx_fmt_e (UNSIGNED_FIX, GET_MODE (to),
5340                                                copy_rtx (from)),
5341                                 to);
5342             }
5343
5344           return;
5345         }
5346
5347   /* We can't do it with an insn, so use a library call.  But first ensure
5348      that the mode of TO is at least as wide as SImode, since those are the
5349      only library calls we know about.  */
5350
5351   if (GET_MODE_SIZE (GET_MODE (to)) < GET_MODE_SIZE (SImode))
5352     {
5353       target = gen_reg_rtx (SImode);
5354
5355       expand_fix (target, from, unsignedp);
5356     }
5357   else
5358     {
5359       rtx insns;
5360       rtx value;
5361       rtx libfunc;
5362
5363       convert_optab tab = unsignedp ? ufix_optab : sfix_optab;
5364       libfunc = convert_optab_libfunc (tab, GET_MODE (to), GET_MODE (from));
5365       gcc_assert (libfunc);
5366
5367       start_sequence ();
5368
5369       value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
5370                                        GET_MODE (to), 1, from,
5371                                        GET_MODE (from));
5372       insns = get_insns ();
5373       end_sequence ();
5374
5375       emit_libcall_block (insns, target, value,
5376                           gen_rtx_fmt_e (unsignedp ? UNSIGNED_FIX : FIX,
5377                                          GET_MODE (to), from));
5378     }
5379
5380   if (target != to)
5381     {
5382       if (GET_MODE (to) == GET_MODE (target))
5383         emit_move_insn (to, target);
5384       else
5385         convert_move (to, target, 0);
5386     }
5387 }
5388
5389 /* Generate code to convert FROM or TO a fixed-point.
5390    If UINTP is true, either TO or FROM is an unsigned integer.
5391    If SATP is true, we need to saturate the result.  */
5392
5393 void
5394 expand_fixed_convert (rtx to, rtx from, int uintp, int satp)
5395 {
5396   enum machine_mode to_mode = GET_MODE (to);
5397   enum machine_mode from_mode = GET_MODE (from);
5398   convert_optab tab;
5399   enum rtx_code this_code;
5400   enum insn_code code;
5401   rtx insns, value;
5402   rtx libfunc;
5403
5404   if (to_mode == from_mode)
5405     {
5406       emit_move_insn (to, from);
5407       return;
5408     }
5409
5410   if (uintp)
5411     {
5412       tab = satp ? satfractuns_optab : fractuns_optab;
5413       this_code = satp ? UNSIGNED_SAT_FRACT : UNSIGNED_FRACT_CONVERT;
5414     }
5415   else
5416     {
5417       tab = satp ? satfract_optab : fract_optab;
5418       this_code = satp ? SAT_FRACT : FRACT_CONVERT;
5419     }
5420   code = convert_optab_handler (tab, to_mode, from_mode);
5421   if (code != CODE_FOR_nothing)
5422     {
5423       emit_unop_insn (code, to, from, this_code);
5424       return;
5425     }
5426
5427   libfunc = convert_optab_libfunc (tab, to_mode, from_mode);
5428   gcc_assert (libfunc);
5429
5430   start_sequence ();
5431   value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST, to_mode,
5432                                    1, from, from_mode);
5433   insns = get_insns ();
5434   end_sequence ();
5435
5436   emit_libcall_block (insns, to, value,
5437                       gen_rtx_fmt_e (optab_to_code (tab), to_mode, from));
5438 }
5439
5440 /* Generate code to convert FROM to fixed point and store in TO.  FROM
5441    must be floating point, TO must be signed.  Use the conversion optab
5442    TAB to do the conversion.  */
5443
5444 bool
5445 expand_sfix_optab (rtx to, rtx from, convert_optab tab)
5446 {
5447   enum insn_code icode;
5448   rtx target = to;
5449   enum machine_mode fmode, imode;
5450
5451   /* We first try to find a pair of modes, one real and one integer, at
5452      least as wide as FROM and TO, respectively, in which we can open-code
5453      this conversion.  If the integer mode is wider than the mode of TO,
5454      we can do the conversion either signed or unsigned.  */
5455
5456   for (fmode = GET_MODE (from); fmode != VOIDmode;
5457        fmode = GET_MODE_WIDER_MODE (fmode))
5458     for (imode = GET_MODE (to); imode != VOIDmode;
5459          imode = GET_MODE_WIDER_MODE (imode))
5460       {
5461         icode = convert_optab_handler (tab, imode, fmode);
5462         if (icode != CODE_FOR_nothing)
5463           {
5464             rtx last = get_last_insn ();
5465             if (fmode != GET_MODE (from))
5466               from = convert_to_mode (fmode, from, 0);
5467
5468             if (imode != GET_MODE (to))
5469               target = gen_reg_rtx (imode);
5470
5471             if (!maybe_emit_unop_insn (icode, target, from, UNKNOWN))
5472               {
5473                 delete_insns_since (last);
5474                 continue;
5475               }
5476             if (target != to)
5477               convert_move (to, target, 0);
5478             return true;
5479           }
5480       }
5481
5482   return false;
5483 }
5484 \f
5485 /* Report whether we have an instruction to perform the operation
5486    specified by CODE on operands of mode MODE.  */
5487 int
5488 have_insn_for (enum rtx_code code, enum machine_mode mode)
5489 {
5490   return (code_to_optab (code)
5491           && (optab_handler (code_to_optab (code), mode)
5492               != CODE_FOR_nothing));
5493 }
5494
5495 /* Initialize the libfunc fields of an entire group of entries in some
5496    optab.  Each entry is set equal to a string consisting of a leading
5497    pair of underscores followed by a generic operation name followed by
5498    a mode name (downshifted to lowercase) followed by a single character
5499    representing the number of operands for the given operation (which is
5500    usually one of the characters '2', '3', or '4').
5501
5502    OPTABLE is the table in which libfunc fields are to be initialized.
5503    OPNAME is the generic (string) name of the operation.
5504    SUFFIX is the character which specifies the number of operands for
5505      the given generic operation.
5506    MODE is the mode to generate for.
5507 */
5508
5509 static void
5510 gen_libfunc (optab optable, const char *opname, int suffix,
5511              enum machine_mode mode)
5512 {
5513   unsigned opname_len = strlen (opname);
5514   const char *mname = GET_MODE_NAME (mode);
5515   unsigned mname_len = strlen (mname);
5516   int prefix_len = targetm.libfunc_gnu_prefix ? 6 : 2;
5517   int len = prefix_len + opname_len + mname_len + 1 + 1;
5518   char *libfunc_name = XALLOCAVEC (char, len);
5519   char *p;
5520   const char *q;
5521
5522   p = libfunc_name;
5523   *p++ = '_';
5524   *p++ = '_';
5525   if (targetm.libfunc_gnu_prefix)
5526     {
5527       *p++ = 'g';
5528       *p++ = 'n';
5529       *p++ = 'u';
5530       *p++ = '_';
5531     }
5532   for (q = opname; *q; )
5533     *p++ = *q++;
5534   for (q = mname; *q; q++)
5535     *p++ = TOLOWER (*q);
5536   *p++ = suffix;
5537   *p = '\0';
5538
5539   set_optab_libfunc (optable, mode,
5540                      ggc_alloc_string (libfunc_name, p - libfunc_name));
5541 }
5542
5543 /* Like gen_libfunc, but verify that integer operation is involved.  */
5544
5545 void
5546 gen_int_libfunc (optab optable, const char *opname, char suffix,
5547                  enum machine_mode mode)
5548 {
5549   int maxsize = 2 * BITS_PER_WORD;
5550
5551   if (GET_MODE_CLASS (mode) != MODE_INT)
5552     return;
5553   if (maxsize < LONG_LONG_TYPE_SIZE)
5554     maxsize = LONG_LONG_TYPE_SIZE;
5555   if (GET_MODE_CLASS (mode) != MODE_INT
5556       || GET_MODE_BITSIZE (mode) < BITS_PER_WORD
5557       || GET_MODE_BITSIZE (mode) > maxsize)
5558     return;
5559   gen_libfunc (optable, opname, suffix, mode);
5560 }
5561
5562 /* Like gen_libfunc, but verify that FP and set decimal prefix if needed.  */
5563
5564 void
5565 gen_fp_libfunc (optab optable, const char *opname, char suffix,
5566                 enum machine_mode mode)
5567 {
5568   char *dec_opname;
5569
5570   if (GET_MODE_CLASS (mode) == MODE_FLOAT)
5571     gen_libfunc (optable, opname, suffix, mode);
5572   if (DECIMAL_FLOAT_MODE_P (mode))
5573     {
5574       dec_opname = XALLOCAVEC (char, sizeof (DECIMAL_PREFIX) + strlen (opname));
5575       /* For BID support, change the name to have either a bid_ or dpd_ prefix
5576          depending on the low level floating format used.  */
5577       memcpy (dec_opname, DECIMAL_PREFIX, sizeof (DECIMAL_PREFIX) - 1);
5578       strcpy (dec_opname + sizeof (DECIMAL_PREFIX) - 1, opname);
5579       gen_libfunc (optable, dec_opname, suffix, mode);
5580     }
5581 }
5582
5583 /* Like gen_libfunc, but verify that fixed-point operation is involved.  */
5584
5585 void
5586 gen_fixed_libfunc (optab optable, const char *opname, char suffix,
5587                    enum machine_mode mode)
5588 {
5589   if (!ALL_FIXED_POINT_MODE_P (mode))
5590     return;
5591   gen_libfunc (optable, opname, suffix, mode);
5592 }
5593
5594 /* Like gen_libfunc, but verify that signed fixed-point operation is
5595    involved.  */
5596
5597 void
5598 gen_signed_fixed_libfunc (optab optable, const char *opname, char suffix,
5599                           enum machine_mode mode)
5600 {
5601   if (!SIGNED_FIXED_POINT_MODE_P (mode))
5602     return;
5603   gen_libfunc (optable, opname, suffix, mode);
5604 }
5605
5606 /* Like gen_libfunc, but verify that unsigned fixed-point operation is
5607    involved.  */
5608
5609 void
5610 gen_unsigned_fixed_libfunc (optab optable, const char *opname, char suffix,
5611                             enum machine_mode mode)
5612 {
5613   if (!UNSIGNED_FIXED_POINT_MODE_P (mode))
5614     return;
5615   gen_libfunc (optable, opname, suffix, mode);
5616 }
5617
5618 /* Like gen_libfunc, but verify that FP or INT operation is involved.  */
5619
5620 void
5621 gen_int_fp_libfunc (optab optable, const char *name, char suffix,
5622                     enum machine_mode mode)
5623 {
5624   if (DECIMAL_FLOAT_MODE_P (mode) || GET_MODE_CLASS (mode) == MODE_FLOAT)
5625     gen_fp_libfunc (optable, name, suffix, mode);
5626   if (INTEGRAL_MODE_P (mode))
5627     gen_int_libfunc (optable, name, suffix, mode);
5628 }
5629
5630 /* Like gen_libfunc, but verify that FP or INT operation is involved
5631    and add 'v' suffix for integer operation.  */
5632
5633 void
5634 gen_intv_fp_libfunc (optab optable, const char *name, char suffix,
5635                      enum machine_mode mode)
5636 {
5637   if (DECIMAL_FLOAT_MODE_P (mode) || GET_MODE_CLASS (mode) == MODE_FLOAT)
5638     gen_fp_libfunc (optable, name, suffix, mode);
5639   if (GET_MODE_CLASS (mode) == MODE_INT)
5640     {
5641       int len = strlen (name);
5642       char *v_name = XALLOCAVEC (char, len + 2);
5643       strcpy (v_name, name);
5644       v_name[len] = 'v';
5645       v_name[len + 1] = 0;
5646       gen_int_libfunc (optable, v_name, suffix, mode);
5647     }
5648 }
5649
5650 /* Like gen_libfunc, but verify that FP or INT or FIXED operation is
5651    involved.  */
5652
5653 void
5654 gen_int_fp_fixed_libfunc (optab optable, const char *name, char suffix,
5655                           enum machine_mode mode)
5656 {
5657   if (DECIMAL_FLOAT_MODE_P (mode) || GET_MODE_CLASS (mode) == MODE_FLOAT)
5658     gen_fp_libfunc (optable, name, suffix, mode);
5659   if (INTEGRAL_MODE_P (mode))
5660     gen_int_libfunc (optable, name, suffix, mode);
5661   if (ALL_FIXED_POINT_MODE_P (mode))
5662     gen_fixed_libfunc (optable, name, suffix, mode);
5663 }
5664
5665 /* Like gen_libfunc, but verify that FP or INT or signed FIXED operation is
5666    involved.  */
5667
5668 void
5669 gen_int_fp_signed_fixed_libfunc (optab optable, const char *name, char suffix,
5670                                  enum machine_mode mode)
5671 {
5672   if (DECIMAL_FLOAT_MODE_P (mode) || GET_MODE_CLASS (mode) == MODE_FLOAT)
5673     gen_fp_libfunc (optable, name, suffix, mode);
5674   if (INTEGRAL_MODE_P (mode))
5675     gen_int_libfunc (optable, name, suffix, mode);
5676   if (SIGNED_FIXED_POINT_MODE_P (mode))
5677     gen_signed_fixed_libfunc (optable, name, suffix, mode);
5678 }
5679
5680 /* Like gen_libfunc, but verify that INT or FIXED operation is
5681    involved.  */
5682
5683 void
5684 gen_int_fixed_libfunc (optab optable, const char *name, char suffix,
5685                        enum machine_mode mode)
5686 {
5687   if (INTEGRAL_MODE_P (mode))
5688     gen_int_libfunc (optable, name, suffix, mode);
5689   if (ALL_FIXED_POINT_MODE_P (mode))
5690     gen_fixed_libfunc (optable, name, suffix, mode);
5691 }
5692
5693 /* Like gen_libfunc, but verify that INT or signed FIXED operation is
5694    involved.  */
5695
5696 void
5697 gen_int_signed_fixed_libfunc (optab optable, const char *name, char suffix,
5698                               enum machine_mode mode)
5699 {
5700   if (INTEGRAL_MODE_P (mode))
5701     gen_int_libfunc (optable, name, suffix, mode);
5702   if (SIGNED_FIXED_POINT_MODE_P (mode))
5703     gen_signed_fixed_libfunc (optable, name, suffix, mode);
5704 }
5705
5706 /* Like gen_libfunc, but verify that INT or unsigned FIXED operation is
5707    involved.  */
5708
5709 void
5710 gen_int_unsigned_fixed_libfunc (optab optable, const char *name, char suffix,
5711                                 enum machine_mode mode)
5712 {
5713   if (INTEGRAL_MODE_P (mode))
5714     gen_int_libfunc (optable, name, suffix, mode);
5715   if (UNSIGNED_FIXED_POINT_MODE_P (mode))
5716     gen_unsigned_fixed_libfunc (optable, name, suffix, mode);
5717 }
5718
5719 /* Initialize the libfunc fields of an entire group of entries of an
5720    inter-mode-class conversion optab.  The string formation rules are
5721    similar to the ones for init_libfuncs, above, but instead of having
5722    a mode name and an operand count these functions have two mode names
5723    and no operand count.  */
5724
5725 void
5726 gen_interclass_conv_libfunc (convert_optab tab,
5727                              const char *opname,
5728                              enum machine_mode tmode,
5729                              enum machine_mode fmode)
5730 {
5731   size_t opname_len = strlen (opname);
5732   size_t mname_len = 0;
5733
5734   const char *fname, *tname;
5735   const char *q;
5736   int prefix_len = targetm.libfunc_gnu_prefix ? 6 : 2;
5737   char *libfunc_name, *suffix;
5738   char *nondec_name, *dec_name, *nondec_suffix, *dec_suffix;
5739   char *p;
5740
5741   /* If this is a decimal conversion, add the current BID vs. DPD prefix that
5742      depends on which underlying decimal floating point format is used.  */
5743   const size_t dec_len = sizeof (DECIMAL_PREFIX) - 1;
5744
5745   mname_len = strlen (GET_MODE_NAME (tmode)) + strlen (GET_MODE_NAME (fmode));
5746
5747   nondec_name = XALLOCAVEC (char, prefix_len + opname_len + mname_len + 1 + 1);
5748   nondec_name[0] = '_';
5749   nondec_name[1] = '_';
5750   if (targetm.libfunc_gnu_prefix)
5751     {
5752       nondec_name[2] = 'g';
5753       nondec_name[3] = 'n';
5754       nondec_name[4] = 'u';
5755       nondec_name[5] = '_';
5756     }
5757
5758   memcpy (&nondec_name[prefix_len], opname, opname_len);
5759   nondec_suffix = nondec_name + opname_len + prefix_len;
5760
5761   dec_name = XALLOCAVEC (char, 2 + dec_len + opname_len + mname_len + 1 + 1);
5762   dec_name[0] = '_';
5763   dec_name[1] = '_';
5764   memcpy (&dec_name[2], DECIMAL_PREFIX, dec_len);
5765   memcpy (&dec_name[2+dec_len], opname, opname_len);
5766   dec_suffix = dec_name + dec_len + opname_len + 2;
5767
5768   fname = GET_MODE_NAME (fmode);
5769   tname = GET_MODE_NAME (tmode);
5770
5771   if (DECIMAL_FLOAT_MODE_P (fmode) || DECIMAL_FLOAT_MODE_P (tmode))
5772     {
5773       libfunc_name = dec_name;
5774       suffix = dec_suffix;
5775     }
5776   else
5777     {
5778       libfunc_name = nondec_name;
5779       suffix = nondec_suffix;
5780     }
5781
5782   p = suffix;
5783   for (q = fname; *q; p++, q++)
5784     *p = TOLOWER (*q);
5785   for (q = tname; *q; p++, q++)
5786     *p = TOLOWER (*q);
5787
5788   *p = '\0';
5789
5790   set_conv_libfunc (tab, tmode, fmode,
5791                     ggc_alloc_string (libfunc_name, p - libfunc_name));
5792 }
5793
5794 /* Same as gen_interclass_conv_libfunc but verify that we are producing
5795    int->fp conversion.  */
5796
5797 void
5798 gen_int_to_fp_conv_libfunc (convert_optab tab,
5799                             const char *opname,
5800                             enum machine_mode tmode,
5801                             enum machine_mode fmode)
5802 {
5803   if (GET_MODE_CLASS (fmode) != MODE_INT)
5804     return;
5805   if (GET_MODE_CLASS (tmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (tmode))
5806     return;
5807   gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
5808 }
5809
5810 /* ufloat_optab is special by using floatun for FP and floatuns decimal fp
5811    naming scheme.  */
5812
5813 void
5814 gen_ufloat_conv_libfunc (convert_optab tab,
5815                          const char *opname ATTRIBUTE_UNUSED,
5816                          enum machine_mode tmode,
5817                          enum machine_mode fmode)
5818 {
5819   if (DECIMAL_FLOAT_MODE_P (tmode))
5820     gen_int_to_fp_conv_libfunc (tab, "floatuns", tmode, fmode);
5821   else
5822     gen_int_to_fp_conv_libfunc (tab, "floatun", tmode, fmode);
5823 }
5824
5825 /* Same as gen_interclass_conv_libfunc but verify that we are producing
5826    fp->int conversion.  */
5827
5828 void
5829 gen_int_to_fp_nondecimal_conv_libfunc (convert_optab tab,
5830                                        const char *opname,
5831                                        enum machine_mode tmode,
5832                                        enum machine_mode fmode)
5833 {
5834   if (GET_MODE_CLASS (fmode) != MODE_INT)
5835     return;
5836   if (GET_MODE_CLASS (tmode) != MODE_FLOAT)
5837     return;
5838   gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
5839 }
5840
5841 /* Same as gen_interclass_conv_libfunc but verify that we are producing
5842    fp->int conversion with no decimal floating point involved.  */
5843
5844 void
5845 gen_fp_to_int_conv_libfunc (convert_optab tab,
5846                             const char *opname,
5847                             enum machine_mode tmode,
5848                             enum machine_mode fmode)
5849 {
5850   if (GET_MODE_CLASS (fmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (fmode))
5851     return;
5852   if (GET_MODE_CLASS (tmode) != MODE_INT)
5853     return;
5854   gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
5855 }
5856
5857 /* Initialize the libfunc fields of an of an intra-mode-class conversion optab.
5858    The string formation rules are
5859    similar to the ones for init_libfunc, above.  */
5860
5861 void
5862 gen_intraclass_conv_libfunc (convert_optab tab, const char *opname,
5863                              enum machine_mode tmode, enum machine_mode fmode)
5864 {
5865   size_t opname_len = strlen (opname);
5866   size_t mname_len = 0;
5867
5868   const char *fname, *tname;
5869   const char *q;
5870   int prefix_len = targetm.libfunc_gnu_prefix ? 6 : 2;
5871   char *nondec_name, *dec_name, *nondec_suffix, *dec_suffix;
5872   char *libfunc_name, *suffix;
5873   char *p;
5874
5875   /* If this is a decimal conversion, add the current BID vs. DPD prefix that
5876      depends on which underlying decimal floating point format is used.  */
5877   const size_t dec_len = sizeof (DECIMAL_PREFIX) - 1;
5878
5879   mname_len = strlen (GET_MODE_NAME (tmode)) + strlen (GET_MODE_NAME (fmode));
5880
5881   nondec_name = XALLOCAVEC (char, 2 + opname_len + mname_len + 1 + 1);
5882   nondec_name[0] = '_';
5883   nondec_name[1] = '_';
5884   if (targetm.libfunc_gnu_prefix)
5885     {
5886       nondec_name[2] = 'g';
5887       nondec_name[3] = 'n';
5888       nondec_name[4] = 'u';
5889       nondec_name[5] = '_';
5890     }
5891   memcpy (&nondec_name[prefix_len], opname, opname_len);
5892   nondec_suffix = nondec_name + opname_len + prefix_len;
5893
5894   dec_name = XALLOCAVEC (char, 2 + dec_len + opname_len + mname_len + 1 + 1);
5895   dec_name[0] = '_';
5896   dec_name[1] = '_';
5897   memcpy (&dec_name[2], DECIMAL_PREFIX, dec_len);
5898   memcpy (&dec_name[2 + dec_len], opname, opname_len);
5899   dec_suffix = dec_name + dec_len + opname_len + 2;
5900
5901   fname = GET_MODE_NAME (fmode);
5902   tname = GET_MODE_NAME (tmode);
5903
5904   if (DECIMAL_FLOAT_MODE_P (fmode) || DECIMAL_FLOAT_MODE_P (tmode))
5905     {
5906       libfunc_name = dec_name;
5907       suffix = dec_suffix;
5908     }
5909   else
5910     {
5911       libfunc_name = nondec_name;
5912       suffix = nondec_suffix;
5913     }
5914
5915   p = suffix;
5916   for (q = fname; *q; p++, q++)
5917     *p = TOLOWER (*q);
5918   for (q = tname; *q; p++, q++)
5919     *p = TOLOWER (*q);
5920
5921   *p++ = '2';
5922   *p = '\0';
5923
5924   set_conv_libfunc (tab, tmode, fmode,
5925                     ggc_alloc_string (libfunc_name, p - libfunc_name));
5926 }
5927
5928 /* Pick proper libcall for trunc_optab.  We need to chose if we do
5929    truncation or extension and interclass or intraclass.  */
5930
5931 void
5932 gen_trunc_conv_libfunc (convert_optab tab,
5933                          const char *opname,
5934                          enum machine_mode tmode,
5935                          enum machine_mode fmode)
5936 {
5937   if (GET_MODE_CLASS (tmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (tmode))
5938     return;
5939   if (GET_MODE_CLASS (fmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (fmode))
5940     return;
5941   if (tmode == fmode)
5942     return;
5943
5944   if ((GET_MODE_CLASS (tmode) == MODE_FLOAT && DECIMAL_FLOAT_MODE_P (fmode))
5945       || (GET_MODE_CLASS (fmode) == MODE_FLOAT && DECIMAL_FLOAT_MODE_P (tmode)))
5946      gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
5947
5948   if (GET_MODE_PRECISION (fmode) <= GET_MODE_PRECISION (tmode))
5949     return;
5950
5951   if ((GET_MODE_CLASS (tmode) == MODE_FLOAT
5952        && GET_MODE_CLASS (fmode) == MODE_FLOAT)
5953       || (DECIMAL_FLOAT_MODE_P (fmode) && DECIMAL_FLOAT_MODE_P (tmode)))
5954     gen_intraclass_conv_libfunc (tab, opname, tmode, fmode);
5955 }
5956
5957 /* Pick proper libcall for extend_optab.  We need to chose if we do
5958    truncation or extension and interclass or intraclass.  */
5959
5960 void
5961 gen_extend_conv_libfunc (convert_optab tab,
5962                          const char *opname ATTRIBUTE_UNUSED,
5963                          enum machine_mode tmode,
5964                          enum machine_mode fmode)
5965 {
5966   if (GET_MODE_CLASS (tmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (tmode))
5967     return;
5968   if (GET_MODE_CLASS (fmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (fmode))
5969     return;
5970   if (tmode == fmode)
5971     return;
5972
5973   if ((GET_MODE_CLASS (tmode) == MODE_FLOAT && DECIMAL_FLOAT_MODE_P (fmode))
5974       || (GET_MODE_CLASS (fmode) == MODE_FLOAT && DECIMAL_FLOAT_MODE_P (tmode)))
5975      gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
5976
5977   if (GET_MODE_PRECISION (fmode) > GET_MODE_PRECISION (tmode))
5978     return;
5979
5980   if ((GET_MODE_CLASS (tmode) == MODE_FLOAT
5981        && GET_MODE_CLASS (fmode) == MODE_FLOAT)
5982       || (DECIMAL_FLOAT_MODE_P (fmode) && DECIMAL_FLOAT_MODE_P (tmode)))
5983     gen_intraclass_conv_libfunc (tab, opname, tmode, fmode);
5984 }
5985
5986 /* Pick proper libcall for fract_optab.  We need to chose if we do
5987    interclass or intraclass.  */
5988
5989 void
5990 gen_fract_conv_libfunc (convert_optab tab,
5991                         const char *opname,
5992                         enum machine_mode tmode,
5993                         enum machine_mode fmode)
5994 {
5995   if (tmode == fmode)
5996     return;
5997   if (!(ALL_FIXED_POINT_MODE_P (tmode) || ALL_FIXED_POINT_MODE_P (fmode)))
5998     return;
5999
6000   if (GET_MODE_CLASS (tmode) == GET_MODE_CLASS (fmode))
6001     gen_intraclass_conv_libfunc (tab, opname, tmode, fmode);
6002   else
6003     gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
6004 }
6005
6006 /* Pick proper libcall for fractuns_optab.  */
6007
6008 void
6009 gen_fractuns_conv_libfunc (convert_optab tab,
6010                            const char *opname,
6011                            enum machine_mode tmode,
6012                            enum machine_mode fmode)
6013 {
6014   if (tmode == fmode)
6015     return;
6016   /* One mode must be a fixed-point mode, and the other must be an integer
6017      mode. */
6018   if (!((ALL_FIXED_POINT_MODE_P (tmode) && GET_MODE_CLASS (fmode) == MODE_INT)
6019         || (ALL_FIXED_POINT_MODE_P (fmode)
6020             && GET_MODE_CLASS (tmode) == MODE_INT)))
6021     return;
6022
6023   gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
6024 }
6025
6026 /* Pick proper libcall for satfract_optab.  We need to chose if we do
6027    interclass or intraclass.  */
6028
6029 void
6030 gen_satfract_conv_libfunc (convert_optab tab,
6031                            const char *opname,
6032                            enum machine_mode tmode,
6033                            enum machine_mode fmode)
6034 {
6035   if (tmode == fmode)
6036     return;
6037   /* TMODE must be a fixed-point mode.  */
6038   if (!ALL_FIXED_POINT_MODE_P (tmode))
6039     return;
6040
6041   if (GET_MODE_CLASS (tmode) == GET_MODE_CLASS (fmode))
6042     gen_intraclass_conv_libfunc (tab, opname, tmode, fmode);
6043   else
6044     gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
6045 }
6046
6047 /* Pick proper libcall for satfractuns_optab.  */
6048
6049 void
6050 gen_satfractuns_conv_libfunc (convert_optab tab,
6051                               const char *opname,
6052                               enum machine_mode tmode,
6053                               enum machine_mode fmode)
6054 {
6055   if (tmode == fmode)
6056     return;
6057   /* TMODE must be a fixed-point mode, and FMODE must be an integer mode. */
6058   if (!(ALL_FIXED_POINT_MODE_P (tmode) && GET_MODE_CLASS (fmode) == MODE_INT))
6059     return;
6060
6061   gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
6062 }
6063
6064 /* A table of previously-created libfuncs, hashed by name.  */
6065 static GTY ((param_is (union tree_node))) htab_t libfunc_decls;
6066
6067 /* Hashtable callbacks for libfunc_decls.  */
6068
6069 static hashval_t
6070 libfunc_decl_hash (const void *entry)
6071 {
6072   return IDENTIFIER_HASH_VALUE (DECL_NAME ((const_tree) entry));
6073 }
6074
6075 static int
6076 libfunc_decl_eq (const void *entry1, const void *entry2)
6077 {
6078   return DECL_NAME ((const_tree) entry1) == (const_tree) entry2;
6079 }
6080
6081 /* Build a decl for a libfunc named NAME. */
6082
6083 tree
6084 build_libfunc_function (const char *name)
6085 {
6086   tree decl = build_decl (UNKNOWN_LOCATION, FUNCTION_DECL,
6087                           get_identifier (name),
6088                           build_function_type (integer_type_node, NULL_TREE));
6089   /* ??? We don't have any type information except for this is
6090      a function.  Pretend this is "int foo()".  */
6091   DECL_ARTIFICIAL (decl) = 1;
6092   DECL_EXTERNAL (decl) = 1;
6093   TREE_PUBLIC (decl) = 1;
6094   gcc_assert (DECL_ASSEMBLER_NAME (decl));
6095
6096   /* Zap the nonsensical SYMBOL_REF_DECL for this.  What we're left with
6097      are the flags assigned by targetm.encode_section_info.  */
6098   SET_SYMBOL_REF_DECL (XEXP (DECL_RTL (decl), 0), NULL);
6099
6100   return decl;
6101 }
6102
6103 rtx
6104 init_one_libfunc (const char *name)
6105 {
6106   tree id, decl;
6107   void **slot;
6108   hashval_t hash;
6109
6110   if (libfunc_decls == NULL)
6111     libfunc_decls = htab_create_ggc (37, libfunc_decl_hash,
6112                                      libfunc_decl_eq, NULL);
6113
6114   /* See if we have already created a libfunc decl for this function.  */
6115   id = get_identifier (name);
6116   hash = IDENTIFIER_HASH_VALUE (id);
6117   slot = htab_find_slot_with_hash (libfunc_decls, id, hash, INSERT);
6118   decl = (tree) *slot;
6119   if (decl == NULL)
6120     {
6121       /* Create a new decl, so that it can be passed to
6122          targetm.encode_section_info.  */
6123       decl = build_libfunc_function (name);
6124       *slot = decl;
6125     }
6126   return XEXP (DECL_RTL (decl), 0);
6127 }
6128
6129 /* Adjust the assembler name of libfunc NAME to ASMSPEC.  */
6130
6131 rtx
6132 set_user_assembler_libfunc (const char *name, const char *asmspec)
6133 {
6134   tree id, decl;
6135   void **slot;
6136   hashval_t hash;
6137
6138   id = get_identifier (name);
6139   hash = IDENTIFIER_HASH_VALUE (id);
6140   slot = htab_find_slot_with_hash (libfunc_decls, id, hash, NO_INSERT);
6141   gcc_assert (slot);
6142   decl = (tree) *slot;
6143   set_user_assembler_name (decl, asmspec);
6144   return XEXP (DECL_RTL (decl), 0);
6145 }
6146
6147 /* Call this to reset the function entry for one optab (OPTABLE) in mode
6148    MODE to NAME, which should be either 0 or a string constant.  */
6149 void
6150 set_optab_libfunc (optab op, enum machine_mode mode, const char *name)
6151 {
6152   rtx val;
6153   struct libfunc_entry e;
6154   struct libfunc_entry **slot;
6155
6156   e.op = op;
6157   e.mode1 = mode;
6158   e.mode2 = VOIDmode;
6159
6160   if (name)
6161     val = init_one_libfunc (name);
6162   else
6163     val = 0;
6164   slot = (struct libfunc_entry **) htab_find_slot (libfunc_hash, &e, INSERT);
6165   if (*slot == NULL)
6166     *slot = ggc_alloc_libfunc_entry ();
6167   (*slot)->op = op;
6168   (*slot)->mode1 = mode;
6169   (*slot)->mode2 = VOIDmode;
6170   (*slot)->libfunc = val;
6171 }
6172
6173 /* Call this to reset the function entry for one conversion optab
6174    (OPTABLE) from mode FMODE to mode TMODE to NAME, which should be
6175    either 0 or a string constant.  */
6176 void
6177 set_conv_libfunc (convert_optab optab, enum machine_mode tmode,
6178                   enum machine_mode fmode, const char *name)
6179 {
6180   rtx val;
6181   struct libfunc_entry e;
6182   struct libfunc_entry **slot;
6183
6184   e.op = optab;
6185   e.mode1 = tmode;
6186   e.mode2 = fmode;
6187
6188   if (name)
6189     val = init_one_libfunc (name);
6190   else
6191     val = 0;
6192   slot = (struct libfunc_entry **) htab_find_slot (libfunc_hash, &e, INSERT);
6193   if (*slot == NULL)
6194     *slot = ggc_alloc_libfunc_entry ();
6195   (*slot)->op = optab;
6196   (*slot)->mode1 = tmode;
6197   (*slot)->mode2 = fmode;
6198   (*slot)->libfunc = val;
6199 }
6200
6201 /* Call this to initialize the contents of the optabs
6202    appropriately for the current target machine.  */
6203
6204 void
6205 init_optabs (void)
6206 {
6207   if (libfunc_hash)
6208     htab_empty (libfunc_hash);
6209   else
6210     libfunc_hash = htab_create_ggc (10, hash_libfunc, eq_libfunc, NULL);
6211
6212   /* Fill in the optabs with the insns we support.  */
6213   init_all_optabs (this_fn_optabs);
6214
6215   /* The ffs function operates on `int'.  Fall back on it if we do not
6216      have a libgcc2 function for that width.  */
6217   if (INT_TYPE_SIZE < BITS_PER_WORD)
6218     set_optab_libfunc (ffs_optab, mode_for_size (INT_TYPE_SIZE, MODE_INT, 0),
6219                        "ffs");
6220
6221   /* Explicitly initialize the bswap libfuncs since we need them to be
6222      valid for things other than word_mode.  */
6223   if (targetm.libfunc_gnu_prefix)
6224     {
6225       set_optab_libfunc (bswap_optab, SImode, "__gnu_bswapsi2");
6226       set_optab_libfunc (bswap_optab, DImode, "__gnu_bswapdi2");
6227     }
6228   else
6229     {
6230       set_optab_libfunc (bswap_optab, SImode, "__bswapsi2");
6231       set_optab_libfunc (bswap_optab, DImode, "__bswapdi2");
6232     }
6233
6234   /* Use cabs for double complex abs, since systems generally have cabs.
6235      Don't define any libcall for float complex, so that cabs will be used.  */
6236   if (complex_double_type_node)
6237     set_optab_libfunc (abs_optab, TYPE_MODE (complex_double_type_node),
6238                        "cabs");
6239
6240   abort_libfunc = init_one_libfunc ("abort");
6241   memcpy_libfunc = init_one_libfunc ("memcpy");
6242   memmove_libfunc = init_one_libfunc ("memmove");
6243   memcmp_libfunc = init_one_libfunc ("memcmp");
6244   memset_libfunc = init_one_libfunc ("memset");
6245   setbits_libfunc = init_one_libfunc ("__setbits");
6246
6247 #ifndef DONT_USE_BUILTIN_SETJMP
6248   setjmp_libfunc = init_one_libfunc ("__builtin_setjmp");
6249   longjmp_libfunc = init_one_libfunc ("__builtin_longjmp");
6250 #else
6251   setjmp_libfunc = init_one_libfunc ("setjmp");
6252   longjmp_libfunc = init_one_libfunc ("longjmp");
6253 #endif
6254   unwind_sjlj_register_libfunc = init_one_libfunc ("_Unwind_SjLj_Register");
6255   unwind_sjlj_unregister_libfunc
6256     = init_one_libfunc ("_Unwind_SjLj_Unregister");
6257
6258   /* For function entry/exit instrumentation.  */
6259   profile_function_entry_libfunc
6260     = init_one_libfunc ("__cyg_profile_func_enter");
6261   profile_function_exit_libfunc
6262     = init_one_libfunc ("__cyg_profile_func_exit");
6263
6264   gcov_flush_libfunc = init_one_libfunc ("__gcov_flush");
6265
6266   /* Allow the target to add more libcalls or rename some, etc.  */
6267   targetm.init_libfuncs ();
6268 }
6269
6270 /* Use the current target and options to initialize
6271    TREE_OPTIMIZATION_OPTABS (OPTNODE).  */
6272
6273 void
6274 init_tree_optimization_optabs (tree optnode)
6275 {
6276   /* Quick exit if we have already computed optabs for this target.  */
6277   if (TREE_OPTIMIZATION_BASE_OPTABS (optnode) == this_target_optabs)
6278     return;
6279
6280   /* Forget any previous information and set up for the current target.  */
6281   TREE_OPTIMIZATION_BASE_OPTABS (optnode) = this_target_optabs;
6282   struct target_optabs *tmp_optabs = (struct target_optabs *)
6283     TREE_OPTIMIZATION_OPTABS (optnode);
6284   if (tmp_optabs)
6285     memset (tmp_optabs, 0, sizeof (struct target_optabs));
6286   else
6287     tmp_optabs = (struct target_optabs *)
6288       ggc_alloc_atomic (sizeof (struct target_optabs));
6289
6290   /* Generate a new set of optabs into tmp_optabs.  */
6291   init_all_optabs (tmp_optabs);
6292
6293   /* If the optabs changed, record it.  */
6294   if (memcmp (tmp_optabs, this_target_optabs, sizeof (struct target_optabs)))
6295     TREE_OPTIMIZATION_OPTABS (optnode) = tmp_optabs;
6296   else
6297     {
6298       TREE_OPTIMIZATION_OPTABS (optnode) = NULL;
6299       ggc_free (tmp_optabs);
6300     }
6301 }
6302
6303 /* A helper function for init_sync_libfuncs.  Using the basename BASE,
6304    install libfuncs into TAB for BASE_N for 1 <= N <= MAX.  */
6305
6306 static void
6307 init_sync_libfuncs_1 (optab tab, const char *base, int max)
6308 {
6309   enum machine_mode mode;
6310   char buf[64];
6311   size_t len = strlen (base);
6312   int i;
6313
6314   gcc_assert (max <= 8);
6315   gcc_assert (len + 3 < sizeof (buf));
6316
6317   memcpy (buf, base, len);
6318   buf[len] = '_';
6319   buf[len + 1] = '0';
6320   buf[len + 2] = '\0';
6321
6322   mode = QImode;
6323   for (i = 1; i <= max; i *= 2)
6324     {
6325       buf[len + 1] = '0' + i;
6326       set_optab_libfunc (tab, mode, buf);
6327       mode = GET_MODE_2XWIDER_MODE (mode);
6328     }
6329 }
6330
6331 void
6332 init_sync_libfuncs (int max)
6333 {
6334   if (!flag_sync_libcalls)
6335     return;
6336
6337   init_sync_libfuncs_1 (sync_compare_and_swap_optab,
6338                         "__sync_val_compare_and_swap", max);
6339   init_sync_libfuncs_1 (sync_lock_test_and_set_optab,
6340                         "__sync_lock_test_and_set", max);
6341
6342   init_sync_libfuncs_1 (sync_old_add_optab, "__sync_fetch_and_add", max);
6343   init_sync_libfuncs_1 (sync_old_sub_optab, "__sync_fetch_and_sub", max);
6344   init_sync_libfuncs_1 (sync_old_ior_optab, "__sync_fetch_and_or", max);
6345   init_sync_libfuncs_1 (sync_old_and_optab, "__sync_fetch_and_and", max);
6346   init_sync_libfuncs_1 (sync_old_xor_optab, "__sync_fetch_and_xor", max);
6347   init_sync_libfuncs_1 (sync_old_nand_optab, "__sync_fetch_and_nand", max);
6348
6349   init_sync_libfuncs_1 (sync_new_add_optab, "__sync_add_and_fetch", max);
6350   init_sync_libfuncs_1 (sync_new_sub_optab, "__sync_sub_and_fetch", max);
6351   init_sync_libfuncs_1 (sync_new_ior_optab, "__sync_or_and_fetch", max);
6352   init_sync_libfuncs_1 (sync_new_and_optab, "__sync_and_and_fetch", max);
6353   init_sync_libfuncs_1 (sync_new_xor_optab, "__sync_xor_and_fetch", max);
6354   init_sync_libfuncs_1 (sync_new_nand_optab, "__sync_nand_and_fetch", max);
6355 }
6356
6357 /* Print information about the current contents of the optabs on
6358    STDERR.  */
6359
6360 DEBUG_FUNCTION void
6361 debug_optab_libfuncs (void)
6362 {
6363   int i, j, k;
6364
6365   /* Dump the arithmetic optabs.  */
6366   for (i = FIRST_NORM_OPTAB; i <= LAST_NORMLIB_OPTAB; ++i)
6367     for (j = 0; j < NUM_MACHINE_MODES; ++j)
6368       {
6369         rtx l = optab_libfunc ((optab) i, (enum machine_mode) j);
6370         if (l)
6371           {
6372             gcc_assert (GET_CODE (l) == SYMBOL_REF);
6373             fprintf (stderr, "%s\t%s:\t%s\n",
6374                      GET_RTX_NAME (optab_to_code ((optab) i)),
6375                      GET_MODE_NAME (j),
6376                      XSTR (l, 0));
6377           }
6378       }
6379
6380   /* Dump the conversion optabs.  */
6381   for (i = FIRST_CONV_OPTAB; i <= LAST_CONVLIB_OPTAB; ++i)
6382     for (j = 0; j < NUM_MACHINE_MODES; ++j)
6383       for (k = 0; k < NUM_MACHINE_MODES; ++k)
6384         {
6385           rtx l = convert_optab_libfunc ((optab) i, (enum machine_mode) j,
6386                                          (enum machine_mode) k);
6387           if (l)
6388             {
6389               gcc_assert (GET_CODE (l) == SYMBOL_REF);
6390               fprintf (stderr, "%s\t%s\t%s:\t%s\n",
6391                        GET_RTX_NAME (optab_to_code ((optab) i)),
6392                        GET_MODE_NAME (j),
6393                        GET_MODE_NAME (k),
6394                        XSTR (l, 0));
6395             }
6396         }
6397 }
6398
6399 \f
6400 /* Generate insns to trap with code TCODE if OP1 and OP2 satisfy condition
6401    CODE.  Return 0 on failure.  */
6402
6403 rtx
6404 gen_cond_trap (enum rtx_code code, rtx op1, rtx op2, rtx tcode)
6405 {
6406   enum machine_mode mode = GET_MODE (op1);
6407   enum insn_code icode;
6408   rtx insn;
6409   rtx trap_rtx;
6410
6411   if (mode == VOIDmode)
6412     return 0;
6413
6414   icode = optab_handler (ctrap_optab, mode);
6415   if (icode == CODE_FOR_nothing)
6416     return 0;
6417
6418   /* Some targets only accept a zero trap code.  */
6419   if (!insn_operand_matches (icode, 3, tcode))
6420     return 0;
6421
6422   do_pending_stack_adjust ();
6423   start_sequence ();
6424   prepare_cmp_insn (op1, op2, code, NULL_RTX, false, OPTAB_DIRECT,
6425                     &trap_rtx, &mode);
6426   if (!trap_rtx)
6427     insn = NULL_RTX;
6428   else
6429     insn = GEN_FCN (icode) (trap_rtx, XEXP (trap_rtx, 0), XEXP (trap_rtx, 1),
6430                             tcode);
6431
6432   /* If that failed, then give up.  */
6433   if (insn == 0)
6434     {
6435       end_sequence ();
6436       return 0;
6437     }
6438
6439   emit_insn (insn);
6440   insn = get_insns ();
6441   end_sequence ();
6442   return insn;
6443 }
6444
6445 /* Return rtx code for TCODE. Use UNSIGNEDP to select signed
6446    or unsigned operation code.  */
6447
6448 static enum rtx_code
6449 get_rtx_code (enum tree_code tcode, bool unsignedp)
6450 {
6451   enum rtx_code code;
6452   switch (tcode)
6453     {
6454     case EQ_EXPR:
6455       code = EQ;
6456       break;
6457     case NE_EXPR:
6458       code = NE;
6459       break;
6460     case LT_EXPR:
6461       code = unsignedp ? LTU : LT;
6462       break;
6463     case LE_EXPR:
6464       code = unsignedp ? LEU : LE;
6465       break;
6466     case GT_EXPR:
6467       code = unsignedp ? GTU : GT;
6468       break;
6469     case GE_EXPR:
6470       code = unsignedp ? GEU : GE;
6471       break;
6472
6473     case UNORDERED_EXPR:
6474       code = UNORDERED;
6475       break;
6476     case ORDERED_EXPR:
6477       code = ORDERED;
6478       break;
6479     case UNLT_EXPR:
6480       code = UNLT;
6481       break;
6482     case UNLE_EXPR:
6483       code = UNLE;
6484       break;
6485     case UNGT_EXPR:
6486       code = UNGT;
6487       break;
6488     case UNGE_EXPR:
6489       code = UNGE;
6490       break;
6491     case UNEQ_EXPR:
6492       code = UNEQ;
6493       break;
6494     case LTGT_EXPR:
6495       code = LTGT;
6496       break;
6497
6498     default:
6499       gcc_unreachable ();
6500     }
6501   return code;
6502 }
6503
6504 /* Return comparison rtx for COND. Use UNSIGNEDP to select signed or
6505    unsigned operators. Do not generate compare instruction.  */
6506
6507 static rtx
6508 vector_compare_rtx (enum tree_code tcode, tree t_op0, tree t_op1,
6509                     bool unsignedp, enum insn_code icode)
6510 {
6511   struct expand_operand ops[2];
6512   rtx rtx_op0, rtx_op1;
6513   enum rtx_code rcode = get_rtx_code (tcode, unsignedp);
6514
6515   gcc_assert (TREE_CODE_CLASS (tcode) == tcc_comparison);
6516
6517   /* Expand operands.  */
6518   rtx_op0 = expand_expr (t_op0, NULL_RTX, TYPE_MODE (TREE_TYPE (t_op0)),
6519                          EXPAND_STACK_PARM);
6520   rtx_op1 = expand_expr (t_op1, NULL_RTX, TYPE_MODE (TREE_TYPE (t_op1)),
6521                          EXPAND_STACK_PARM);
6522
6523   create_input_operand (&ops[0], rtx_op0, GET_MODE (rtx_op0));
6524   create_input_operand (&ops[1], rtx_op1, GET_MODE (rtx_op1));
6525   if (!maybe_legitimize_operands (icode, 4, 2, ops))
6526     gcc_unreachable ();
6527   return gen_rtx_fmt_ee (rcode, VOIDmode, ops[0].value, ops[1].value);
6528 }
6529
6530 /* Return true if VEC_PERM_EXPR can be expanded using SIMD extensions
6531    of the CPU.  SEL may be NULL, which stands for an unknown constant.  */
6532
6533 bool
6534 can_vec_perm_p (enum machine_mode mode, bool variable,
6535                 const unsigned char *sel)
6536 {
6537   enum machine_mode qimode;
6538
6539   /* If the target doesn't implement a vector mode for the vector type,
6540      then no operations are supported.  */
6541   if (!VECTOR_MODE_P (mode))
6542     return false;
6543
6544   if (!variable)
6545     {
6546       if (direct_optab_handler (vec_perm_const_optab, mode) != CODE_FOR_nothing
6547           && (sel == NULL
6548               || targetm.vectorize.vec_perm_const_ok == NULL
6549               || targetm.vectorize.vec_perm_const_ok (mode, sel)))
6550         return true;
6551     }
6552
6553   if (direct_optab_handler (vec_perm_optab, mode) != CODE_FOR_nothing)
6554     return true;
6555
6556   /* We allow fallback to a QI vector mode, and adjust the mask.  */
6557   if (GET_MODE_INNER (mode) == QImode)
6558     return false;
6559   qimode = mode_for_vector (QImode, GET_MODE_SIZE (mode));
6560   if (!VECTOR_MODE_P (qimode))
6561     return false;
6562
6563   /* ??? For completeness, we ought to check the QImode version of
6564       vec_perm_const_optab.  But all users of this implicit lowering
6565       feature implement the variable vec_perm_optab.  */
6566   if (direct_optab_handler (vec_perm_optab, qimode) == CODE_FOR_nothing)
6567     return false;
6568
6569   /* In order to support the lowering of variable permutations,
6570      we need to support shifts and adds.  */
6571   if (variable)
6572     {
6573       if (GET_MODE_UNIT_SIZE (mode) > 2
6574           && optab_handler (ashl_optab, mode) == CODE_FOR_nothing
6575           && optab_handler (vashl_optab, mode) == CODE_FOR_nothing)
6576         return false;
6577       if (optab_handler (add_optab, qimode) == CODE_FOR_nothing)
6578         return false;
6579     }
6580
6581   return true;
6582 }
6583
6584 /* A subroutine of expand_vec_perm for expanding one vec_perm insn.  */
6585
6586 static rtx
6587 expand_vec_perm_1 (enum insn_code icode, rtx target,
6588                    rtx v0, rtx v1, rtx sel)
6589 {
6590   enum machine_mode tmode = GET_MODE (target);
6591   enum machine_mode smode = GET_MODE (sel);
6592   struct expand_operand ops[4];
6593
6594   create_output_operand (&ops[0], target, tmode);
6595   create_input_operand (&ops[3], sel, smode);
6596
6597   /* Make an effort to preserve v0 == v1.  The target expander is able to
6598      rely on this to determine if we're permuting a single input operand.  */
6599   if (rtx_equal_p (v0, v1))
6600     {
6601       if (!insn_operand_matches (icode, 1, v0))
6602         v0 = force_reg (tmode, v0);
6603       gcc_checking_assert (insn_operand_matches (icode, 1, v0));
6604       gcc_checking_assert (insn_operand_matches (icode, 2, v0));
6605
6606       create_fixed_operand (&ops[1], v0);
6607       create_fixed_operand (&ops[2], v0);
6608     }
6609   else
6610     {
6611       create_input_operand (&ops[1], v0, tmode);
6612       create_input_operand (&ops[2], v1, tmode);
6613     }
6614
6615   if (maybe_expand_insn (icode, 4, ops))
6616     return ops[0].value;
6617   return NULL_RTX;
6618 }
6619
6620 /* Generate instructions for vec_perm optab given its mode
6621    and three operands.  */
6622
6623 rtx
6624 expand_vec_perm (enum machine_mode mode, rtx v0, rtx v1, rtx sel, rtx target)
6625 {
6626   enum insn_code icode;
6627   enum machine_mode qimode;
6628   unsigned int i, w, e, u;
6629   rtx tmp, sel_qi = NULL;
6630   rtvec vec;
6631
6632   if (!target || GET_MODE (target) != mode)
6633     target = gen_reg_rtx (mode);
6634
6635   w = GET_MODE_SIZE (mode);
6636   e = GET_MODE_NUNITS (mode);
6637   u = GET_MODE_UNIT_SIZE (mode);
6638
6639   /* Set QIMODE to a different vector mode with byte elements.
6640      If no such mode, or if MODE already has byte elements, use VOIDmode.  */
6641   qimode = VOIDmode;
6642   if (GET_MODE_INNER (mode) != QImode)
6643     {
6644       qimode = mode_for_vector (QImode, w);
6645       if (!VECTOR_MODE_P (qimode))
6646         qimode = VOIDmode;
6647     }
6648
6649   /* If the input is a constant, expand it specially.  */
6650   gcc_assert (GET_MODE_CLASS (GET_MODE (sel)) == MODE_VECTOR_INT);
6651   if (GET_CODE (sel) == CONST_VECTOR)
6652     {
6653       icode = direct_optab_handler (vec_perm_const_optab, mode);
6654       if (icode != CODE_FOR_nothing)
6655         {
6656           tmp = expand_vec_perm_1 (icode, target, v0, v1, sel);
6657           if (tmp)
6658             return tmp;
6659         }
6660
6661       /* Fall back to a constant byte-based permutation.  */
6662       if (qimode != VOIDmode)
6663         {
6664           vec = rtvec_alloc (w);
6665           for (i = 0; i < e; ++i)
6666             {
6667               unsigned int j, this_e;
6668
6669               this_e = INTVAL (CONST_VECTOR_ELT (sel, i));
6670               this_e &= 2 * e - 1;
6671               this_e *= u;
6672
6673               for (j = 0; j < u; ++j)
6674                 RTVEC_ELT (vec, i * u + j) = GEN_INT (this_e + j);
6675             }
6676           sel_qi = gen_rtx_CONST_VECTOR (qimode, vec);
6677
6678           icode = direct_optab_handler (vec_perm_const_optab, qimode);
6679           if (icode != CODE_FOR_nothing)
6680             {
6681               tmp = mode != qimode ? gen_reg_rtx (qimode) : target;
6682               tmp = expand_vec_perm_1 (icode, tmp, gen_lowpart (qimode, v0),
6683                                        gen_lowpart (qimode, v1), sel_qi);
6684               if (tmp)
6685                 return gen_lowpart (mode, tmp);
6686             }
6687         }
6688     }
6689
6690   /* Otherwise expand as a fully variable permuation.  */
6691   icode = direct_optab_handler (vec_perm_optab, mode);
6692   if (icode != CODE_FOR_nothing)
6693     {
6694       tmp = expand_vec_perm_1 (icode, target, v0, v1, sel);
6695       if (tmp)
6696         return tmp;
6697     }
6698
6699   /* As a special case to aid several targets, lower the element-based
6700      permutation to a byte-based permutation and try again.  */
6701   if (qimode == VOIDmode)
6702     return NULL_RTX;
6703   icode = direct_optab_handler (vec_perm_optab, qimode);
6704   if (icode == CODE_FOR_nothing)
6705     return NULL_RTX;
6706
6707   if (sel_qi == NULL)
6708     {
6709       /* Multiply each element by its byte size.  */
6710       enum machine_mode selmode = GET_MODE (sel);
6711       if (u == 2)
6712         sel = expand_simple_binop (selmode, PLUS, sel, sel,
6713                                    sel, 0, OPTAB_DIRECT);
6714       else
6715         sel = expand_simple_binop (selmode, ASHIFT, sel,
6716                                    GEN_INT (exact_log2 (u)),
6717                                    sel, 0, OPTAB_DIRECT);
6718       gcc_assert (sel != NULL);
6719
6720       /* Broadcast the low byte each element into each of its bytes.  */
6721       vec = rtvec_alloc (w);
6722       for (i = 0; i < w; ++i)
6723         {
6724           int this_e = i / u * u;
6725           if (BYTES_BIG_ENDIAN)
6726             this_e += u - 1;
6727           RTVEC_ELT (vec, i) = GEN_INT (this_e);
6728         }
6729       tmp = gen_rtx_CONST_VECTOR (qimode, vec);
6730       sel = gen_lowpart (qimode, sel);
6731       sel = expand_vec_perm (qimode, sel, sel, tmp, NULL);
6732       gcc_assert (sel != NULL);
6733
6734       /* Add the byte offset to each byte element.  */
6735       /* Note that the definition of the indicies here is memory ordering,
6736          so there should be no difference between big and little endian.  */
6737       vec = rtvec_alloc (w);
6738       for (i = 0; i < w; ++i)
6739         RTVEC_ELT (vec, i) = GEN_INT (i % u);
6740       tmp = gen_rtx_CONST_VECTOR (qimode, vec);
6741       sel_qi = expand_simple_binop (qimode, PLUS, sel, tmp,
6742                                     sel, 0, OPTAB_DIRECT);
6743       gcc_assert (sel_qi != NULL);
6744     }
6745
6746   tmp = mode != qimode ? gen_reg_rtx (qimode) : target;
6747   tmp = expand_vec_perm_1 (icode, tmp, gen_lowpart (qimode, v0),
6748                            gen_lowpart (qimode, v1), sel_qi);
6749   if (tmp)
6750     tmp = gen_lowpart (mode, tmp);
6751   return tmp;
6752 }
6753
6754 /* Return insn code for a conditional operator with a comparison in
6755    mode CMODE, unsigned if UNS is true, resulting in a value of mode VMODE.  */
6756
6757 static inline enum insn_code
6758 get_vcond_icode (enum machine_mode vmode, enum machine_mode cmode, bool uns)
6759 {
6760   enum insn_code icode = CODE_FOR_nothing;
6761   if (uns)
6762     icode = convert_optab_handler (vcondu_optab, vmode, cmode);
6763   else
6764     icode = convert_optab_handler (vcond_optab, vmode, cmode);
6765   return icode;
6766 }
6767
6768 /* Return TRUE iff, appropriate vector insns are available
6769    for vector cond expr with vector type VALUE_TYPE and a comparison
6770    with operand vector types in CMP_OP_TYPE.  */
6771
6772 bool
6773 expand_vec_cond_expr_p (tree value_type, tree cmp_op_type)
6774 {
6775   enum machine_mode value_mode = TYPE_MODE (value_type);
6776   enum machine_mode cmp_op_mode = TYPE_MODE (cmp_op_type);
6777   if (GET_MODE_SIZE (value_mode) != GET_MODE_SIZE (cmp_op_mode)
6778       || GET_MODE_NUNITS (value_mode) != GET_MODE_NUNITS (cmp_op_mode)
6779       || get_vcond_icode (TYPE_MODE (value_type), TYPE_MODE (cmp_op_type),
6780                           TYPE_UNSIGNED (cmp_op_type)) == CODE_FOR_nothing)
6781     return false;
6782   return true;
6783 }
6784
6785 /* Generate insns for a VEC_COND_EXPR, given its TYPE and its
6786    three operands.  */
6787
6788 rtx
6789 expand_vec_cond_expr (tree vec_cond_type, tree op0, tree op1, tree op2,
6790                       rtx target)
6791 {
6792   struct expand_operand ops[6];
6793   enum insn_code icode;
6794   rtx comparison, rtx_op1, rtx_op2;
6795   enum machine_mode mode = TYPE_MODE (vec_cond_type);
6796   enum machine_mode cmp_op_mode;
6797   bool unsignedp;
6798   tree op0a, op0b;
6799   enum tree_code tcode;
6800
6801   if (COMPARISON_CLASS_P (op0))
6802     {
6803       op0a = TREE_OPERAND (op0, 0);
6804       op0b = TREE_OPERAND (op0, 1);
6805       tcode = TREE_CODE (op0);
6806     }
6807   else
6808     {
6809       /* Fake op0 < 0.  */
6810       gcc_assert (!TYPE_UNSIGNED (TREE_TYPE (op0)));
6811       op0a = op0;
6812       op0b = build_zero_cst (TREE_TYPE (op0));
6813       tcode = LT_EXPR;
6814     }
6815   unsignedp = TYPE_UNSIGNED (TREE_TYPE (op0a));
6816   cmp_op_mode = TYPE_MODE (TREE_TYPE (op0a));
6817
6818
6819   gcc_assert (GET_MODE_SIZE (mode) == GET_MODE_SIZE (cmp_op_mode)
6820               && GET_MODE_NUNITS (mode) == GET_MODE_NUNITS (cmp_op_mode));
6821
6822   icode = get_vcond_icode (mode, cmp_op_mode, unsignedp);
6823   if (icode == CODE_FOR_nothing)
6824     return 0;
6825
6826   comparison = vector_compare_rtx (tcode, op0a, op0b, unsignedp, icode);
6827   rtx_op1 = expand_normal (op1);
6828   rtx_op2 = expand_normal (op2);
6829
6830   create_output_operand (&ops[0], target, mode);
6831   create_input_operand (&ops[1], rtx_op1, mode);
6832   create_input_operand (&ops[2], rtx_op2, mode);
6833   create_fixed_operand (&ops[3], comparison);
6834   create_fixed_operand (&ops[4], XEXP (comparison, 0));
6835   create_fixed_operand (&ops[5], XEXP (comparison, 1));
6836   expand_insn (icode, 6, ops);
6837   return ops[0].value;
6838 }
6839
6840 /* Return non-zero if a highpart multiply is supported of can be synthisized.
6841    For the benefit of expand_mult_highpart, the return value is 1 for direct,
6842    2 for even/odd widening, and 3 for hi/lo widening.  */
6843
6844 int
6845 can_mult_highpart_p (enum machine_mode mode, bool uns_p)
6846 {
6847   optab op;
6848   unsigned char *sel;
6849   unsigned i, nunits;
6850
6851   op = uns_p ? umul_highpart_optab : smul_highpart_optab;
6852   if (optab_handler (op, mode) != CODE_FOR_nothing)
6853     return 1;
6854
6855   /* If the mode is an integral vector, synth from widening operations.  */
6856   if (GET_MODE_CLASS (mode) != MODE_VECTOR_INT)
6857     return 0;
6858
6859   nunits = GET_MODE_NUNITS (mode);
6860   sel = XALLOCAVEC (unsigned char, nunits);
6861
6862   op = uns_p ? vec_widen_umult_even_optab : vec_widen_smult_even_optab;
6863   if (optab_handler (op, mode) != CODE_FOR_nothing)
6864     {
6865       op = uns_p ? vec_widen_umult_odd_optab : vec_widen_smult_odd_optab;
6866       if (optab_handler (op, mode) != CODE_FOR_nothing)
6867         {
6868           for (i = 0; i < nunits; ++i)
6869             sel[i] = !BYTES_BIG_ENDIAN + (i & ~1) + ((i & 1) ? nunits : 0);
6870           if (can_vec_perm_p (mode, false, sel))
6871             return 2;
6872         }
6873     }
6874
6875   op = uns_p ? vec_widen_umult_hi_optab : vec_widen_smult_hi_optab;
6876   if (optab_handler (op, mode) != CODE_FOR_nothing)
6877     {
6878       op = uns_p ? vec_widen_umult_lo_optab : vec_widen_smult_lo_optab;
6879       if (optab_handler (op, mode) != CODE_FOR_nothing)
6880         {
6881           for (i = 0; i < nunits; ++i)
6882             sel[i] = 2 * i + (BYTES_BIG_ENDIAN ? 0 : 1);
6883           if (can_vec_perm_p (mode, false, sel))
6884             return 3;
6885         }
6886     }
6887
6888   return 0;
6889 }
6890
6891 /* Expand a highpart multiply.  */
6892
6893 rtx
6894 expand_mult_highpart (enum machine_mode mode, rtx op0, rtx op1,
6895                       rtx target, bool uns_p)
6896 {
6897   struct expand_operand eops[3];
6898   enum insn_code icode;
6899   int method, i, nunits;
6900   enum machine_mode wmode;
6901   rtx m1, m2, perm;
6902   optab tab1, tab2;
6903   rtvec v;
6904
6905   method = can_mult_highpart_p (mode, uns_p);
6906   switch (method)
6907     {
6908     case 0:
6909       return NULL_RTX;
6910     case 1:
6911       tab1 = uns_p ? umul_highpart_optab : smul_highpart_optab;
6912       return expand_binop (mode, tab1, op0, op1, target, uns_p,
6913                            OPTAB_LIB_WIDEN);
6914     case 2:
6915       tab1 = uns_p ? vec_widen_umult_even_optab : vec_widen_smult_even_optab;
6916       tab2 = uns_p ? vec_widen_umult_odd_optab : vec_widen_smult_odd_optab;
6917       break;
6918     case 3:
6919       tab1 = uns_p ? vec_widen_umult_lo_optab : vec_widen_smult_lo_optab;
6920       tab2 = uns_p ? vec_widen_umult_hi_optab : vec_widen_smult_hi_optab;
6921       if (BYTES_BIG_ENDIAN)
6922         {
6923           optab t = tab1;
6924           tab1 = tab2;
6925           tab2 = t;
6926         }
6927       break;
6928     default:
6929       gcc_unreachable ();
6930     }
6931
6932   icode = optab_handler (tab1, mode);
6933   nunits = GET_MODE_NUNITS (mode);
6934   wmode = insn_data[icode].operand[0].mode;
6935   gcc_checking_assert (2 * GET_MODE_NUNITS (wmode) == nunits);
6936   gcc_checking_assert (GET_MODE_SIZE (wmode) == GET_MODE_SIZE (mode));
6937
6938   create_output_operand (&eops[0], gen_reg_rtx (wmode), wmode);
6939   create_input_operand (&eops[1], op0, mode);
6940   create_input_operand (&eops[2], op1, mode);
6941   expand_insn (icode, 3, eops);
6942   m1 = gen_lowpart (mode, eops[0].value);
6943
6944   create_output_operand (&eops[0], gen_reg_rtx (wmode), wmode);
6945   create_input_operand (&eops[1], op0, mode);
6946   create_input_operand (&eops[2], op1, mode);
6947   expand_insn (optab_handler (tab2, mode), 3, eops);
6948   m2 = gen_lowpart (mode, eops[0].value);
6949
6950   v = rtvec_alloc (nunits);
6951   if (method == 2)
6952     {
6953       for (i = 0; i < nunits; ++i)
6954         RTVEC_ELT (v, i) = GEN_INT (!BYTES_BIG_ENDIAN + (i & ~1)
6955                                     + ((i & 1) ? nunits : 0));
6956     }
6957   else
6958     {
6959       for (i = 0; i < nunits; ++i)
6960         RTVEC_ELT (v, i) = GEN_INT (2 * i + (BYTES_BIG_ENDIAN ? 0 : 1));
6961     }
6962   perm = gen_rtx_CONST_VECTOR (mode, v);
6963
6964   return expand_vec_perm (mode, m1, m2, perm, target);
6965 }
6966
6967 /* Return true if target supports vector masked load/store for mode.  */
6968 bool
6969 can_vec_mask_load_store_p (enum machine_mode mode, bool is_load)
6970 {
6971   optab op = is_load ? maskload_optab : maskstore_optab;
6972   enum machine_mode vmode;
6973   unsigned int vector_sizes;
6974
6975   /* If mode is vector mode, check it directly.  */
6976   if (VECTOR_MODE_P (mode))
6977     return optab_handler (op, mode) != CODE_FOR_nothing;
6978
6979   /* Otherwise, return true if there is some vector mode with
6980      the mask load/store supported.  */
6981
6982   /* See if there is any chance the mask load or store might be
6983      vectorized.  If not, punt.  */
6984   vmode = targetm.vectorize.preferred_simd_mode (mode);
6985   if (!VECTOR_MODE_P (vmode))
6986     return false;
6987
6988   if (optab_handler (op, vmode) != CODE_FOR_nothing)
6989     return true;
6990
6991   vector_sizes = targetm.vectorize.autovectorize_vector_sizes ();
6992   while (vector_sizes != 0)
6993     {
6994       unsigned int cur = 1 << floor_log2 (vector_sizes);
6995       vector_sizes &= ~cur;
6996       if (cur <= GET_MODE_SIZE (mode))
6997         continue;
6998       vmode = mode_for_vector (mode, cur / GET_MODE_SIZE (mode));
6999       if (VECTOR_MODE_P (vmode)
7000           && optab_handler (op, vmode) != CODE_FOR_nothing)
7001         return true;
7002     }
7003   return false;
7004 }
7005 \f
7006 /* Return true if there is a compare_and_swap pattern.  */
7007
7008 bool
7009 can_compare_and_swap_p (enum machine_mode mode, bool allow_libcall)
7010 {
7011   enum insn_code icode;
7012
7013   /* Check for __atomic_compare_and_swap.  */
7014   icode = direct_optab_handler (atomic_compare_and_swap_optab, mode);
7015   if (icode != CODE_FOR_nothing)
7016     return true;
7017
7018   /* Check for __sync_compare_and_swap.  */
7019   icode = optab_handler (sync_compare_and_swap_optab, mode);
7020   if (icode != CODE_FOR_nothing)
7021     return true;
7022   if (allow_libcall && optab_libfunc (sync_compare_and_swap_optab, mode))
7023     return true;
7024
7025   /* No inline compare and swap.  */
7026   return false;
7027 }
7028
7029 /* Return true if an atomic exchange can be performed.  */
7030
7031 bool
7032 can_atomic_exchange_p (enum machine_mode mode, bool allow_libcall)
7033 {
7034   enum insn_code icode;
7035
7036   /* Check for __atomic_exchange.  */
7037   icode = direct_optab_handler (atomic_exchange_optab, mode);
7038   if (icode != CODE_FOR_nothing)
7039     return true;
7040
7041   /* Don't check __sync_test_and_set, as on some platforms that
7042      has reduced functionality.  Targets that really do support
7043      a proper exchange should simply be updated to the __atomics.  */
7044
7045   return can_compare_and_swap_p (mode, allow_libcall);
7046 }
7047
7048
7049 /* Helper function to find the MODE_CC set in a sync_compare_and_swap
7050    pattern.  */
7051
7052 static void
7053 find_cc_set (rtx x, const_rtx pat, void *data)
7054 {
7055   if (REG_P (x) && GET_MODE_CLASS (GET_MODE (x)) == MODE_CC
7056       && GET_CODE (pat) == SET)
7057     {
7058       rtx *p_cc_reg = (rtx *) data;
7059       gcc_assert (!*p_cc_reg);
7060       *p_cc_reg = x;
7061     }
7062 }
7063
7064 /* This is a helper function for the other atomic operations.  This function
7065    emits a loop that contains SEQ that iterates until a compare-and-swap
7066    operation at the end succeeds.  MEM is the memory to be modified.  SEQ is
7067    a set of instructions that takes a value from OLD_REG as an input and
7068    produces a value in NEW_REG as an output.  Before SEQ, OLD_REG will be
7069    set to the current contents of MEM.  After SEQ, a compare-and-swap will
7070    attempt to update MEM with NEW_REG.  The function returns true when the
7071    loop was generated successfully.  */
7072
7073 static bool
7074 expand_compare_and_swap_loop (rtx mem, rtx old_reg, rtx new_reg, rtx seq)
7075 {
7076   enum machine_mode mode = GET_MODE (mem);
7077   rtx label, cmp_reg, success, oldval;
7078
7079   /* The loop we want to generate looks like
7080
7081         cmp_reg = mem;
7082       label:
7083         old_reg = cmp_reg;
7084         seq;
7085         (success, cmp_reg) = compare-and-swap(mem, old_reg, new_reg)
7086         if (success)
7087           goto label;
7088
7089      Note that we only do the plain load from memory once.  Subsequent
7090      iterations use the value loaded by the compare-and-swap pattern.  */
7091
7092   label = gen_label_rtx ();
7093   cmp_reg = gen_reg_rtx (mode);
7094
7095   emit_move_insn (cmp_reg, mem);
7096   emit_label (label);
7097   emit_move_insn (old_reg, cmp_reg);
7098   if (seq)
7099     emit_insn (seq);
7100
7101   success = NULL_RTX;
7102   oldval = cmp_reg;
7103   if (!expand_atomic_compare_and_swap (&success, &oldval, mem, old_reg,
7104                                        new_reg, false, MEMMODEL_SEQ_CST,
7105                                        MEMMODEL_RELAXED))
7106     return false;
7107
7108   if (oldval != cmp_reg)
7109     emit_move_insn (cmp_reg, oldval);
7110
7111   /* Mark this jump predicted not taken.  */
7112   emit_cmp_and_jump_insns (success, const0_rtx, EQ, const0_rtx,
7113                            GET_MODE (success), 1, label, 0);
7114   return true;
7115 }
7116
7117
7118 /* This function tries to emit an atomic_exchange intruction.  VAL is written
7119    to *MEM using memory model MODEL. The previous contents of *MEM are returned,
7120    using TARGET if possible.  */
7121
7122 static rtx
7123 maybe_emit_atomic_exchange (rtx target, rtx mem, rtx val, enum memmodel model)
7124 {
7125   enum machine_mode mode = GET_MODE (mem);
7126   enum insn_code icode;
7127
7128   /* If the target supports the exchange directly, great.  */
7129   icode = direct_optab_handler (atomic_exchange_optab, mode);
7130   if (icode != CODE_FOR_nothing)
7131     {
7132       struct expand_operand ops[4];
7133
7134       create_output_operand (&ops[0], target, mode);
7135       create_fixed_operand (&ops[1], mem);
7136       create_input_operand (&ops[2], val, mode);
7137       create_integer_operand (&ops[3], model);
7138       if (maybe_expand_insn (icode, 4, ops))
7139         return ops[0].value;
7140     }
7141
7142   return NULL_RTX;
7143 }
7144
7145 /* This function tries to implement an atomic exchange operation using
7146    __sync_lock_test_and_set. VAL is written to *MEM using memory model MODEL.
7147    The previous contents of *MEM are returned, using TARGET if possible.
7148    Since this instructionn is an acquire barrier only, stronger memory
7149    models may require additional barriers to be emitted.  */
7150
7151 static rtx
7152 maybe_emit_sync_lock_test_and_set (rtx target, rtx mem, rtx val,
7153                                    enum memmodel model)
7154 {
7155   enum machine_mode mode = GET_MODE (mem);
7156   enum insn_code icode;
7157   rtx last_insn = get_last_insn ();
7158
7159   icode = optab_handler (sync_lock_test_and_set_optab, mode);
7160
7161   /* Legacy sync_lock_test_and_set is an acquire barrier.  If the pattern
7162      exists, and the memory model is stronger than acquire, add a release
7163      barrier before the instruction.  */
7164
7165   if ((model & MEMMODEL_MASK) == MEMMODEL_SEQ_CST
7166       || (model & MEMMODEL_MASK) == MEMMODEL_RELEASE
7167       || (model & MEMMODEL_MASK) == MEMMODEL_ACQ_REL)
7168     expand_mem_thread_fence (model);
7169
7170   if (icode != CODE_FOR_nothing)
7171     {
7172       struct expand_operand ops[3];
7173       create_output_operand (&ops[0], target, mode);
7174       create_fixed_operand (&ops[1], mem);
7175       create_input_operand (&ops[2], val, mode);
7176       if (maybe_expand_insn (icode, 3, ops))
7177         return ops[0].value;
7178     }
7179
7180   /* If an external test-and-set libcall is provided, use that instead of
7181      any external compare-and-swap that we might get from the compare-and-
7182      swap-loop expansion later.  */
7183   if (!can_compare_and_swap_p (mode, false))
7184     {
7185       rtx libfunc = optab_libfunc (sync_lock_test_and_set_optab, mode);
7186       if (libfunc != NULL)
7187         {
7188           rtx addr;
7189
7190           addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
7191           return emit_library_call_value (libfunc, NULL_RTX, LCT_NORMAL,
7192                                           mode, 2, addr, ptr_mode,
7193                                           val, mode);
7194         }
7195     }
7196
7197   /* If the test_and_set can't be emitted, eliminate any barrier that might
7198      have been emitted.  */
7199   delete_insns_since (last_insn);
7200   return NULL_RTX;
7201 }
7202
7203 /* This function tries to implement an atomic exchange operation using a
7204    compare_and_swap loop. VAL is written to *MEM.  The previous contents of
7205    *MEM are returned, using TARGET if possible.  No memory model is required
7206    since a compare_and_swap loop is seq-cst.  */
7207
7208 static rtx
7209 maybe_emit_compare_and_swap_exchange_loop (rtx target, rtx mem, rtx val)
7210 {
7211   enum machine_mode mode = GET_MODE (mem);
7212
7213   if (can_compare_and_swap_p (mode, true))
7214     {
7215       if (!target || !register_operand (target, mode))
7216         target = gen_reg_rtx (mode);
7217       if (expand_compare_and_swap_loop (mem, target, val, NULL_RTX))
7218         return target;
7219     }
7220
7221   return NULL_RTX;
7222 }
7223
7224 /* This function tries to implement an atomic test-and-set operation
7225    using the atomic_test_and_set instruction pattern.  A boolean value
7226    is returned from the operation, using TARGET if possible.  */
7227
7228 #ifndef HAVE_atomic_test_and_set
7229 #define HAVE_atomic_test_and_set 0
7230 #define CODE_FOR_atomic_test_and_set CODE_FOR_nothing
7231 #endif
7232
7233 static rtx
7234 maybe_emit_atomic_test_and_set (rtx target, rtx mem, enum memmodel model)
7235 {
7236   enum machine_mode pat_bool_mode;
7237   struct expand_operand ops[3];
7238
7239   if (!HAVE_atomic_test_and_set)
7240     return NULL_RTX;
7241
7242   /* While we always get QImode from __atomic_test_and_set, we get
7243      other memory modes from __sync_lock_test_and_set.  Note that we
7244      use no endian adjustment here.  This matches the 4.6 behavior
7245      in the Sparc backend.  */
7246   gcc_checking_assert
7247     (insn_data[CODE_FOR_atomic_test_and_set].operand[1].mode == QImode);
7248   if (GET_MODE (mem) != QImode)
7249     mem = adjust_address_nv (mem, QImode, 0);
7250
7251   pat_bool_mode = insn_data[CODE_FOR_atomic_test_and_set].operand[0].mode;
7252   create_output_operand (&ops[0], target, pat_bool_mode);
7253   create_fixed_operand (&ops[1], mem);
7254   create_integer_operand (&ops[2], model);
7255
7256   if (maybe_expand_insn (CODE_FOR_atomic_test_and_set, 3, ops))
7257     return ops[0].value;
7258   return NULL_RTX;
7259 }
7260
7261 /* This function expands the legacy _sync_lock test_and_set operation which is
7262    generally an atomic exchange.  Some limited targets only allow the
7263    constant 1 to be stored.  This is an ACQUIRE operation.
7264
7265    TARGET is an optional place to stick the return value.
7266    MEM is where VAL is stored.  */
7267
7268 rtx
7269 expand_sync_lock_test_and_set (rtx target, rtx mem, rtx val)
7270 {
7271   rtx ret;
7272
7273   /* Try an atomic_exchange first.  */
7274   ret = maybe_emit_atomic_exchange (target, mem, val, MEMMODEL_ACQUIRE);
7275   if (ret)
7276     return ret;
7277
7278   ret = maybe_emit_sync_lock_test_and_set (target, mem, val, MEMMODEL_ACQUIRE);
7279   if (ret)
7280     return ret;
7281
7282   ret = maybe_emit_compare_and_swap_exchange_loop (target, mem, val);
7283   if (ret)
7284     return ret;
7285
7286   /* If there are no other options, try atomic_test_and_set if the value
7287      being stored is 1.  */
7288   if (val == const1_rtx)
7289     ret = maybe_emit_atomic_test_and_set (target, mem, MEMMODEL_ACQUIRE);
7290
7291   return ret;
7292 }
7293
7294 /* This function expands the atomic test_and_set operation:
7295    atomically store a boolean TRUE into MEM and return the previous value.
7296
7297    MEMMODEL is the memory model variant to use.
7298    TARGET is an optional place to stick the return value.  */
7299
7300 rtx
7301 expand_atomic_test_and_set (rtx target, rtx mem, enum memmodel model)
7302 {
7303   enum machine_mode mode = GET_MODE (mem);
7304   rtx ret, trueval, subtarget;
7305
7306   ret = maybe_emit_atomic_test_and_set (target, mem, model);
7307   if (ret)
7308     return ret;
7309
7310   /* Be binary compatible with non-default settings of trueval, and different
7311      cpu revisions.  E.g. one revision may have atomic-test-and-set, but
7312      another only has atomic-exchange.  */
7313   if (targetm.atomic_test_and_set_trueval == 1)
7314     {
7315       trueval = const1_rtx;
7316       subtarget = target ? target : gen_reg_rtx (mode);
7317     }
7318   else
7319     {
7320       trueval = gen_int_mode (targetm.atomic_test_and_set_trueval, mode);
7321       subtarget = gen_reg_rtx (mode);
7322     }
7323
7324   /* Try the atomic-exchange optab...  */
7325   ret = maybe_emit_atomic_exchange (subtarget, mem, trueval, model);
7326
7327   /* ... then an atomic-compare-and-swap loop ... */
7328   if (!ret)
7329     ret = maybe_emit_compare_and_swap_exchange_loop (subtarget, mem, trueval);
7330
7331   /* ... before trying the vaguely defined legacy lock_test_and_set. */
7332   if (!ret)
7333     ret = maybe_emit_sync_lock_test_and_set (subtarget, mem, trueval, model);
7334
7335   /* Recall that the legacy lock_test_and_set optab was allowed to do magic
7336      things with the value 1.  Thus we try again without trueval.  */
7337   if (!ret && targetm.atomic_test_and_set_trueval != 1)
7338     ret = maybe_emit_sync_lock_test_and_set (subtarget, mem, const1_rtx, model);
7339
7340   /* Failing all else, assume a single threaded environment and simply
7341      perform the operation.  */
7342   if (!ret)
7343     {
7344       /* If the result is ignored skip the move to target.  */
7345       if (subtarget != const0_rtx)
7346         emit_move_insn (subtarget, mem);
7347
7348       emit_move_insn (mem, trueval);
7349       ret = subtarget;
7350     }
7351
7352   /* Recall that have to return a boolean value; rectify if trueval
7353      is not exactly one.  */
7354   if (targetm.atomic_test_and_set_trueval != 1)
7355     ret = emit_store_flag_force (target, NE, ret, const0_rtx, mode, 0, 1);
7356
7357   return ret;
7358 }
7359
7360 /* This function expands the atomic exchange operation:
7361    atomically store VAL in MEM and return the previous value in MEM.
7362
7363    MEMMODEL is the memory model variant to use.
7364    TARGET is an optional place to stick the return value.  */
7365
7366 rtx
7367 expand_atomic_exchange (rtx target, rtx mem, rtx val, enum memmodel model)
7368 {
7369   rtx ret;
7370
7371   ret = maybe_emit_atomic_exchange (target, mem, val, model);
7372
7373   /* Next try a compare-and-swap loop for the exchange.  */
7374   if (!ret)
7375     ret = maybe_emit_compare_and_swap_exchange_loop (target, mem, val);
7376
7377   return ret;
7378 }
7379
7380 /* This function expands the atomic compare exchange operation:
7381
7382    *PTARGET_BOOL is an optional place to store the boolean success/failure.
7383    *PTARGET_OVAL is an optional place to store the old value from memory.
7384    Both target parameters may be NULL to indicate that we do not care about
7385    that return value.  Both target parameters are updated on success to
7386    the actual location of the corresponding result.
7387
7388    MEMMODEL is the memory model variant to use.
7389
7390    The return value of the function is true for success.  */
7391
7392 bool
7393 expand_atomic_compare_and_swap (rtx *ptarget_bool, rtx *ptarget_oval,
7394                                 rtx mem, rtx expected, rtx desired,
7395                                 bool is_weak, enum memmodel succ_model,
7396                                 enum memmodel fail_model)
7397 {
7398   enum machine_mode mode = GET_MODE (mem);
7399   struct expand_operand ops[8];
7400   enum insn_code icode;
7401   rtx target_oval, target_bool = NULL_RTX;
7402   rtx libfunc;
7403
7404   /* Load expected into a register for the compare and swap.  */
7405   if (MEM_P (expected))
7406     expected = copy_to_reg (expected);
7407
7408   /* Make sure we always have some place to put the return oldval.
7409      Further, make sure that place is distinct from the input expected,
7410      just in case we need that path down below.  */
7411   if (ptarget_oval == NULL
7412       || (target_oval = *ptarget_oval) == NULL
7413       || reg_overlap_mentioned_p (expected, target_oval))
7414     target_oval = gen_reg_rtx (mode);
7415
7416   icode = direct_optab_handler (atomic_compare_and_swap_optab, mode);
7417   if (icode != CODE_FOR_nothing)
7418     {
7419       enum machine_mode bool_mode = insn_data[icode].operand[0].mode;
7420
7421       /* Make sure we always have a place for the bool operand.  */
7422       if (ptarget_bool == NULL
7423           || (target_bool = *ptarget_bool) == NULL
7424           || GET_MODE (target_bool) != bool_mode)
7425         target_bool = gen_reg_rtx (bool_mode);
7426
7427       /* Emit the compare_and_swap.  */
7428       create_output_operand (&ops[0], target_bool, bool_mode);
7429       create_output_operand (&ops[1], target_oval, mode);
7430       create_fixed_operand (&ops[2], mem);
7431       create_input_operand (&ops[3], expected, mode);
7432       create_input_operand (&ops[4], desired, mode);
7433       create_integer_operand (&ops[5], is_weak);
7434       create_integer_operand (&ops[6], succ_model);
7435       create_integer_operand (&ops[7], fail_model);
7436       if (maybe_expand_insn (icode, 8, ops))
7437         {
7438           /* Return success/failure.  */
7439           target_bool = ops[0].value;
7440           target_oval = ops[1].value;
7441           goto success;
7442         }
7443     }
7444
7445   /* Otherwise fall back to the original __sync_val_compare_and_swap
7446      which is always seq-cst.  */
7447   icode = optab_handler (sync_compare_and_swap_optab, mode);
7448   if (icode != CODE_FOR_nothing)
7449     {
7450       rtx cc_reg;
7451
7452       create_output_operand (&ops[0], target_oval, mode);
7453       create_fixed_operand (&ops[1], mem);
7454       create_input_operand (&ops[2], expected, mode);
7455       create_input_operand (&ops[3], desired, mode);
7456       if (!maybe_expand_insn (icode, 4, ops))
7457         return false;
7458
7459       target_oval = ops[0].value;
7460
7461       /* If the caller isn't interested in the boolean return value,
7462          skip the computation of it.  */
7463       if (ptarget_bool == NULL)
7464         goto success;
7465
7466       /* Otherwise, work out if the compare-and-swap succeeded.  */
7467       cc_reg = NULL_RTX;
7468       if (have_insn_for (COMPARE, CCmode))
7469         note_stores (PATTERN (get_last_insn ()), find_cc_set, &cc_reg);
7470       if (cc_reg)
7471         {
7472           target_bool = emit_store_flag_force (target_bool, EQ, cc_reg,
7473                                                const0_rtx, VOIDmode, 0, 1);
7474           goto success;
7475         }
7476       goto success_bool_from_val;
7477     }
7478
7479   /* Also check for library support for __sync_val_compare_and_swap.  */
7480   libfunc = optab_libfunc (sync_compare_and_swap_optab, mode);
7481   if (libfunc != NULL)
7482     {
7483       rtx addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
7484       target_oval = emit_library_call_value (libfunc, NULL_RTX, LCT_NORMAL,
7485                                              mode, 3, addr, ptr_mode,
7486                                              expected, mode, desired, mode);
7487
7488       /* Compute the boolean return value only if requested.  */
7489       if (ptarget_bool)
7490         goto success_bool_from_val;
7491       else
7492         goto success;
7493     }
7494
7495   /* Failure.  */
7496   return false;
7497
7498  success_bool_from_val:
7499    target_bool = emit_store_flag_force (target_bool, EQ, target_oval,
7500                                         expected, VOIDmode, 1, 1);
7501  success:
7502   /* Make sure that the oval output winds up where the caller asked.  */
7503   if (ptarget_oval)
7504     *ptarget_oval = target_oval;
7505   if (ptarget_bool)
7506     *ptarget_bool = target_bool;
7507   return true;
7508 }
7509
7510 /* Generate asm volatile("" : : : "memory") as the memory barrier.  */
7511
7512 static void
7513 expand_asm_memory_barrier (void)
7514 {
7515   rtx asm_op, clob;
7516
7517   asm_op = gen_rtx_ASM_OPERANDS (VOIDmode, empty_string, empty_string, 0,
7518                                  rtvec_alloc (0), rtvec_alloc (0),
7519                                  rtvec_alloc (0), UNKNOWN_LOCATION);
7520   MEM_VOLATILE_P (asm_op) = 1;
7521
7522   clob = gen_rtx_SCRATCH (VOIDmode);
7523   clob = gen_rtx_MEM (BLKmode, clob);
7524   clob = gen_rtx_CLOBBER (VOIDmode, clob);
7525
7526   emit_insn (gen_rtx_PARALLEL (VOIDmode, gen_rtvec (2, asm_op, clob)));
7527 }
7528
7529 /* This routine will either emit the mem_thread_fence pattern or issue a
7530    sync_synchronize to generate a fence for memory model MEMMODEL.  */
7531
7532 #ifndef HAVE_mem_thread_fence
7533 # define HAVE_mem_thread_fence 0
7534 # define gen_mem_thread_fence(x) (gcc_unreachable (), NULL_RTX)
7535 #endif
7536 #ifndef HAVE_memory_barrier
7537 # define HAVE_memory_barrier 0
7538 # define gen_memory_barrier()  (gcc_unreachable (), NULL_RTX)
7539 #endif
7540
7541 void
7542 expand_mem_thread_fence (enum memmodel model)
7543 {
7544   if (HAVE_mem_thread_fence)
7545     emit_insn (gen_mem_thread_fence (GEN_INT (model)));
7546   else if ((model & MEMMODEL_MASK) != MEMMODEL_RELAXED)
7547     {
7548       if (HAVE_memory_barrier)
7549         emit_insn (gen_memory_barrier ());
7550       else if (synchronize_libfunc != NULL_RTX)
7551         emit_library_call (synchronize_libfunc, LCT_NORMAL, VOIDmode, 0);
7552       else
7553         expand_asm_memory_barrier ();
7554     }
7555 }
7556
7557 /* This routine will either emit the mem_signal_fence pattern or issue a
7558    sync_synchronize to generate a fence for memory model MEMMODEL.  */
7559
7560 #ifndef HAVE_mem_signal_fence
7561 # define HAVE_mem_signal_fence 0
7562 # define gen_mem_signal_fence(x) (gcc_unreachable (), NULL_RTX)
7563 #endif
7564
7565 void
7566 expand_mem_signal_fence (enum memmodel model)
7567 {
7568   if (HAVE_mem_signal_fence)
7569     emit_insn (gen_mem_signal_fence (GEN_INT (model)));
7570   else if ((model & MEMMODEL_MASK) != MEMMODEL_RELAXED)
7571     {
7572       /* By default targets are coherent between a thread and the signal
7573          handler running on the same thread.  Thus this really becomes a
7574          compiler barrier, in that stores must not be sunk past
7575          (or raised above) a given point.  */
7576       expand_asm_memory_barrier ();
7577     }
7578 }
7579
7580 /* This function expands the atomic load operation:
7581    return the atomically loaded value in MEM.
7582
7583    MEMMODEL is the memory model variant to use.
7584    TARGET is an option place to stick the return value.  */
7585
7586 rtx
7587 expand_atomic_load (rtx target, rtx mem, enum memmodel model)
7588 {
7589   enum machine_mode mode = GET_MODE (mem);
7590   enum insn_code icode;
7591
7592   /* If the target supports the load directly, great.  */
7593   icode = direct_optab_handler (atomic_load_optab, mode);
7594   if (icode != CODE_FOR_nothing)
7595     {
7596       struct expand_operand ops[3];
7597
7598       create_output_operand (&ops[0], target, mode);
7599       create_fixed_operand (&ops[1], mem);
7600       create_integer_operand (&ops[2], model);
7601       if (maybe_expand_insn (icode, 3, ops))
7602         return ops[0].value;
7603     }
7604
7605   /* If the size of the object is greater than word size on this target,
7606      then we assume that a load will not be atomic.  */
7607   if (GET_MODE_PRECISION (mode) > BITS_PER_WORD)
7608     {
7609       /* Issue val = compare_and_swap (mem, 0, 0).
7610          This may cause the occasional harmless store of 0 when the value is
7611          already 0, but it seems to be OK according to the standards guys.  */
7612       if (expand_atomic_compare_and_swap (NULL, &target, mem, const0_rtx,
7613                                           const0_rtx, false, model, model))
7614         return target;
7615       else
7616       /* Otherwise there is no atomic load, leave the library call.  */
7617         return NULL_RTX;
7618     }
7619
7620   /* Otherwise assume loads are atomic, and emit the proper barriers.  */
7621   if (!target || target == const0_rtx)
7622     target = gen_reg_rtx (mode);
7623
7624   /* For SEQ_CST, emit a barrier before the load.  */
7625   if ((model & MEMMODEL_MASK) == MEMMODEL_SEQ_CST)
7626     expand_mem_thread_fence (model);
7627
7628   emit_move_insn (target, mem);
7629
7630   /* Emit the appropriate barrier after the load.  */
7631   expand_mem_thread_fence (model);
7632
7633   return target;
7634 }
7635
7636 /* This function expands the atomic store operation:
7637    Atomically store VAL in MEM.
7638    MEMMODEL is the memory model variant to use.
7639    USE_RELEASE is true if __sync_lock_release can be used as a fall back.
7640    function returns const0_rtx if a pattern was emitted.  */
7641
7642 rtx
7643 expand_atomic_store (rtx mem, rtx val, enum memmodel model, bool use_release)
7644 {
7645   enum machine_mode mode = GET_MODE (mem);
7646   enum insn_code icode;
7647   struct expand_operand ops[3];
7648
7649   /* If the target supports the store directly, great.  */
7650   icode = direct_optab_handler (atomic_store_optab, mode);
7651   if (icode != CODE_FOR_nothing)
7652     {
7653       create_fixed_operand (&ops[0], mem);
7654       create_input_operand (&ops[1], val, mode);
7655       create_integer_operand (&ops[2], model);
7656       if (maybe_expand_insn (icode, 3, ops))
7657         return const0_rtx;
7658     }
7659
7660   /* If using __sync_lock_release is a viable alternative, try it.  */
7661   if (use_release)
7662     {
7663       icode = direct_optab_handler (sync_lock_release_optab, mode);
7664       if (icode != CODE_FOR_nothing)
7665         {
7666           create_fixed_operand (&ops[0], mem);
7667           create_input_operand (&ops[1], const0_rtx, mode);
7668           if (maybe_expand_insn (icode, 2, ops))
7669             {
7670               /* lock_release is only a release barrier.  */
7671               if ((model & MEMMODEL_MASK) == MEMMODEL_SEQ_CST)
7672                 expand_mem_thread_fence (model);
7673               return const0_rtx;
7674             }
7675         }
7676     }
7677
7678   /* If the size of the object is greater than word size on this target,
7679      a default store will not be atomic, Try a mem_exchange and throw away
7680      the result.  If that doesn't work, don't do anything.  */
7681   if (GET_MODE_PRECISION (mode) > BITS_PER_WORD)
7682     {
7683       rtx target = maybe_emit_atomic_exchange (NULL_RTX, mem, val, model);
7684       if (!target)
7685         target = maybe_emit_compare_and_swap_exchange_loop (NULL_RTX, mem, val);
7686       if (target)
7687         return const0_rtx;
7688       else
7689         return NULL_RTX;
7690     }
7691
7692   /* Otherwise assume stores are atomic, and emit the proper barriers.  */
7693   expand_mem_thread_fence (model);
7694
7695   emit_move_insn (mem, val);
7696
7697   /* For SEQ_CST, also emit a barrier after the store.  */
7698   if ((model & MEMMODEL_MASK) == MEMMODEL_SEQ_CST)
7699     expand_mem_thread_fence (model);
7700
7701   return const0_rtx;
7702 }
7703
7704
7705 /* Structure containing the pointers and values required to process the
7706    various forms of the atomic_fetch_op and atomic_op_fetch builtins.  */
7707
7708 struct atomic_op_functions
7709 {
7710   direct_optab mem_fetch_before;
7711   direct_optab mem_fetch_after;
7712   direct_optab mem_no_result;
7713   optab fetch_before;
7714   optab fetch_after;
7715   direct_optab no_result;
7716   enum rtx_code reverse_code;
7717 };
7718
7719
7720 /* Fill in structure pointed to by OP with the various optab entries for an
7721    operation of type CODE.  */
7722
7723 static void
7724 get_atomic_op_for_code (struct atomic_op_functions *op, enum rtx_code code)
7725 {
7726   gcc_assert (op!= NULL);
7727
7728   /* If SWITCHABLE_TARGET is defined, then subtargets can be switched
7729      in the source code during compilation, and the optab entries are not
7730      computable until runtime.  Fill in the values at runtime.  */
7731   switch (code)
7732     {
7733     case PLUS:
7734       op->mem_fetch_before = atomic_fetch_add_optab;
7735       op->mem_fetch_after = atomic_add_fetch_optab;
7736       op->mem_no_result = atomic_add_optab;
7737       op->fetch_before = sync_old_add_optab;
7738       op->fetch_after = sync_new_add_optab;
7739       op->no_result = sync_add_optab;
7740       op->reverse_code = MINUS;
7741       break;
7742     case MINUS:
7743       op->mem_fetch_before = atomic_fetch_sub_optab;
7744       op->mem_fetch_after = atomic_sub_fetch_optab;
7745       op->mem_no_result = atomic_sub_optab;
7746       op->fetch_before = sync_old_sub_optab;
7747       op->fetch_after = sync_new_sub_optab;
7748       op->no_result = sync_sub_optab;
7749       op->reverse_code = PLUS;
7750       break;
7751     case XOR:
7752       op->mem_fetch_before = atomic_fetch_xor_optab;
7753       op->mem_fetch_after = atomic_xor_fetch_optab;
7754       op->mem_no_result = atomic_xor_optab;
7755       op->fetch_before = sync_old_xor_optab;
7756       op->fetch_after = sync_new_xor_optab;
7757       op->no_result = sync_xor_optab;
7758       op->reverse_code = XOR;
7759       break;
7760     case AND:
7761       op->mem_fetch_before = atomic_fetch_and_optab;
7762       op->mem_fetch_after = atomic_and_fetch_optab;
7763       op->mem_no_result = atomic_and_optab;
7764       op->fetch_before = sync_old_and_optab;
7765       op->fetch_after = sync_new_and_optab;
7766       op->no_result = sync_and_optab;
7767       op->reverse_code = UNKNOWN;
7768       break;
7769     case IOR:
7770       op->mem_fetch_before = atomic_fetch_or_optab;
7771       op->mem_fetch_after = atomic_or_fetch_optab;
7772       op->mem_no_result = atomic_or_optab;
7773       op->fetch_before = sync_old_ior_optab;
7774       op->fetch_after = sync_new_ior_optab;
7775       op->no_result = sync_ior_optab;
7776       op->reverse_code = UNKNOWN;
7777       break;
7778     case NOT:
7779       op->mem_fetch_before = atomic_fetch_nand_optab;
7780       op->mem_fetch_after = atomic_nand_fetch_optab;
7781       op->mem_no_result = atomic_nand_optab;
7782       op->fetch_before = sync_old_nand_optab;
7783       op->fetch_after = sync_new_nand_optab;
7784       op->no_result = sync_nand_optab;
7785       op->reverse_code = UNKNOWN;
7786       break;
7787     default:
7788       gcc_unreachable ();
7789     }
7790 }
7791
7792 /* See if there is a more optimal way to implement the operation "*MEM CODE VAL"
7793    using memory order MODEL.  If AFTER is true the operation needs to return
7794    the value of *MEM after the operation, otherwise the previous value.
7795    TARGET is an optional place to place the result.  The result is unused if
7796    it is const0_rtx.
7797    Return the result if there is a better sequence, otherwise NULL_RTX.  */
7798
7799 static rtx
7800 maybe_optimize_fetch_op (rtx target, rtx mem, rtx val, enum rtx_code code,
7801                          enum memmodel model, bool after)
7802 {
7803   /* If the value is prefetched, or not used, it may be possible to replace
7804      the sequence with a native exchange operation.  */
7805   if (!after || target == const0_rtx)
7806     {
7807       /* fetch_and (&x, 0, m) can be replaced with exchange (&x, 0, m).  */
7808       if (code == AND && val == const0_rtx)
7809         {
7810           if (target == const0_rtx)
7811             target = gen_reg_rtx (GET_MODE (mem));
7812           return maybe_emit_atomic_exchange (target, mem, val, model);
7813         }
7814
7815       /* fetch_or (&x, -1, m) can be replaced with exchange (&x, -1, m).  */
7816       if (code == IOR && val == constm1_rtx)
7817         {
7818           if (target == const0_rtx)
7819             target = gen_reg_rtx (GET_MODE (mem));
7820           return maybe_emit_atomic_exchange (target, mem, val, model);
7821         }
7822     }
7823
7824   return NULL_RTX;
7825 }
7826
7827 /* Try to emit an instruction for a specific operation varaition.
7828    OPTAB contains the OP functions.
7829    TARGET is an optional place to return the result. const0_rtx means unused.
7830    MEM is the memory location to operate on.
7831    VAL is the value to use in the operation.
7832    USE_MEMMODEL is TRUE if the variation with a memory model should be tried.
7833    MODEL is the memory model, if used.
7834    AFTER is true if the returned result is the value after the operation.  */
7835
7836 static rtx
7837 maybe_emit_op (const struct atomic_op_functions *optab, rtx target, rtx mem,
7838                rtx val, bool use_memmodel, enum memmodel model, bool after)
7839 {
7840   enum machine_mode mode = GET_MODE (mem);
7841   struct expand_operand ops[4];
7842   enum insn_code icode;
7843   int op_counter = 0;
7844   int num_ops;
7845
7846   /* Check to see if there is a result returned.  */
7847   if (target == const0_rtx)
7848     {
7849       if (use_memmodel)
7850         {
7851           icode = direct_optab_handler (optab->mem_no_result, mode);
7852           create_integer_operand (&ops[2], model);
7853           num_ops = 3;
7854         }
7855       else
7856         {
7857           icode = direct_optab_handler (optab->no_result, mode);
7858           num_ops = 2;
7859         }
7860     }
7861   /* Otherwise, we need to generate a result.  */
7862   else
7863     {
7864       if (use_memmodel)
7865         {
7866           icode = direct_optab_handler (after ? optab->mem_fetch_after
7867                                         : optab->mem_fetch_before, mode);
7868           create_integer_operand (&ops[3], model);
7869           num_ops = 4;
7870         }
7871       else
7872         {
7873           icode = optab_handler (after ? optab->fetch_after
7874                                  : optab->fetch_before, mode);
7875           num_ops = 3;
7876         }
7877       create_output_operand (&ops[op_counter++], target, mode);
7878     }
7879   if (icode == CODE_FOR_nothing)
7880     return NULL_RTX;
7881
7882   create_fixed_operand (&ops[op_counter++], mem);
7883   /* VAL may have been promoted to a wider mode.  Shrink it if so.  */
7884   create_convert_operand_to (&ops[op_counter++], val, mode, true);
7885
7886   if (maybe_expand_insn (icode, num_ops, ops))
7887     return (target == const0_rtx ? const0_rtx : ops[0].value);
7888
7889   return NULL_RTX;
7890 }
7891
7892
7893 /* This function expands an atomic fetch_OP or OP_fetch operation:
7894    TARGET is an option place to stick the return value.  const0_rtx indicates
7895    the result is unused.
7896    atomically fetch MEM, perform the operation with VAL and return it to MEM.
7897    CODE is the operation being performed (OP)
7898    MEMMODEL is the memory model variant to use.
7899    AFTER is true to return the result of the operation (OP_fetch).
7900    AFTER is false to return the value before the operation (fetch_OP).
7901
7902    This function will *only* generate instructions if there is a direct
7903    optab. No compare and swap loops or libcalls will be generated. */
7904
7905 static rtx
7906 expand_atomic_fetch_op_no_fallback (rtx target, rtx mem, rtx val,
7907                                     enum rtx_code code, enum memmodel model,
7908                                     bool after)
7909 {
7910   enum machine_mode mode = GET_MODE (mem);
7911   struct atomic_op_functions optab;
7912   rtx result;
7913   bool unused_result = (target == const0_rtx);
7914
7915   get_atomic_op_for_code (&optab, code);
7916
7917   /* Check to see if there are any better instructions.  */
7918   result = maybe_optimize_fetch_op (target, mem, val, code, model, after);
7919   if (result)
7920     return result;
7921
7922   /* Check for the case where the result isn't used and try those patterns.  */
7923   if (unused_result)
7924     {
7925       /* Try the memory model variant first.  */
7926       result = maybe_emit_op (&optab, target, mem, val, true, model, true);
7927       if (result)
7928         return result;
7929
7930       /* Next try the old style withuot a memory model.  */
7931       result = maybe_emit_op (&optab, target, mem, val, false, model, true);
7932       if (result)
7933         return result;
7934
7935       /* There is no no-result pattern, so try patterns with a result.  */
7936       target = NULL_RTX;
7937     }
7938
7939   /* Try the __atomic version.  */
7940   result = maybe_emit_op (&optab, target, mem, val, true, model, after);
7941   if (result)
7942     return result;
7943
7944   /* Try the older __sync version.  */
7945   result = maybe_emit_op (&optab, target, mem, val, false, model, after);
7946   if (result)
7947     return result;
7948
7949   /* If the fetch value can be calculated from the other variation of fetch,
7950      try that operation.  */
7951   if (after || unused_result || optab.reverse_code != UNKNOWN)
7952     {
7953       /* Try the __atomic version, then the older __sync version.  */
7954       result = maybe_emit_op (&optab, target, mem, val, true, model, !after);
7955       if (!result)
7956         result = maybe_emit_op (&optab, target, mem, val, false, model, !after);
7957
7958       if (result)
7959         {
7960           /* If the result isn't used, no need to do compensation code.  */
7961           if (unused_result)
7962             return result;
7963
7964           /* Issue compensation code.  Fetch_after  == fetch_before OP val.
7965              Fetch_before == after REVERSE_OP val.  */
7966           if (!after)
7967             code = optab.reverse_code;
7968           if (code == NOT)
7969             {
7970               result = expand_simple_binop (mode, AND, result, val, NULL_RTX,
7971                                             true, OPTAB_LIB_WIDEN);
7972               result = expand_simple_unop (mode, NOT, result, target, true);
7973             }
7974           else
7975             result = expand_simple_binop (mode, code, result, val, target,
7976                                           true, OPTAB_LIB_WIDEN);
7977           return result;
7978         }
7979     }
7980
7981   /* No direct opcode can be generated.  */
7982   return NULL_RTX;
7983 }
7984
7985
7986
7987 /* This function expands an atomic fetch_OP or OP_fetch operation:
7988    TARGET is an option place to stick the return value.  const0_rtx indicates
7989    the result is unused.
7990    atomically fetch MEM, perform the operation with VAL and return it to MEM.
7991    CODE is the operation being performed (OP)
7992    MEMMODEL is the memory model variant to use.
7993    AFTER is true to return the result of the operation (OP_fetch).
7994    AFTER is false to return the value before the operation (fetch_OP).  */
7995 rtx
7996 expand_atomic_fetch_op (rtx target, rtx mem, rtx val, enum rtx_code code,
7997                         enum memmodel model, bool after)
7998 {
7999   enum machine_mode mode = GET_MODE (mem);
8000   rtx result;
8001   bool unused_result = (target == const0_rtx);
8002
8003   result = expand_atomic_fetch_op_no_fallback (target, mem, val, code, model,
8004                                                after);
8005
8006   if (result)
8007     return result;
8008
8009   /* Add/sub can be implemented by doing the reverse operation with -(val).  */
8010   if (code == PLUS || code == MINUS)
8011     {
8012       rtx tmp;
8013       enum rtx_code reverse = (code == PLUS ? MINUS : PLUS);
8014
8015       start_sequence ();
8016       tmp = expand_simple_unop (mode, NEG, val, NULL_RTX, true);
8017       result = expand_atomic_fetch_op_no_fallback (target, mem, tmp, reverse,
8018                                                    model, after);
8019       if (result)
8020         {
8021           /* PLUS worked so emit the insns and return.  */
8022           tmp = get_insns ();
8023           end_sequence ();
8024           emit_insn (tmp);
8025           return result;
8026         }
8027
8028       /* PLUS did not work, so throw away the negation code and continue.  */
8029       end_sequence ();
8030     }
8031
8032   /* Try the __sync libcalls only if we can't do compare-and-swap inline.  */
8033   if (!can_compare_and_swap_p (mode, false))
8034     {
8035       rtx libfunc;
8036       bool fixup = false;
8037       enum rtx_code orig_code = code;
8038       struct atomic_op_functions optab;
8039
8040       get_atomic_op_for_code (&optab, code);
8041       libfunc = optab_libfunc (after ? optab.fetch_after
8042                                : optab.fetch_before, mode);
8043       if (libfunc == NULL
8044           && (after || unused_result || optab.reverse_code != UNKNOWN))
8045         {
8046           fixup = true;
8047           if (!after)
8048             code = optab.reverse_code;
8049           libfunc = optab_libfunc (after ? optab.fetch_before
8050                                    : optab.fetch_after, mode);
8051         }
8052       if (libfunc != NULL)
8053         {
8054           rtx addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
8055           result = emit_library_call_value (libfunc, NULL, LCT_NORMAL, mode,
8056                                             2, addr, ptr_mode, val, mode);
8057
8058           if (!unused_result && fixup)
8059             result = expand_simple_binop (mode, code, result, val, target,
8060                                           true, OPTAB_LIB_WIDEN);
8061           return result;
8062         }
8063
8064       /* We need the original code for any further attempts.  */
8065       code = orig_code;
8066     }
8067
8068   /* If nothing else has succeeded, default to a compare and swap loop.  */
8069   if (can_compare_and_swap_p (mode, true))
8070     {
8071       rtx insn;
8072       rtx t0 = gen_reg_rtx (mode), t1;
8073
8074       start_sequence ();
8075
8076       /* If the result is used, get a register for it.  */
8077       if (!unused_result)
8078         {
8079           if (!target || !register_operand (target, mode))
8080             target = gen_reg_rtx (mode);
8081           /* If fetch_before, copy the value now.  */
8082           if (!after)
8083             emit_move_insn (target, t0);
8084         }
8085       else
8086         target = const0_rtx;
8087
8088       t1 = t0;
8089       if (code == NOT)
8090         {
8091           t1 = expand_simple_binop (mode, AND, t1, val, NULL_RTX,
8092                                     true, OPTAB_LIB_WIDEN);
8093           t1 = expand_simple_unop (mode, code, t1, NULL_RTX, true);
8094         }
8095       else
8096         t1 = expand_simple_binop (mode, code, t1, val, NULL_RTX, true,
8097                                   OPTAB_LIB_WIDEN);
8098
8099       /* For after, copy the value now.  */
8100       if (!unused_result && after)
8101         emit_move_insn (target, t1);
8102       insn = get_insns ();
8103       end_sequence ();
8104
8105       if (t1 != NULL && expand_compare_and_swap_loop (mem, t0, t1, insn))
8106         return target;
8107     }
8108
8109   return NULL_RTX;
8110 }
8111 \f
8112 /* Return true if OPERAND is suitable for operand number OPNO of
8113    instruction ICODE.  */
8114
8115 bool
8116 insn_operand_matches (enum insn_code icode, unsigned int opno, rtx operand)
8117 {
8118   return (!insn_data[(int) icode].operand[opno].predicate
8119           || (insn_data[(int) icode].operand[opno].predicate
8120               (operand, insn_data[(int) icode].operand[opno].mode)));
8121 }
8122 \f
8123 /* TARGET is a target of a multiword operation that we are going to
8124    implement as a series of word-mode operations.  Return true if
8125    TARGET is suitable for this purpose.  */
8126
8127 bool
8128 valid_multiword_target_p (rtx target)
8129 {
8130   enum machine_mode mode;
8131   int i;
8132
8133   mode = GET_MODE (target);
8134   for (i = 0; i < GET_MODE_SIZE (mode); i += UNITS_PER_WORD)
8135     if (!validate_subreg (word_mode, mode, target, i))
8136       return false;
8137   return true;
8138 }
8139
8140 /* Like maybe_legitimize_operand, but do not change the code of the
8141    current rtx value.  */
8142
8143 static bool
8144 maybe_legitimize_operand_same_code (enum insn_code icode, unsigned int opno,
8145                                     struct expand_operand *op)
8146 {
8147   /* See if the operand matches in its current form.  */
8148   if (insn_operand_matches (icode, opno, op->value))
8149     return true;
8150
8151   /* If the operand is a memory whose address has no side effects,
8152      try forcing the address into a non-virtual pseudo register.
8153      The check for side effects is important because copy_to_mode_reg
8154      cannot handle things like auto-modified addresses.  */
8155   if (insn_data[(int) icode].operand[opno].allows_mem && MEM_P (op->value))
8156     {
8157       rtx addr, mem;
8158
8159       mem = op->value;
8160       addr = XEXP (mem, 0);
8161       if (!(REG_P (addr) && REGNO (addr) > LAST_VIRTUAL_REGISTER)
8162           && !side_effects_p (addr))
8163         {
8164           rtx last;
8165           enum machine_mode mode;
8166
8167           last = get_last_insn ();
8168           mode = get_address_mode (mem);
8169           mem = replace_equiv_address (mem, copy_to_mode_reg (mode, addr));
8170           if (insn_operand_matches (icode, opno, mem))
8171             {
8172               op->value = mem;
8173               return true;
8174             }
8175           delete_insns_since (last);
8176         }
8177     }
8178
8179   return false;
8180 }
8181
8182 /* Try to make OP match operand OPNO of instruction ICODE.  Return true
8183    on success, storing the new operand value back in OP.  */
8184
8185 static bool
8186 maybe_legitimize_operand (enum insn_code icode, unsigned int opno,
8187                           struct expand_operand *op)
8188 {
8189   enum machine_mode mode, imode;
8190   bool old_volatile_ok, result;
8191
8192   mode = op->mode;
8193   switch (op->type)
8194     {
8195     case EXPAND_FIXED:
8196       old_volatile_ok = volatile_ok;
8197       volatile_ok = true;
8198       result = maybe_legitimize_operand_same_code (icode, opno, op);
8199       volatile_ok = old_volatile_ok;
8200       return result;
8201
8202     case EXPAND_OUTPUT:
8203       gcc_assert (mode != VOIDmode);
8204       if (op->value
8205           && op->value != const0_rtx
8206           && GET_MODE (op->value) == mode
8207           && maybe_legitimize_operand_same_code (icode, opno, op))
8208         return true;
8209
8210       op->value = gen_reg_rtx (mode);
8211       break;
8212
8213     case EXPAND_INPUT:
8214     input:
8215       gcc_assert (mode != VOIDmode);
8216       gcc_assert (GET_MODE (op->value) == VOIDmode
8217                   || GET_MODE (op->value) == mode);
8218       if (maybe_legitimize_operand_same_code (icode, opno, op))
8219         return true;
8220
8221       op->value = copy_to_mode_reg (mode, op->value);
8222       break;
8223
8224     case EXPAND_CONVERT_TO:
8225       gcc_assert (mode != VOIDmode);
8226       op->value = convert_to_mode (mode, op->value, op->unsigned_p);
8227       goto input;
8228
8229     case EXPAND_CONVERT_FROM:
8230       if (GET_MODE (op->value) != VOIDmode)
8231         mode = GET_MODE (op->value);
8232       else
8233         /* The caller must tell us what mode this value has.  */
8234         gcc_assert (mode != VOIDmode);
8235
8236       imode = insn_data[(int) icode].operand[opno].mode;
8237       if (imode != VOIDmode && imode != mode)
8238         {
8239           op->value = convert_modes (imode, mode, op->value, op->unsigned_p);
8240           mode = imode;
8241         }
8242       goto input;
8243
8244     case EXPAND_ADDRESS:
8245       gcc_assert (mode != VOIDmode);
8246       op->value = convert_memory_address (mode, op->value);
8247       goto input;
8248
8249     case EXPAND_INTEGER:
8250       mode = insn_data[(int) icode].operand[opno].mode;
8251       if (mode != VOIDmode && const_int_operand (op->value, mode))
8252         goto input;
8253       break;
8254     }
8255   return insn_operand_matches (icode, opno, op->value);
8256 }
8257
8258 /* Make OP describe an input operand that should have the same value
8259    as VALUE, after any mode conversion that the target might request.
8260    TYPE is the type of VALUE.  */
8261
8262 void
8263 create_convert_operand_from_type (struct expand_operand *op,
8264                                   rtx value, tree type)
8265 {
8266   create_convert_operand_from (op, value, TYPE_MODE (type),
8267                                TYPE_UNSIGNED (type));
8268 }
8269
8270 /* Try to make operands [OPS, OPS + NOPS) match operands [OPNO, OPNO + NOPS)
8271    of instruction ICODE.  Return true on success, leaving the new operand
8272    values in the OPS themselves.  Emit no code on failure.  */
8273
8274 bool
8275 maybe_legitimize_operands (enum insn_code icode, unsigned int opno,
8276                            unsigned int nops, struct expand_operand *ops)
8277 {
8278   rtx last;
8279   unsigned int i;
8280
8281   last = get_last_insn ();
8282   for (i = 0; i < nops; i++)
8283     if (!maybe_legitimize_operand (icode, opno + i, &ops[i]))
8284       {
8285         delete_insns_since (last);
8286         return false;
8287       }
8288   return true;
8289 }
8290
8291 /* Try to generate instruction ICODE, using operands [OPS, OPS + NOPS)
8292    as its operands.  Return the instruction pattern on success,
8293    and emit any necessary set-up code.  Return null and emit no
8294    code on failure.  */
8295
8296 rtx
8297 maybe_gen_insn (enum insn_code icode, unsigned int nops,
8298                 struct expand_operand *ops)
8299 {
8300   gcc_assert (nops == (unsigned int) insn_data[(int) icode].n_generator_args);
8301   if (!maybe_legitimize_operands (icode, 0, nops, ops))
8302     return NULL_RTX;
8303
8304   switch (nops)
8305     {
8306     case 1:
8307       return GEN_FCN (icode) (ops[0].value);
8308     case 2:
8309       return GEN_FCN (icode) (ops[0].value, ops[1].value);
8310     case 3:
8311       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value);
8312     case 4:
8313       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8314                               ops[3].value);
8315     case 5:
8316       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8317                               ops[3].value, ops[4].value);
8318     case 6:
8319       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8320                               ops[3].value, ops[4].value, ops[5].value);
8321     case 7:
8322       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8323                               ops[3].value, ops[4].value, ops[5].value,
8324                               ops[6].value);
8325     case 8:
8326       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8327                               ops[3].value, ops[4].value, ops[5].value,
8328                               ops[6].value, ops[7].value);
8329     case 9:
8330       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8331                               ops[3].value, ops[4].value, ops[5].value,
8332                               ops[6].value, ops[7].value, ops[8].value);
8333     }
8334   gcc_unreachable ();
8335 }
8336
8337 /* Try to emit instruction ICODE, using operands [OPS, OPS + NOPS)
8338    as its operands.  Return true on success and emit no code on failure.  */
8339
8340 bool
8341 maybe_expand_insn (enum insn_code icode, unsigned int nops,
8342                    struct expand_operand *ops)
8343 {
8344   rtx pat = maybe_gen_insn (icode, nops, ops);
8345   if (pat)
8346     {
8347       emit_insn (pat);
8348       return true;
8349     }
8350   return false;
8351 }
8352
8353 /* Like maybe_expand_insn, but for jumps.  */
8354
8355 bool
8356 maybe_expand_jump_insn (enum insn_code icode, unsigned int nops,
8357                         struct expand_operand *ops)
8358 {
8359   rtx pat = maybe_gen_insn (icode, nops, ops);
8360   if (pat)
8361     {
8362       emit_jump_insn (pat);
8363       return true;
8364     }
8365   return false;
8366 }
8367
8368 /* Emit instruction ICODE, using operands [OPS, OPS + NOPS)
8369    as its operands.  */
8370
8371 void
8372 expand_insn (enum insn_code icode, unsigned int nops,
8373              struct expand_operand *ops)
8374 {
8375   if (!maybe_expand_insn (icode, nops, ops))
8376     gcc_unreachable ();
8377 }
8378
8379 /* Like expand_insn, but for jumps.  */
8380
8381 void
8382 expand_jump_insn (enum insn_code icode, unsigned int nops,
8383                   struct expand_operand *ops)
8384 {
8385   if (!maybe_expand_jump_insn (icode, nops, ops))
8386     gcc_unreachable ();
8387 }
8388
8389 /* Reduce conditional compilation elsewhere.  */
8390 #ifndef HAVE_insv
8391 #define HAVE_insv       0
8392 #define CODE_FOR_insv   CODE_FOR_nothing
8393 #endif
8394 #ifndef HAVE_extv
8395 #define HAVE_extv       0
8396 #define CODE_FOR_extv   CODE_FOR_nothing
8397 #endif
8398 #ifndef HAVE_extzv
8399 #define HAVE_extzv      0
8400 #define CODE_FOR_extzv  CODE_FOR_nothing
8401 #endif
8402
8403 /* Enumerates the possible types of structure operand to an
8404    extraction_insn.  */
8405 enum extraction_type { ET_unaligned_mem, ET_reg };
8406
8407 /* Check whether insv, extv or extzv pattern ICODE can be used for an
8408    insertion or extraction of type TYPE on a structure of mode MODE.
8409    Return true if so and fill in *INSN accordingly.  STRUCT_OP is the
8410    operand number of the structure (the first sign_extract or zero_extract
8411    operand) and FIELD_OP is the operand number of the field (the other
8412    side of the set from the sign_extract or zero_extract).  */
8413
8414 static bool
8415 get_traditional_extraction_insn (extraction_insn *insn,
8416                                  enum extraction_type type,
8417                                  enum machine_mode mode,
8418                                  enum insn_code icode,
8419                                  int struct_op, int field_op)
8420 {
8421   const struct insn_data_d *data = &insn_data[icode];
8422
8423   enum machine_mode struct_mode = data->operand[struct_op].mode;
8424   if (struct_mode == VOIDmode)
8425     struct_mode = word_mode;
8426   if (mode != struct_mode)
8427     return false;
8428
8429   enum machine_mode field_mode = data->operand[field_op].mode;
8430   if (field_mode == VOIDmode)
8431     field_mode = word_mode;
8432
8433   enum machine_mode pos_mode = data->operand[struct_op + 2].mode;
8434   if (pos_mode == VOIDmode)
8435     pos_mode = word_mode;
8436
8437   insn->icode = icode;
8438   insn->field_mode = field_mode;
8439   insn->struct_mode = (type == ET_unaligned_mem ? byte_mode : struct_mode);
8440   insn->pos_mode = pos_mode;
8441   return true;
8442 }
8443
8444 /* Return true if an optab exists to perform an insertion or extraction
8445    of type TYPE in mode MODE.  Describe the instruction in *INSN if so.
8446
8447    REG_OPTAB is the optab to use for register structures and
8448    MISALIGN_OPTAB is the optab to use for misaligned memory structures.
8449    POS_OP is the operand number of the bit position.  */
8450
8451 static bool
8452 get_optab_extraction_insn (struct extraction_insn *insn,
8453                            enum extraction_type type,
8454                            enum machine_mode mode, direct_optab reg_optab,
8455                            direct_optab misalign_optab, int pos_op)
8456 {
8457   direct_optab optab = (type == ET_unaligned_mem ? misalign_optab : reg_optab);
8458   enum insn_code icode = direct_optab_handler (optab, mode);
8459   if (icode == CODE_FOR_nothing)
8460     return false;
8461
8462   const struct insn_data_d *data = &insn_data[icode];
8463
8464   insn->icode = icode;
8465   insn->field_mode = mode;
8466   insn->struct_mode = (type == ET_unaligned_mem ? BLKmode : mode);
8467   insn->pos_mode = data->operand[pos_op].mode;
8468   if (insn->pos_mode == VOIDmode)
8469     insn->pos_mode = word_mode;
8470   return true;
8471 }
8472
8473 /* Return true if an instruction exists to perform an insertion or
8474    extraction (PATTERN says which) of type TYPE in mode MODE.
8475    Describe the instruction in *INSN if so.  */
8476
8477 static bool
8478 get_extraction_insn (extraction_insn *insn,
8479                      enum extraction_pattern pattern,
8480                      enum extraction_type type,
8481                      enum machine_mode mode)
8482 {
8483   switch (pattern)
8484     {
8485     case EP_insv:
8486       if (HAVE_insv
8487           && get_traditional_extraction_insn (insn, type, mode,
8488                                               CODE_FOR_insv, 0, 3))
8489         return true;
8490       return get_optab_extraction_insn (insn, type, mode, insv_optab,
8491                                         insvmisalign_optab, 2);
8492
8493     case EP_extv:
8494       if (HAVE_extv
8495           && get_traditional_extraction_insn (insn, type, mode,
8496                                               CODE_FOR_extv, 1, 0))
8497         return true;
8498       return get_optab_extraction_insn (insn, type, mode, extv_optab,
8499                                         extvmisalign_optab, 3);
8500
8501     case EP_extzv:
8502       if (HAVE_extzv
8503           && get_traditional_extraction_insn (insn, type, mode,
8504                                               CODE_FOR_extzv, 1, 0))
8505         return true;
8506       return get_optab_extraction_insn (insn, type, mode, extzv_optab,
8507                                         extzvmisalign_optab, 3);
8508
8509     default:
8510       gcc_unreachable ();
8511     }
8512 }
8513
8514 /* Return true if an instruction exists to access a field of mode
8515    FIELDMODE in a structure that has STRUCT_BITS significant bits.
8516    Describe the "best" such instruction in *INSN if so.  PATTERN and
8517    TYPE describe the type of insertion or extraction we want to perform.
8518
8519    For an insertion, the number of significant structure bits includes
8520    all bits of the target.  For an extraction, it need only include the
8521    most significant bit of the field.  Larger widths are acceptable
8522    in both cases.  */
8523
8524 static bool
8525 get_best_extraction_insn (extraction_insn *insn,
8526                           enum extraction_pattern pattern,
8527                           enum extraction_type type,
8528                           unsigned HOST_WIDE_INT struct_bits,
8529                           enum machine_mode field_mode)
8530 {
8531   enum machine_mode mode = smallest_mode_for_size (struct_bits, MODE_INT);
8532   while (mode != VOIDmode)
8533     {
8534       if (get_extraction_insn (insn, pattern, type, mode))
8535         {
8536           while (mode != VOIDmode
8537                  && GET_MODE_SIZE (mode) <= GET_MODE_SIZE (field_mode)
8538                  && !TRULY_NOOP_TRUNCATION_MODES_P (insn->field_mode,
8539                                                     field_mode))
8540             {
8541               get_extraction_insn (insn, pattern, type, mode);
8542               mode = GET_MODE_WIDER_MODE (mode);
8543             }
8544           return true;
8545         }
8546       mode = GET_MODE_WIDER_MODE (mode);
8547     }
8548   return false;
8549 }
8550
8551 /* Return true if an instruction exists to access a field of mode
8552    FIELDMODE in a register structure that has STRUCT_BITS significant bits.
8553    Describe the "best" such instruction in *INSN if so.  PATTERN describes
8554    the type of insertion or extraction we want to perform.
8555
8556    For an insertion, the number of significant structure bits includes
8557    all bits of the target.  For an extraction, it need only include the
8558    most significant bit of the field.  Larger widths are acceptable
8559    in both cases.  */
8560
8561 bool
8562 get_best_reg_extraction_insn (extraction_insn *insn,
8563                               enum extraction_pattern pattern,
8564                               unsigned HOST_WIDE_INT struct_bits,
8565                               enum machine_mode field_mode)
8566 {
8567   return get_best_extraction_insn (insn, pattern, ET_reg, struct_bits,
8568                                    field_mode);
8569 }
8570
8571 /* Return true if an instruction exists to access a field of BITSIZE
8572    bits starting BITNUM bits into a memory structure.  Describe the
8573    "best" such instruction in *INSN if so.  PATTERN describes the type
8574    of insertion or extraction we want to perform and FIELDMODE is the
8575    natural mode of the extracted field.
8576
8577    The instructions considered here only access bytes that overlap
8578    the bitfield; they do not touch any surrounding bytes.  */
8579
8580 bool
8581 get_best_mem_extraction_insn (extraction_insn *insn,
8582                               enum extraction_pattern pattern,
8583                               HOST_WIDE_INT bitsize, HOST_WIDE_INT bitnum,
8584                               enum machine_mode field_mode)
8585 {
8586   unsigned HOST_WIDE_INT struct_bits = (bitnum % BITS_PER_UNIT
8587                                         + bitsize
8588                                         + BITS_PER_UNIT - 1);
8589   struct_bits -= struct_bits % BITS_PER_UNIT;
8590   return get_best_extraction_insn (insn, pattern, ET_unaligned_mem,
8591                                    struct_bits, field_mode);
8592 }
8593
8594 #include "gt-optabs.h"