gcc/optabs.c

   1 /* Expand the basic unary and binary arithmetic operations, for GNU compiler.
   2    Copyright (C) 1987-2014 Free Software Foundation, Inc.
   3
   4 This file is part of GCC.
   5
   6 GCC is free software; you can redistribute it and/or modify it under
   7 the terms of the GNU General Public License as published by the Free
   8 Software Foundation; either version 3, or (at your option) any later
   9 version.
  10
  11 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  13 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  14 for more details.
  15
  16 You should have received a copy of the GNU General Public License
  17 along with GCC; see the file COPYING3.  If not see
  18 <http://www.gnu.org/licenses/>.  */
  19
  20
  21 #include "config.h"
  22 #include "system.h"
  23 #include "coretypes.h"
  24 #include "tm.h"
  25 #include "diagnostic-core.h"
  26
  27 /* Include insn-config.h before expr.h so that HAVE_conditional_move
  28    is properly defined.  */
  29 #include "insn-config.h"
  30 #include "rtl.h"
  31 #include "tree.h"
  32 #include "tree-hasher.h"
  33 #include "stor-layout.h"
  34 #include "stringpool.h"
  35 #include "varasm.h"
  36 #include "tm_p.h"
  37 #include "flags.h"
  38 #include "function.h"
  39 #include "except.h"
  40 #include "expr.h"
  41 #include "optabs.h"
  42 #include "libfuncs.h"
  43 #include "recog.h"
  44 #include "reload.h"
  45 #include "ggc.h"
  46 #include "basic-block.h"
  47 #include "target.h"
  48
  49 struct target_optabs default_target_optabs;
  50 struct target_libfuncs default_target_libfuncs;
  51 struct target_optabs *this_fn_optabs = &default_target_optabs;
  52 #if SWITCHABLE_TARGET
  53 struct target_optabs *this_target_optabs = &default_target_optabs;
  54 struct target_libfuncs *this_target_libfuncs = &default_target_libfuncs;
  55 #endif
  56
  57 #define libfunc_hash \
  58   (this_target_libfuncs->x_libfunc_hash)
  59
  60 static void prepare_float_lib_cmp (rtx, rtx, enum rtx_code, rtx *,
  61                                    enum machine_mode *);
  62 static rtx expand_unop_direct (enum machine_mode, optab, rtx, rtx, int);
  63 static void emit_libcall_block_1 (rtx_insn *, rtx, rtx, rtx, bool);
  64
  65 /* Debug facility for use in GDB.  */
  66 void debug_optab_libfuncs (void);
  67
  68 /* Prefixes for the current version of decimal floating point (BID vs. DPD) */
  69 #if ENABLE_DECIMAL_BID_FORMAT
  70 #define DECIMAL_PREFIX "bid_"
  71 #else
  72 #define DECIMAL_PREFIX "dpd_"
  73 #endif
  74 \f
  75 /* Used for libfunc_hash.  */
  76
  77 hashval_t
  78 libfunc_hasher::hash (libfunc_entry *e)
  79 {
  80   return ((e->mode1 + e->mode2 * NUM_MACHINE_MODES) ^ e->op);
  81 }
  82
  83 /* Used for libfunc_hash.  */
  84
  85 bool
  86 libfunc_hasher::equal (libfunc_entry *e1, libfunc_entry *e2)
  87 {
  88   return e1->op == e2->op && e1->mode1 == e2->mode1 && e1->mode2 == e2->mode2;
  89 }
  90
  91 /* Return libfunc corresponding operation defined by OPTAB converting
  92    from MODE2 to MODE1.  Trigger lazy initialization if needed, return NULL
  93    if no libfunc is available.  */
  94 rtx
  95 convert_optab_libfunc (convert_optab optab, enum machine_mode mode1,
  96                        enum machine_mode mode2)
  97 {
  98   struct libfunc_entry e;
  99   struct libfunc_entry **slot;
 100
 101   /* ??? This ought to be an assert, but not all of the places
 102      that we expand optabs know about the optabs that got moved
 103      to being direct.  */
 104   if (!(optab >= FIRST_CONV_OPTAB && optab <= LAST_CONVLIB_OPTAB))
 105     return NULL_RTX;
 106
 107   e.op = optab;
 108   e.mode1 = mode1;
 109   e.mode2 = mode2;
 110   slot = libfunc_hash->find_slot (&e, NO_INSERT);
 111   if (!slot)
 112     {
 113       const struct convert_optab_libcall_d *d
 114         = &convlib_def[optab - FIRST_CONV_OPTAB];
 115
 116       if (d->libcall_gen == NULL)
 117         return NULL;
 118
 119       d->libcall_gen (optab, d->libcall_basename, mode1, mode2);
 120       slot = libfunc_hash->find_slot (&e, NO_INSERT);
 121       if (!slot)
 122         return NULL;
 123     }
 124   return (*slot)->libfunc;
 125 }
 126
 127 /* Return libfunc corresponding operation defined by OPTAB in MODE.
 128    Trigger lazy initialization if needed, return NULL if no libfunc is
 129    available.  */
 130 rtx
 131 optab_libfunc (optab optab, enum machine_mode mode)
 132 {
 133   struct libfunc_entry e;
 134   struct libfunc_entry **slot;
 135
 136   /* ??? This ought to be an assert, but not all of the places
 137      that we expand optabs know about the optabs that got moved
 138      to being direct.  */
 139   if (!(optab >= FIRST_NORM_OPTAB && optab <= LAST_NORMLIB_OPTAB))
 140     return NULL_RTX;
 141
 142   e.op = optab;
 143   e.mode1 = mode;
 144   e.mode2 = VOIDmode;
 145   slot = libfunc_hash->find_slot (&e, NO_INSERT);
 146   if (!slot)
 147     {
 148       const struct optab_libcall_d *d
 149         = &normlib_def[optab - FIRST_NORM_OPTAB];
 150
 151       if (d->libcall_gen == NULL)
 152         return NULL;
 153
 154       d->libcall_gen (optab, d->libcall_basename, d->libcall_suffix, mode);
 155       slot = libfunc_hash->find_slot (&e, NO_INSERT);
 156       if (!slot)
 157         return NULL;
 158     }
 159   return (*slot)->libfunc;
 160 }
 161
 162 \f
 163 /* Add a REG_EQUAL note to the last insn in INSNS.  TARGET is being set to
 164    the result of operation CODE applied to OP0 (and OP1 if it is a binary
 165    operation).
 166
 167    If the last insn does not set TARGET, don't do anything, but return 1.
 168
 169    If the last insn or a previous insn sets TARGET and TARGET is one of OP0
 170    or OP1, don't add the REG_EQUAL note but return 0.  Our caller can then
 171    try again, ensuring that TARGET is not one of the operands.  */
 172
 173 static int
 174 add_equal_note (rtx_insn *insns, rtx target, enum rtx_code code, rtx op0, rtx op1)
 175 {
 176   rtx_insn *last_insn;
 177   rtx set;
 178   rtx note;
 179
 180   gcc_assert (insns && INSN_P (insns) && NEXT_INSN (insns));
 181
 182   if (GET_RTX_CLASS (code) != RTX_COMM_ARITH
 183       && GET_RTX_CLASS (code) != RTX_BIN_ARITH
 184       && GET_RTX_CLASS (code) != RTX_COMM_COMPARE
 185       && GET_RTX_CLASS (code) != RTX_COMPARE
 186       && GET_RTX_CLASS (code) != RTX_UNARY)
 187     return 1;
 188
 189   if (GET_CODE (target) == ZERO_EXTRACT)
 190     return 1;
 191
 192   for (last_insn = insns;
 193        NEXT_INSN (last_insn) != NULL_RTX;
 194        last_insn = NEXT_INSN (last_insn))
 195     ;
 196
 197   /* If TARGET is in OP0 or OP1, punt.  We'd end up with a note referencing
 198      a value changing in the insn, so the note would be invalid for CSE.  */
 199   if (reg_overlap_mentioned_p (target, op0)
 200       || (op1 && reg_overlap_mentioned_p (target, op1)))
 201     {
 202       if (MEM_P (target)
 203           && (rtx_equal_p (target, op0)
 204               || (op1 && rtx_equal_p (target, op1))))
 205         {
 206           /* For MEM target, with MEM = MEM op X, prefer no REG_EQUAL note
 207              over expanding it as temp = MEM op X, MEM = temp.  If the target
 208              supports MEM = MEM op X instructions, it is sometimes too hard
 209              to reconstruct that form later, especially if X is also a memory,
 210              and due to multiple occurrences of addresses the address might
 211              be forced into register unnecessarily.
 212              Note that not emitting the REG_EQUIV note might inhibit
 213              CSE in some cases.  */
 214           set = single_set (last_insn);
 215           if (set
 216               && GET_CODE (SET_SRC (set)) == code
 217               && MEM_P (SET_DEST (set))
 218               && (rtx_equal_p (SET_DEST (set), XEXP (SET_SRC (set), 0))
 219                   || (op1 && rtx_equal_p (SET_DEST (set),
 220                                           XEXP (SET_SRC (set), 1)))))
 221             return 1;
 222         }
 223       return 0;
 224     }
 225
 226   set = set_for_reg_notes (last_insn);
 227   if (set == NULL_RTX)
 228     return 1;
 229
 230   if (! rtx_equal_p (SET_DEST (set), target)
 231       /* For a STRICT_LOW_PART, the REG_NOTE applies to what is inside it.  */
 232       && (GET_CODE (SET_DEST (set)) != STRICT_LOW_PART
 233           || ! rtx_equal_p (XEXP (SET_DEST (set), 0), target)))
 234     return 1;
 235
 236   if (GET_RTX_CLASS (code) == RTX_UNARY)
 237     switch (code)
 238       {
 239       case FFS:
 240       case CLZ:
 241       case CTZ:
 242       case CLRSB:
 243       case POPCOUNT:
 244       case PARITY:
 245       case BSWAP:
 246         if (GET_MODE (op0) != VOIDmode && GET_MODE (target) != GET_MODE (op0))
 247           {
 248             note = gen_rtx_fmt_e (code, GET_MODE (op0), copy_rtx (op0));
 249             if (GET_MODE_SIZE (GET_MODE (op0))
 250                 > GET_MODE_SIZE (GET_MODE (target)))
 251               note = simplify_gen_unary (TRUNCATE, GET_MODE (target),
 252                                          note, GET_MODE (op0));
 253             else
 254               note = simplify_gen_unary (ZERO_EXTEND, GET_MODE (target),
 255                                          note, GET_MODE (op0));
 256             break;
 257           }
 258         /* FALLTHRU */
 259       default:
 260         note = gen_rtx_fmt_e (code, GET_MODE (target), copy_rtx (op0));
 261         break;
 262       }
 263   else
 264     note = gen_rtx_fmt_ee (code, GET_MODE (target), copy_rtx (op0), copy_rtx (op1));
 265
 266   set_unique_reg_note (last_insn, REG_EQUAL, note);
 267
 268   return 1;
 269 }
 270 \f
 271 /* Given two input operands, OP0 and OP1, determine what the correct from_mode
 272    for a widening operation would be.  In most cases this would be OP0, but if
 273    that's a constant it'll be VOIDmode, which isn't useful.  */
 274
 275 static enum machine_mode
 276 widened_mode (enum machine_mode to_mode, rtx op0, rtx op1)
 277 {
 278   enum machine_mode m0 = GET_MODE (op0);
 279   enum machine_mode m1 = GET_MODE (op1);
 280   enum machine_mode result;
 281
 282   if (m0 == VOIDmode && m1 == VOIDmode)
 283     return to_mode;
 284   else if (m0 == VOIDmode || GET_MODE_SIZE (m0) < GET_MODE_SIZE (m1))
 285     result = m1;
 286   else
 287     result = m0;
 288
 289   if (GET_MODE_SIZE (result) > GET_MODE_SIZE (to_mode))
 290     return to_mode;
 291
 292   return result;
 293 }
 294 \f
 295 /* Like optab_handler, but for widening_operations that have a
 296    TO_MODE and a FROM_MODE.  */
 297
 298 enum insn_code
 299 widening_optab_handler (optab op, enum machine_mode to_mode,
 300                         enum machine_mode from_mode)
 301 {
 302   unsigned scode = (op << 16) | to_mode;
 303   if (to_mode != from_mode && from_mode != VOIDmode)
 304     {
 305       /* ??? Why does find_widening_optab_handler_and_mode attempt to
 306          widen things that can't be widened?  E.g. add_optab... */
 307       if (op > LAST_CONV_OPTAB)
 308         return CODE_FOR_nothing;
 309       scode |= from_mode << 8;
 310     }
 311   return raw_optab_handler (scode);
 312 }
 313
 314 /* Find a widening optab even if it doesn't widen as much as we want.
 315    E.g. if from_mode is HImode, and to_mode is DImode, and there is no
 316    direct HI->SI insn, then return SI->DI, if that exists.
 317    If PERMIT_NON_WIDENING is non-zero then this can be used with
 318    non-widening optabs also.  */
 319
 320 enum insn_code
 321 find_widening_optab_handler_and_mode (optab op, enum machine_mode to_mode,
 322                                       enum machine_mode from_mode,
 323                                       int permit_non_widening,
 324                                       enum machine_mode *found_mode)
 325 {
 326   for (; (permit_non_widening || from_mode != to_mode)
 327          && GET_MODE_SIZE (from_mode) <= GET_MODE_SIZE (to_mode)
 328          && from_mode != VOIDmode;
 329        from_mode = GET_MODE_WIDER_MODE (from_mode))
 330     {
 331       enum insn_code handler = widening_optab_handler (op, to_mode,
 332                                                        from_mode);
 333
 334       if (handler != CODE_FOR_nothing)
 335         {
 336           if (found_mode)
 337             *found_mode = from_mode;
 338           return handler;
 339         }
 340     }
 341
 342   return CODE_FOR_nothing;
 343 }
 344 \f
 345 /* Widen OP to MODE and return the rtx for the widened operand.  UNSIGNEDP
 346    says whether OP is signed or unsigned.  NO_EXTEND is nonzero if we need
 347    not actually do a sign-extend or zero-extend, but can leave the
 348    higher-order bits of the result rtx undefined, for example, in the case
 349    of logical operations, but not right shifts.  */
 350
 351 static rtx
 352 widen_operand (rtx op, enum machine_mode mode, enum machine_mode oldmode,
 353                int unsignedp, int no_extend)
 354 {
 355   rtx result;
 356
 357   /* If we don't have to extend and this is a constant, return it.  */
 358   if (no_extend && GET_MODE (op) == VOIDmode)
 359     return op;
 360
 361   /* If we must extend do so.  If OP is a SUBREG for a promoted object, also
 362      extend since it will be more efficient to do so unless the signedness of
 363      a promoted object differs from our extension.  */
 364   if (! no_extend
 365       || (GET_CODE (op) == SUBREG && SUBREG_PROMOTED_VAR_P (op)
 366           && SUBREG_CHECK_PROMOTED_SIGN (op, unsignedp)))
 367     return convert_modes (mode, oldmode, op, unsignedp);
 368
 369   /* If MODE is no wider than a single word, we return a lowpart or paradoxical
 370      SUBREG.  */
 371   if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
 372     return gen_lowpart (mode, force_reg (GET_MODE (op), op));
 373
 374   /* Otherwise, get an object of MODE, clobber it, and set the low-order
 375      part to OP.  */
 376
 377   result = gen_reg_rtx (mode);
 378   emit_clobber (result);
 379   emit_move_insn (gen_lowpart (GET_MODE (op), result), op);
 380   return result;
 381 }
 382 \f
 383 /* Return the optab used for computing the operation given by the tree code,
 384    CODE and the tree EXP.  This function is not always usable (for example, it
 385    cannot give complete results for multiplication or division) but probably
 386    ought to be relied on more widely throughout the expander.  */
 387 optab
 388 optab_for_tree_code (enum tree_code code, const_tree type,
 389                      enum optab_subtype subtype)
 390 {
 391   bool trapv;
 392   switch (code)
 393     {
 394     case BIT_AND_EXPR:
 395       return and_optab;
 396
 397     case BIT_IOR_EXPR:
 398       return ior_optab;
 399
 400     case BIT_NOT_EXPR:
 401       return one_cmpl_optab;
 402
 403     case BIT_XOR_EXPR:
 404       return xor_optab;
 405
 406     case MULT_HIGHPART_EXPR:
 407       return TYPE_UNSIGNED (type) ? umul_highpart_optab : smul_highpart_optab;
 408
 409     case TRUNC_MOD_EXPR:
 410     case CEIL_MOD_EXPR:
 411     case FLOOR_MOD_EXPR:
 412     case ROUND_MOD_EXPR:
 413       return TYPE_UNSIGNED (type) ? umod_optab : smod_optab;
 414
 415     case RDIV_EXPR:
 416     case TRUNC_DIV_EXPR:
 417     case CEIL_DIV_EXPR:
 418     case FLOOR_DIV_EXPR:
 419     case ROUND_DIV_EXPR:
 420     case EXACT_DIV_EXPR:
 421       if (TYPE_SATURATING (type))
 422         return TYPE_UNSIGNED (type) ? usdiv_optab : ssdiv_optab;
 423       return TYPE_UNSIGNED (type) ? udiv_optab : sdiv_optab;
 424
 425     case LSHIFT_EXPR:
 426       if (TREE_CODE (type) == VECTOR_TYPE)
 427         {
 428           if (subtype == optab_vector)
 429             return TYPE_SATURATING (type) ? unknown_optab : vashl_optab;
 430
 431           gcc_assert (subtype == optab_scalar);
 432         }
 433       if (TYPE_SATURATING (type))
 434         return TYPE_UNSIGNED (type) ? usashl_optab : ssashl_optab;
 435       return ashl_optab;
 436
 437     case RSHIFT_EXPR:
 438       if (TREE_CODE (type) == VECTOR_TYPE)
 439         {
 440           if (subtype == optab_vector)
 441             return TYPE_UNSIGNED (type) ? vlshr_optab : vashr_optab;
 442
 443           gcc_assert (subtype == optab_scalar);
 444         }
 445       return TYPE_UNSIGNED (type) ? lshr_optab : ashr_optab;
 446
 447     case LROTATE_EXPR:
 448       if (TREE_CODE (type) == VECTOR_TYPE)
 449         {
 450           if (subtype == optab_vector)
 451             return vrotl_optab;
 452
 453           gcc_assert (subtype == optab_scalar);
 454         }
 455       return rotl_optab;
 456
 457     case RROTATE_EXPR:
 458       if (TREE_CODE (type) == VECTOR_TYPE)
 459         {
 460           if (subtype == optab_vector)
 461             return vrotr_optab;
 462
 463           gcc_assert (subtype == optab_scalar);
 464         }
 465       return rotr_optab;
 466
 467     case MAX_EXPR:
 468       return TYPE_UNSIGNED (type) ? umax_optab : smax_optab;
 469
 470     case MIN_EXPR:
 471       return TYPE_UNSIGNED (type) ? umin_optab : smin_optab;
 472
 473     case REALIGN_LOAD_EXPR:
 474       return vec_realign_load_optab;
 475
 476     case WIDEN_SUM_EXPR:
 477       return TYPE_UNSIGNED (type) ? usum_widen_optab : ssum_widen_optab;
 478
 479     case DOT_PROD_EXPR:
 480       return TYPE_UNSIGNED (type) ? udot_prod_optab : sdot_prod_optab;
 481
 482     case SAD_EXPR:
 483       return TYPE_UNSIGNED (type) ? usad_optab : ssad_optab;
 484
 485     case WIDEN_MULT_PLUS_EXPR:
 486       return (TYPE_UNSIGNED (type)
 487               ? (TYPE_SATURATING (type)
 488                  ? usmadd_widen_optab : umadd_widen_optab)
 489               : (TYPE_SATURATING (type)
 490                  ? ssmadd_widen_optab : smadd_widen_optab));
 491
 492     case WIDEN_MULT_MINUS_EXPR:
 493       return (TYPE_UNSIGNED (type)
 494               ? (TYPE_SATURATING (type)
 495                  ? usmsub_widen_optab : umsub_widen_optab)
 496               : (TYPE_SATURATING (type)
 497                  ? ssmsub_widen_optab : smsub_widen_optab));
 498
 499     case FMA_EXPR:
 500       return fma_optab;
 501
 502     case REDUC_MAX_EXPR:
 503       return TYPE_UNSIGNED (type) ? reduc_umax_optab : reduc_smax_optab;
 504
 505     case REDUC_MIN_EXPR:
 506       return TYPE_UNSIGNED (type) ? reduc_umin_optab : reduc_smin_optab;
 507
 508     case REDUC_PLUS_EXPR:
 509       return TYPE_UNSIGNED (type) ? reduc_uplus_optab : reduc_splus_optab;
 510
 511     case VEC_LSHIFT_EXPR:
 512       return vec_shl_optab;
 513
 514     case VEC_RSHIFT_EXPR:
 515       return vec_shr_optab;
 516
 517     case VEC_WIDEN_MULT_HI_EXPR:
 518       return TYPE_UNSIGNED (type) ?
 519         vec_widen_umult_hi_optab : vec_widen_smult_hi_optab;
 520
 521     case VEC_WIDEN_MULT_LO_EXPR:
 522       return TYPE_UNSIGNED (type) ?
 523         vec_widen_umult_lo_optab : vec_widen_smult_lo_optab;
 524
 525     case VEC_WIDEN_MULT_EVEN_EXPR:
 526       return TYPE_UNSIGNED (type) ?
 527         vec_widen_umult_even_optab : vec_widen_smult_even_optab;
 528
 529     case VEC_WIDEN_MULT_ODD_EXPR:
 530       return TYPE_UNSIGNED (type) ?
 531         vec_widen_umult_odd_optab : vec_widen_smult_odd_optab;
 532
 533     case VEC_WIDEN_LSHIFT_HI_EXPR:
 534       return TYPE_UNSIGNED (type) ?
 535         vec_widen_ushiftl_hi_optab : vec_widen_sshiftl_hi_optab;
 536
 537     case VEC_WIDEN_LSHIFT_LO_EXPR:
 538       return TYPE_UNSIGNED (type) ?
 539         vec_widen_ushiftl_lo_optab : vec_widen_sshiftl_lo_optab;
 540
 541     case VEC_UNPACK_HI_EXPR:
 542       return TYPE_UNSIGNED (type) ?
 543         vec_unpacku_hi_optab : vec_unpacks_hi_optab;
 544
 545     case VEC_UNPACK_LO_EXPR:
 546       return TYPE_UNSIGNED (type) ?
 547         vec_unpacku_lo_optab : vec_unpacks_lo_optab;
 548
 549     case VEC_UNPACK_FLOAT_HI_EXPR:
 550       /* The signedness is determined from input operand.  */
 551       return TYPE_UNSIGNED (type) ?
 552         vec_unpacku_float_hi_optab : vec_unpacks_float_hi_optab;
 553
 554     case VEC_UNPACK_FLOAT_LO_EXPR:
 555       /* The signedness is determined from input operand.  */
 556       return TYPE_UNSIGNED (type) ?
 557         vec_unpacku_float_lo_optab : vec_unpacks_float_lo_optab;
 558
 559     case VEC_PACK_TRUNC_EXPR:
 560       return vec_pack_trunc_optab;
 561
 562     case VEC_PACK_SAT_EXPR:
 563       return TYPE_UNSIGNED (type) ? vec_pack_usat_optab : vec_pack_ssat_optab;
 564
 565     case VEC_PACK_FIX_TRUNC_EXPR:
 566       /* The signedness is determined from output operand.  */
 567       return TYPE_UNSIGNED (type) ?
 568         vec_pack_ufix_trunc_optab : vec_pack_sfix_trunc_optab;
 569
 570     default:
 571       break;
 572     }
 573
 574   trapv = INTEGRAL_TYPE_P (type) && TYPE_OVERFLOW_TRAPS (type);
 575   switch (code)
 576     {
 577     case POINTER_PLUS_EXPR:
 578     case PLUS_EXPR:
 579       if (TYPE_SATURATING (type))
 580         return TYPE_UNSIGNED (type) ? usadd_optab : ssadd_optab;
 581       return trapv ? addv_optab : add_optab;
 582
 583     case MINUS_EXPR:
 584       if (TYPE_SATURATING (type))
 585         return TYPE_UNSIGNED (type) ? ussub_optab : sssub_optab;
 586       return trapv ? subv_optab : sub_optab;
 587
 588     case MULT_EXPR:
 589       if (TYPE_SATURATING (type))
 590         return TYPE_UNSIGNED (type) ? usmul_optab : ssmul_optab;
 591       return trapv ? smulv_optab : smul_optab;
 592
 593     case NEGATE_EXPR:
 594       if (TYPE_SATURATING (type))
 595         return TYPE_UNSIGNED (type) ? usneg_optab : ssneg_optab;
 596       return trapv ? negv_optab : neg_optab;
 597
 598     case ABS_EXPR:
 599       return trapv ? absv_optab : abs_optab;
 600
 601     default:
 602       return unknown_optab;
 603     }
 604 }
 605 \f
 606
 607 /* Expand vector widening operations.
 608
 609    There are two different classes of operations handled here:
 610    1) Operations whose result is wider than all the arguments to the operation.
 611       Examples: VEC_UNPACK_HI/LO_EXPR, VEC_WIDEN_MULT_HI/LO_EXPR
 612       In this case OP0 and optionally OP1 would be initialized,
 613       but WIDE_OP wouldn't (not relevant for this case).
 614    2) Operations whose result is of the same size as the last argument to the
 615       operation, but wider than all the other arguments to the operation.
 616       Examples: WIDEN_SUM_EXPR, VEC_DOT_PROD_EXPR.
 617       In the case WIDE_OP, OP0 and optionally OP1 would be initialized.
 618
 619    E.g, when called to expand the following operations, this is how
 620    the arguments will be initialized:
 621                                 nops    OP0     OP1     WIDE_OP
 622    widening-sum                 2       oprnd0  -       oprnd1
 623    widening-dot-product         3       oprnd0  oprnd1  oprnd2
 624    widening-mult                2       oprnd0  oprnd1  -
 625    type-promotion (vec-unpack)  1       oprnd0  -       -  */
 626
 627 rtx
 628 expand_widen_pattern_expr (sepops ops, rtx op0, rtx op1, rtx wide_op,
 629                            rtx target, int unsignedp)
 630 {
 631   struct expand_operand eops[4];
 632   tree oprnd0, oprnd1, oprnd2;
 633   enum machine_mode wmode = VOIDmode, tmode0, tmode1 = VOIDmode;
 634   optab widen_pattern_optab;
 635   enum insn_code icode;
 636   int nops = TREE_CODE_LENGTH (ops->code);
 637   int op;
 638
 639   oprnd0 = ops->op0;
 640   tmode0 = TYPE_MODE (TREE_TYPE (oprnd0));
 641   widen_pattern_optab =
 642     optab_for_tree_code (ops->code, TREE_TYPE (oprnd0), optab_default);
 643   if (ops->code == WIDEN_MULT_PLUS_EXPR
 644       || ops->code == WIDEN_MULT_MINUS_EXPR)
 645     icode = find_widening_optab_handler (widen_pattern_optab,
 646                                          TYPE_MODE (TREE_TYPE (ops->op2)),
 647                                          tmode0, 0);
 648   else
 649     icode = optab_handler (widen_pattern_optab, tmode0);
 650   gcc_assert (icode != CODE_FOR_nothing);
 651
 652   if (nops >= 2)
 653     {
 654       oprnd1 = ops->op1;
 655       tmode1 = TYPE_MODE (TREE_TYPE (oprnd1));
 656     }
 657
 658   /* The last operand is of a wider mode than the rest of the operands.  */
 659   if (nops == 2)
 660     wmode = tmode1;
 661   else if (nops == 3)
 662     {
 663       gcc_assert (tmode1 == tmode0);
 664       gcc_assert (op1);
 665       oprnd2 = ops->op2;
 666       wmode = TYPE_MODE (TREE_TYPE (oprnd2));
 667     }
 668
 669   op = 0;
 670   create_output_operand (&eops[op++], target, TYPE_MODE (ops->type));
 671   create_convert_operand_from (&eops[op++], op0, tmode0, unsignedp);
 672   if (op1)
 673     create_convert_operand_from (&eops[op++], op1, tmode1, unsignedp);
 674   if (wide_op)
 675     create_convert_operand_from (&eops[op++], wide_op, wmode, unsignedp);
 676   expand_insn (icode, op, eops);
 677   return eops[0].value;
 678 }
 679
 680 /* Generate code to perform an operation specified by TERNARY_OPTAB
 681    on operands OP0, OP1 and OP2, with result having machine-mode MODE.
 682
 683    UNSIGNEDP is for the case where we have to widen the operands
 684    to perform the operation.  It says to use zero-extension.
 685
 686    If TARGET is nonzero, the value
 687    is generated there, if it is convenient to do so.
 688    In all cases an rtx is returned for the locus of the value;
 689    this may or may not be TARGET.  */
 690
 691 rtx
 692 expand_ternary_op (enum machine_mode mode, optab ternary_optab, rtx op0,
 693                    rtx op1, rtx op2, rtx target, int unsignedp)
 694 {
 695   struct expand_operand ops[4];
 696   enum insn_code icode = optab_handler (ternary_optab, mode);
 697
 698   gcc_assert (optab_handler (ternary_optab, mode) != CODE_FOR_nothing);
 699
 700   create_output_operand (&ops[0], target, mode);
 701   create_convert_operand_from (&ops[1], op0, mode, unsignedp);
 702   create_convert_operand_from (&ops[2], op1, mode, unsignedp);
 703   create_convert_operand_from (&ops[3], op2, mode, unsignedp);
 704   expand_insn (icode, 4, ops);
 705   return ops[0].value;
 706 }
 707
 708
 709 /* Like expand_binop, but return a constant rtx if the result can be
 710    calculated at compile time.  The arguments and return value are
 711    otherwise the same as for expand_binop.  */
 712
 713 rtx
 714 simplify_expand_binop (enum machine_mode mode, optab binoptab,
 715                        rtx op0, rtx op1, rtx target, int unsignedp,
 716                        enum optab_methods methods)
 717 {
 718   if (CONSTANT_P (op0) && CONSTANT_P (op1))
 719     {
 720       rtx x = simplify_binary_operation (optab_to_code (binoptab),
 721                                          mode, op0, op1);
 722       if (x)
 723         return x;
 724     }
 725
 726   return expand_binop (mode, binoptab, op0, op1, target, unsignedp, methods);
 727 }
 728
 729 /* Like simplify_expand_binop, but always put the result in TARGET.
 730    Return true if the expansion succeeded.  */
 731
 732 bool
 733 force_expand_binop (enum machine_mode mode, optab binoptab,
 734                     rtx op0, rtx op1, rtx target, int unsignedp,
 735                     enum optab_methods methods)
 736 {
 737   rtx x = simplify_expand_binop (mode, binoptab, op0, op1,
 738                                  target, unsignedp, methods);
 739   if (x == 0)
 740     return false;
 741   if (x != target)
 742     emit_move_insn (target, x);
 743   return true;
 744 }
 745
 746 /* Generate insns for VEC_LSHIFT_EXPR, VEC_RSHIFT_EXPR.  */
 747
 748 rtx
 749 expand_vec_shift_expr (sepops ops, rtx target)
 750 {
 751   struct expand_operand eops[3];
 752   enum insn_code icode;
 753   rtx rtx_op1, rtx_op2;
 754   enum machine_mode mode = TYPE_MODE (ops->type);
 755   tree vec_oprnd = ops->op0;
 756   tree shift_oprnd = ops->op1;
 757   optab shift_optab;
 758
 759   switch (ops->code)
 760     {
 761       case VEC_RSHIFT_EXPR:
 762         shift_optab = vec_shr_optab;
 763         break;
 764       case VEC_LSHIFT_EXPR:
 765         shift_optab = vec_shl_optab;
 766         break;
 767       default:
 768         gcc_unreachable ();
 769     }
 770
 771   icode = optab_handler (shift_optab, mode);
 772   gcc_assert (icode != CODE_FOR_nothing);
 773
 774   rtx_op1 = expand_normal (vec_oprnd);
 775   rtx_op2 = expand_normal (shift_oprnd);
 776
 777   create_output_operand (&eops[0], target, mode);
 778   create_input_operand (&eops[1], rtx_op1, GET_MODE (rtx_op1));
 779   create_convert_operand_from_type (&eops[2], rtx_op2, TREE_TYPE (shift_oprnd));
 780   expand_insn (icode, 3, eops);
 781
 782   return eops[0].value;
 783 }
 784
 785 /* Create a new vector value in VMODE with all elements set to OP.  The
 786    mode of OP must be the element mode of VMODE.  If OP is a constant,
 787    then the return value will be a constant.  */
 788
 789 static rtx
 790 expand_vector_broadcast (enum machine_mode vmode, rtx op)
 791 {
 792   enum insn_code icode;
 793   rtvec vec;
 794   rtx ret;
 795   int i, n;
 796
 797   gcc_checking_assert (VECTOR_MODE_P (vmode));
 798
 799   n = GET_MODE_NUNITS (vmode);
 800   vec = rtvec_alloc (n);
 801   for (i = 0; i < n; ++i)
 802     RTVEC_ELT (vec, i) = op;
 803
 804   if (CONSTANT_P (op))
 805     return gen_rtx_CONST_VECTOR (vmode, vec);
 806
 807   /* ??? If the target doesn't have a vec_init, then we have no easy way
 808      of performing this operation.  Most of this sort of generic support
 809      is hidden away in the vector lowering support in gimple.  */
 810   icode = optab_handler (vec_init_optab, vmode);
 811   if (icode == CODE_FOR_nothing)
 812     return NULL;
 813
 814   ret = gen_reg_rtx (vmode);
 815   emit_insn (GEN_FCN (icode) (ret, gen_rtx_PARALLEL (vmode, vec)));
 816
 817   return ret;
 818 }
 819
 820 /* This subroutine of expand_doubleword_shift handles the cases in which
 821    the effective shift value is >= BITS_PER_WORD.  The arguments and return
 822    value are the same as for the parent routine, except that SUPERWORD_OP1
 823    is the shift count to use when shifting OUTOF_INPUT into INTO_TARGET.
 824    INTO_TARGET may be null if the caller has decided to calculate it.  */
 825
 826 static bool
 827 expand_superword_shift (optab binoptab, rtx outof_input, rtx superword_op1,
 828                         rtx outof_target, rtx into_target,
 829                         int unsignedp, enum optab_methods methods)
 830 {
 831   if (into_target != 0)
 832     if (!force_expand_binop (word_mode, binoptab, outof_input, superword_op1,
 833                              into_target, unsignedp, methods))
 834       return false;
 835
 836   if (outof_target != 0)
 837     {
 838       /* For a signed right shift, we must fill OUTOF_TARGET with copies
 839          of the sign bit, otherwise we must fill it with zeros.  */
 840       if (binoptab != ashr_optab)
 841         emit_move_insn (outof_target, CONST0_RTX (word_mode));
 842       else
 843         if (!force_expand_binop (word_mode, binoptab,
 844                                  outof_input, GEN_INT (BITS_PER_WORD - 1),
 845                                  outof_target, unsignedp, methods))
 846           return false;
 847     }
 848   return true;
 849 }
 850
 851 /* This subroutine of expand_doubleword_shift handles the cases in which
 852    the effective shift value is < BITS_PER_WORD.  The arguments and return
 853    value are the same as for the parent routine.  */
 854
 855 static bool
 856 expand_subword_shift (enum machine_mode op1_mode, optab binoptab,
 857                       rtx outof_input, rtx into_input, rtx op1,
 858                       rtx outof_target, rtx into_target,
 859                       int unsignedp, enum optab_methods methods,
 860                       unsigned HOST_WIDE_INT shift_mask)
 861 {
 862   optab reverse_unsigned_shift, unsigned_shift;
 863   rtx tmp, carries;
 864
 865   reverse_unsigned_shift = (binoptab == ashl_optab ? lshr_optab : ashl_optab);
 866   unsigned_shift = (binoptab == ashl_optab ? ashl_optab : lshr_optab);
 867
 868   /* The low OP1 bits of INTO_TARGET come from the high bits of OUTOF_INPUT.
 869      We therefore need to shift OUTOF_INPUT by (BITS_PER_WORD - OP1) bits in
 870      the opposite direction to BINOPTAB.  */
 871   if (CONSTANT_P (op1) || shift_mask >= BITS_PER_WORD)
 872     {
 873       carries = outof_input;
 874       tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD,
 875                                             op1_mode), op1_mode);
 876       tmp = simplify_expand_binop (op1_mode, sub_optab, tmp, op1,
 877                                    0, true, methods);
 878     }
 879   else
 880     {
 881       /* We must avoid shifting by BITS_PER_WORD bits since that is either
 882          the same as a zero shift (if shift_mask == BITS_PER_WORD - 1) or
 883          has unknown behavior.  Do a single shift first, then shift by the
 884          remainder.  It's OK to use ~OP1 as the remainder if shift counts
 885          are truncated to the mode size.  */
 886       carries = expand_binop (word_mode, reverse_unsigned_shift,
 887                               outof_input, const1_rtx, 0, unsignedp, methods);
 888       if (shift_mask == BITS_PER_WORD - 1)
 889         {
 890           tmp = immed_wide_int_const
 891             (wi::minus_one (GET_MODE_PRECISION (op1_mode)), op1_mode);
 892           tmp = simplify_expand_binop (op1_mode, xor_optab, op1, tmp,
 893                                        0, true, methods);
 894         }
 895       else
 896         {
 897           tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD - 1,
 898                                                 op1_mode), op1_mode);
 899           tmp = simplify_expand_binop (op1_mode, sub_optab, tmp, op1,
 900                                        0, true, methods);
 901         }
 902     }
 903   if (tmp == 0 || carries == 0)
 904     return false;
 905   carries = expand_binop (word_mode, reverse_unsigned_shift,
 906                           carries, tmp, 0, unsignedp, methods);
 907   if (carries == 0)
 908     return false;
 909
 910   /* Shift INTO_INPUT logically by OP1.  This is the last use of INTO_INPUT
 911      so the result can go directly into INTO_TARGET if convenient.  */
 912   tmp = expand_binop (word_mode, unsigned_shift, into_input, op1,
 913                       into_target, unsignedp, methods);
 914   if (tmp == 0)
 915     return false;
 916
 917   /* Now OR in the bits carried over from OUTOF_INPUT.  */
 918   if (!force_expand_binop (word_mode, ior_optab, tmp, carries,
 919                            into_target, unsignedp, methods))
 920     return false;
 921
 922   /* Use a standard word_mode shift for the out-of half.  */
 923   if (outof_target != 0)
 924     if (!force_expand_binop (word_mode, binoptab, outof_input, op1,
 925                              outof_target, unsignedp, methods))
 926       return false;
 927
 928   return true;
 929 }
 930
 931
 932 #ifdef HAVE_conditional_move
 933 /* Try implementing expand_doubleword_shift using conditional moves.
 934    The shift is by < BITS_PER_WORD if (CMP_CODE CMP1 CMP2) is true,
 935    otherwise it is by >= BITS_PER_WORD.  SUBWORD_OP1 and SUPERWORD_OP1
 936    are the shift counts to use in the former and latter case.  All other
 937    arguments are the same as the parent routine.  */
 938
 939 static bool
 940 expand_doubleword_shift_condmove (enum machine_mode op1_mode, optab binoptab,
 941                                   enum rtx_code cmp_code, rtx cmp1, rtx cmp2,
 942                                   rtx outof_input, rtx into_input,
 943                                   rtx subword_op1, rtx superword_op1,
 944                                   rtx outof_target, rtx into_target,
 945                                   int unsignedp, enum optab_methods methods,
 946                                   unsigned HOST_WIDE_INT shift_mask)
 947 {
 948   rtx outof_superword, into_superword;
 949
 950   /* Put the superword version of the output into OUTOF_SUPERWORD and
 951      INTO_SUPERWORD.  */
 952   outof_superword = outof_target != 0 ? gen_reg_rtx (word_mode) : 0;
 953   if (outof_target != 0 && subword_op1 == superword_op1)
 954     {
 955       /* The value INTO_TARGET >> SUBWORD_OP1, which we later store in
 956          OUTOF_TARGET, is the same as the value of INTO_SUPERWORD.  */
 957       into_superword = outof_target;
 958       if (!expand_superword_shift (binoptab, outof_input, superword_op1,
 959                                    outof_superword, 0, unsignedp, methods))
 960         return false;
 961     }
 962   else
 963     {
 964       into_superword = gen_reg_rtx (word_mode);
 965       if (!expand_superword_shift (binoptab, outof_input, superword_op1,
 966                                    outof_superword, into_superword,
 967                                    unsignedp, methods))
 968         return false;
 969     }
 970
 971   /* Put the subword version directly in OUTOF_TARGET and INTO_TARGET.  */
 972   if (!expand_subword_shift (op1_mode, binoptab,
 973                              outof_input, into_input, subword_op1,
 974                              outof_target, into_target,
 975                              unsignedp, methods, shift_mask))
 976     return false;
 977
 978   /* Select between them.  Do the INTO half first because INTO_SUPERWORD
 979      might be the current value of OUTOF_TARGET.  */
 980   if (!emit_conditional_move (into_target, cmp_code, cmp1, cmp2, op1_mode,
 981                               into_target, into_superword, word_mode, false))
 982     return false;
 983
 984   if (outof_target != 0)
 985     if (!emit_conditional_move (outof_target, cmp_code, cmp1, cmp2, op1_mode,
 986                                 outof_target, outof_superword,
 987                                 word_mode, false))
 988       return false;
 989
 990   return true;
 991 }
 992 #endif
 993
 994 /* Expand a doubleword shift (ashl, ashr or lshr) using word-mode shifts.
 995    OUTOF_INPUT and INTO_INPUT are the two word-sized halves of the first
 996    input operand; the shift moves bits in the direction OUTOF_INPUT->
 997    INTO_TARGET.  OUTOF_TARGET and INTO_TARGET are the equivalent words
 998    of the target.  OP1 is the shift count and OP1_MODE is its mode.
 999    If OP1 is constant, it will have been truncated as appropriate
1000    and is known to be nonzero.
1001
1002    If SHIFT_MASK is zero, the result of word shifts is undefined when the
1003    shift count is outside the range [0, BITS_PER_WORD).  This routine must
1004    avoid generating such shifts for OP1s in the range [0, BITS_PER_WORD * 2).
1005
1006    If SHIFT_MASK is nonzero, all word-mode shift counts are effectively
1007    masked by it and shifts in the range [BITS_PER_WORD, SHIFT_MASK) will
1008    fill with zeros or sign bits as appropriate.
1009
1010    If SHIFT_MASK is BITS_PER_WORD - 1, this routine will synthesize
1011    a doubleword shift whose equivalent mask is BITS_PER_WORD * 2 - 1.
1012    Doing this preserves semantics required by SHIFT_COUNT_TRUNCATED.
   In all other cases, shifts by values outside [0, BITS_PER_WORD * 2)
   are undefined.
1015
1016    BINOPTAB, UNSIGNEDP and METHODS are as for expand_binop.  This function
1017    may not use INTO_INPUT after modifying INTO_TARGET, and similarly for
1018    OUTOF_INPUT and OUTOF_TARGET.  OUTOF_TARGET can be null if the parent
1019    function wants to calculate it itself.
1020
1021    Return true if the shift could be successfully synthesized.  */
1022
1023 static bool
1024 expand_doubleword_shift (enum machine_mode op1_mode, optab binoptab,
1025                          rtx outof_input, rtx into_input, rtx op1,
1026                          rtx outof_target, rtx into_target,
1027                          int unsignedp, enum optab_methods methods,
1028                          unsigned HOST_WIDE_INT shift_mask)
1029 {
1030   rtx superword_op1, tmp, cmp1, cmp2;
1031   enum rtx_code cmp_code;
1032
1033   /* See if word-mode shifts by BITS_PER_WORD...BITS_PER_WORD * 2 - 1 will
1034      fill the result with sign or zero bits as appropriate.  If so, the value
1035      of OUTOF_TARGET will always be (SHIFT OUTOF_INPUT OP1).   Recursively call
1036      this routine to calculate INTO_TARGET (which depends on both OUTOF_INPUT
1037      and INTO_INPUT), then emit code to set up OUTOF_TARGET.
1038
1039      This isn't worthwhile for constant shifts since the optimizers will
1040      cope better with in-range shift counts.  */
1041   if (shift_mask >= BITS_PER_WORD
1042       && outof_target != 0
1043       && !CONSTANT_P (op1))
1044     {
1045       if (!expand_doubleword_shift (op1_mode, binoptab,
1046                                     outof_input, into_input, op1,
1047                                     0, into_target,
1048                                     unsignedp, methods, shift_mask))
1049         return false;
1050       if (!force_expand_binop (word_mode, binoptab, outof_input, op1,
1051                                outof_target, unsignedp, methods))
1052         return false;
1053       return true;
1054     }
1055
1056   /* Set CMP_CODE, CMP1 and CMP2 so that the rtx (CMP_CODE CMP1 CMP2)
1057      is true when the effective shift value is less than BITS_PER_WORD.
1058      Set SUPERWORD_OP1 to the shift count that should be used to shift
1059      OUTOF_INPUT into INTO_TARGET when the condition is false.  */
1060   tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD, op1_mode), op1_mode);
1061   if (!CONSTANT_P (op1) && shift_mask == BITS_PER_WORD - 1)
1062     {
1063       /* Set CMP1 to OP1 & BITS_PER_WORD.  The result is zero iff OP1
1064          is a subword shift count.  */
1065       cmp1 = simplify_expand_binop (op1_mode, and_optab, op1, tmp,
1066                                     0, true, methods);
1067       cmp2 = CONST0_RTX (op1_mode);
1068       cmp_code = EQ;
1069       superword_op1 = op1;
1070     }
1071   else
1072     {
1073       /* Set CMP1 to OP1 - BITS_PER_WORD.  */
1074       cmp1 = simplify_expand_binop (op1_mode, sub_optab, op1, tmp,
1075                                     0, true, methods);
1076       cmp2 = CONST0_RTX (op1_mode);
1077       cmp_code = LT;
1078       superword_op1 = cmp1;
1079     }
1080   if (cmp1 == 0)
1081     return false;
1082
1083   /* If we can compute the condition at compile time, pick the
1084      appropriate subroutine.  */
1085   tmp = simplify_relational_operation (cmp_code, SImode, op1_mode, cmp1, cmp2);
1086   if (tmp != 0 && CONST_INT_P (tmp))
1087     {
1088       if (tmp == const0_rtx)
1089         return expand_superword_shift (binoptab, outof_input, superword_op1,
1090                                        outof_target, into_target,
1091                                        unsignedp, methods);
1092       else
1093         return expand_subword_shift (op1_mode, binoptab,
1094                                      outof_input, into_input, op1,
1095                                      outof_target, into_target,
1096                                      unsignedp, methods, shift_mask);
1097     }
1098
1099 #ifdef HAVE_conditional_move
1100   /* Try using conditional moves to generate straight-line code.  */
1101   {
1102     rtx_insn *start = get_last_insn ();
1103     if (expand_doubleword_shift_condmove (op1_mode, binoptab,
1104                                           cmp_code, cmp1, cmp2,
1105                                           outof_input, into_input,
1106                                           op1, superword_op1,
1107                                           outof_target, into_target,
1108                                           unsignedp, methods, shift_mask))
1109       return true;
1110     delete_insns_since (start);
1111   }
1112 #endif
1113
1114   /* As a last resort, use branches to select the correct alternative.  */
1115   rtx_code_label *subword_label = gen_label_rtx ();
1116   rtx_code_label *done_label = gen_label_rtx ();
1117
1118   NO_DEFER_POP;
1119   do_compare_rtx_and_jump (cmp1, cmp2, cmp_code, false, op1_mode,
1120                            0, 0, subword_label, -1);
1121   OK_DEFER_POP;
1122
1123   if (!expand_superword_shift (binoptab, outof_input, superword_op1,
1124                                outof_target, into_target,
1125                                unsignedp, methods))
1126     return false;
1127
1128   emit_jump_insn (gen_jump (done_label));
1129   emit_barrier ();
1130   emit_label (subword_label);
1131
1132   if (!expand_subword_shift (op1_mode, binoptab,
1133                              outof_input, into_input, op1,
1134                              outof_target, into_target,
1135                              unsignedp, methods, shift_mask))
1136     return false;
1137
1138   emit_label (done_label);
1139   return true;
1140 }
1141 \f
1142 /* Subroutine of expand_binop.  Perform a double word multiplication of
1143    operands OP0 and OP1 both of mode MODE, which is exactly twice as wide
   as the target's word_mode.  This function returns NULL_RTX if anything
1145    goes wrong, in which case it may have already emitted instructions
1146    which need to be deleted.
1147
1148    If we want to multiply two two-word values and have normal and widening
1149    multiplies of single-word values, we can do this with three smaller
1150    multiplications.
1151
1152    The multiplication proceeds as follows:
1153                                  _______________________
1154                                 [__op0_high_|__op0_low__]
1155                                  _______________________
1156         *                       [__op1_high_|__op1_low__]
1157         _______________________________________________
1158                                  _______________________
1159     (1)                         [__op0_low__*__op1_low__]
1160                      _______________________
1161     (2a)            [__op0_low__*__op1_high_]
1162                      _______________________
1163     (2b)            [__op0_high_*__op1_low__]
1164          _______________________
1165     (3) [__op0_high_*__op1_high_]
1166
1167
1168   This gives a 4-word result.  Since we are only interested in the
1169   lower 2 words, partial result (3) and the upper words of (2a) and
1170   (2b) don't need to be calculated.  Hence (2a) and (2b) can be
1171   calculated using non-widening multiplication.
1172
1173   (1), however, needs to be calculated with an unsigned widening
1174   multiplication.  If this operation is not directly supported we
1175   try using a signed widening multiplication and adjust the result.
1176   This adjustment works as follows:
1177
1178       If both operands are positive then no adjustment is needed.
1179
1180       If the operands have different signs, for example op0_low < 0 and
1181       op1_low >= 0, the instruction treats the most significant bit of
1182       op0_low as a sign bit instead of a bit with significance
1183       2**(BITS_PER_WORD-1), i.e. the instruction multiplies op1_low
1184       with 2**BITS_PER_WORD - op0_low, and two's complements the
1185       result.  Conclusion: We need to add op1_low * 2**BITS_PER_WORD to
1186       the result.
1187
1188       Similarly, if both operands are negative, we need to add
1189       (op0_low + op1_low) * 2**BITS_PER_WORD.
1190
1191       We use a trick to adjust quickly.  We logically shift op0_low right
1192       (op1_low) BITS_PER_WORD-1 steps to get 0 or 1, and add this to
1193       op0_high (op1_high) before it is used to calculate 2b (2a).  If no
1194       logical shift exists, we do an arithmetic right shift and subtract
1195       the 0 or -1.  */
1196
1197 static rtx
1198 expand_doubleword_mult (enum machine_mode mode, rtx op0, rtx op1, rtx target,
1199                        bool umulp, enum optab_methods methods)
1200 {
1201   int low = (WORDS_BIG_ENDIAN ? 1 : 0);
1202   int high = (WORDS_BIG_ENDIAN ? 0 : 1);
1203   rtx wordm1 = umulp ? NULL_RTX : GEN_INT (BITS_PER_WORD - 1);
1204   rtx product, adjust, product_high, temp;
1205
1206   rtx op0_high = operand_subword_force (op0, high, mode);
1207   rtx op0_low = operand_subword_force (op0, low, mode);
1208   rtx op1_high = operand_subword_force (op1, high, mode);
1209   rtx op1_low = operand_subword_force (op1, low, mode);
1210
1211   /* If we're using an unsigned multiply to directly compute the product
1212      of the low-order words of the operands and perform any required
1213      adjustments of the operands, we begin by trying two more multiplications
1214      and then computing the appropriate sum.
1215
1216      We have checked above that the required addition is provided.
1217      Full-word addition will normally always succeed, especially if
1218      it is provided at all, so we don't worry about its failure.  The
1219      multiplication may well fail, however, so we do handle that.  */
1220
1221   if (!umulp)
1222     {
1223       /* ??? This could be done with emit_store_flag where available.  */
1224       temp = expand_binop (word_mode, lshr_optab, op0_low, wordm1,
1225                            NULL_RTX, 1, methods);
1226       if (temp)
1227         op0_high = expand_binop (word_mode, add_optab, op0_high, temp,
1228                                  NULL_RTX, 0, OPTAB_DIRECT);
1229       else
1230         {
1231           temp = expand_binop (word_mode, ashr_optab, op0_low, wordm1,
1232                                NULL_RTX, 0, methods);
1233           if (!temp)
1234             return NULL_RTX;
1235           op0_high = expand_binop (word_mode, sub_optab, op0_high, temp,
1236                                    NULL_RTX, 0, OPTAB_DIRECT);
1237         }
1238
1239       if (!op0_high)
1240         return NULL_RTX;
1241     }
1242
1243   adjust = expand_binop (word_mode, smul_optab, op0_high, op1_low,
1244                          NULL_RTX, 0, OPTAB_DIRECT);
1245   if (!adjust)
1246     return NULL_RTX;
1247
1248   /* OP0_HIGH should now be dead.  */
1249
1250   if (!umulp)
1251     {
1252       /* ??? This could be done with emit_store_flag where available.  */
1253       temp = expand_binop (word_mode, lshr_optab, op1_low, wordm1,
1254                            NULL_RTX, 1, methods);
1255       if (temp)
1256         op1_high = expand_binop (word_mode, add_optab, op1_high, temp,
1257                                  NULL_RTX, 0, OPTAB_DIRECT);
1258       else
1259         {
1260           temp = expand_binop (word_mode, ashr_optab, op1_low, wordm1,
1261                                NULL_RTX, 0, methods);
1262           if (!temp)
1263             return NULL_RTX;
1264           op1_high = expand_binop (word_mode, sub_optab, op1_high, temp,
1265                                    NULL_RTX, 0, OPTAB_DIRECT);
1266         }
1267
1268       if (!op1_high)
1269         return NULL_RTX;
1270     }
1271
1272   temp = expand_binop (word_mode, smul_optab, op1_high, op0_low,
1273                        NULL_RTX, 0, OPTAB_DIRECT);
1274   if (!temp)
1275     return NULL_RTX;
1276
1277   /* OP1_HIGH should now be dead.  */
1278
1279   adjust = expand_binop (word_mode, add_optab, adjust, temp,
1280                          NULL_RTX, 0, OPTAB_DIRECT);
1281
1282   if (target && !REG_P (target))
1283     target = NULL_RTX;
1284
1285   if (umulp)
1286     product = expand_binop (mode, umul_widen_optab, op0_low, op1_low,
1287                             target, 1, OPTAB_DIRECT);
1288   else
1289     product = expand_binop (mode, smul_widen_optab, op0_low, op1_low,
1290                             target, 1, OPTAB_DIRECT);
1291
1292   if (!product)
1293     return NULL_RTX;
1294
1295   product_high = operand_subword (product, high, 1, mode);
1296   adjust = expand_binop (word_mode, add_optab, product_high, adjust,
1297                          NULL_RTX, 0, OPTAB_DIRECT);
1298   emit_move_insn (product_high, adjust);
1299   return product;
1300 }
1301 \f
1302 /* Wrapper around expand_binop which takes an rtx code to specify
1303    the operation to perform, not an optab pointer.  All other
1304    arguments are the same.  */
1305 rtx
1306 expand_simple_binop (enum machine_mode mode, enum rtx_code code, rtx op0,
1307                      rtx op1, rtx target, int unsignedp,
1308                      enum optab_methods methods)
1309 {
1310   optab binop = code_to_optab (code);
1311   gcc_assert (binop);
1312
1313   return expand_binop (mode, binop, op0, op1, target, unsignedp, methods);
1314 }
1315
1316 /* Return whether OP0 and OP1 should be swapped when expanding a commutative
1317    binop.  Order them according to commutative_operand_precedence and, if
1318    possible, try to put TARGET or a pseudo first.  */
1319 static bool
1320 swap_commutative_operands_with_target (rtx target, rtx op0, rtx op1)
1321 {
1322   int op0_prec = commutative_operand_precedence (op0);
1323   int op1_prec = commutative_operand_precedence (op1);
1324
1325   if (op0_prec < op1_prec)
1326     return true;
1327
1328   if (op0_prec > op1_prec)
1329     return false;
1330
1331   /* With equal precedence, both orders are ok, but it is better if the
1332      first operand is TARGET, or if both TARGET and OP0 are pseudos.  */
1333   if (target == 0 || REG_P (target))
1334     return (REG_P (op1) && !REG_P (op0)) || target == op1;
1335   else
1336     return rtx_equal_p (op1, target);
1337 }
1338
1339 /* Return true if BINOPTAB implements a shift operation.  */
1340
1341 static bool
1342 shift_optab_p (optab binoptab)
1343 {
1344   switch (optab_to_code (binoptab))
1345     {
1346     case ASHIFT:
1347     case SS_ASHIFT:
1348     case US_ASHIFT:
1349     case ASHIFTRT:
1350     case LSHIFTRT:
1351     case ROTATE:
1352     case ROTATERT:
1353       return true;
1354
1355     default:
1356       return false;
1357     }
1358 }
1359
1360 /* Return true if BINOPTAB implements a commutative binary operation.  */
1361
1362 static bool
1363 commutative_optab_p (optab binoptab)
1364 {
1365   return (GET_RTX_CLASS (optab_to_code (binoptab)) == RTX_COMM_ARITH
1366           || binoptab == smul_widen_optab
1367           || binoptab == umul_widen_optab
1368           || binoptab == smul_highpart_optab
1369           || binoptab == umul_highpart_optab);
1370 }
1371
1372 /* X is to be used in mode MODE as operand OPN to BINOPTAB.  If we're
1373    optimizing, and if the operand is a constant that costs more than
1374    1 instruction, force the constant into a register and return that
1375    register.  Return X otherwise.  UNSIGNEDP says whether X is unsigned.  */
1376
1377 static rtx
1378 avoid_expensive_constant (enum machine_mode mode, optab binoptab,
1379                           int opn, rtx x, bool unsignedp)
1380 {
1381   bool speed = optimize_insn_for_speed_p ();
1382
1383   if (mode != VOIDmode
1384       && optimize
1385       && CONSTANT_P (x)
1386       && (rtx_cost (x, optab_to_code (binoptab), opn, speed)
1387           > set_src_cost (x, speed)))
1388     {
1389       if (CONST_INT_P (x))
1390         {
1391           HOST_WIDE_INT intval = trunc_int_for_mode (INTVAL (x), mode);
1392           if (intval != INTVAL (x))
1393             x = GEN_INT (intval);
1394         }
1395       else
1396         x = convert_modes (mode, VOIDmode, x, unsignedp);
1397       x = force_reg (mode, x);
1398     }
1399   return x;
1400 }
1401
1402 /* Helper function for expand_binop: handle the case where there
1403    is an insn that directly implements the indicated operation.
1404    Returns null if this is not possible.  */
1405 static rtx
1406 expand_binop_directly (enum machine_mode mode, optab binoptab,
1407                        rtx op0, rtx op1,
1408                        rtx target, int unsignedp, enum optab_methods methods,
1409                        rtx_insn *last)
1410 {
1411   enum machine_mode from_mode = widened_mode (mode, op0, op1);
1412   enum insn_code icode = find_widening_optab_handler (binoptab, mode,
1413                                                       from_mode, 1);
1414   enum machine_mode xmode0 = insn_data[(int) icode].operand[1].mode;
1415   enum machine_mode xmode1 = insn_data[(int) icode].operand[2].mode;
1416   enum machine_mode mode0, mode1, tmp_mode;
1417   struct expand_operand ops[3];
1418   bool commutative_p;
1419   rtx pat;
1420   rtx xop0 = op0, xop1 = op1;
1421   rtx swap;
1422
1423   /* If it is a commutative operator and the modes would match
1424      if we would swap the operands, we can save the conversions.  */
1425   commutative_p = commutative_optab_p (binoptab);
1426   if (commutative_p
1427       && GET_MODE (xop0) != xmode0 && GET_MODE (xop1) != xmode1
1428       && GET_MODE (xop0) == xmode1 && GET_MODE (xop1) == xmode1)
1429     {
1430       swap = xop0;
1431       xop0 = xop1;
1432       xop1 = swap;
1433     }
1434
1435   /* If we are optimizing, force expensive constants into a register.  */
1436   xop0 = avoid_expensive_constant (xmode0, binoptab, 0, xop0, unsignedp);
1437   if (!shift_optab_p (binoptab))
1438     xop1 = avoid_expensive_constant (xmode1, binoptab, 1, xop1, unsignedp);
1439
1440   /* In case the insn wants input operands in modes different from
1441      those of the actual operands, convert the operands.  It would
1442      seem that we don't need to convert CONST_INTs, but we do, so
1443      that they're properly zero-extended, sign-extended or truncated
1444      for their mode.  */
1445
1446   mode0 = GET_MODE (xop0) != VOIDmode ? GET_MODE (xop0) : mode;
1447   if (xmode0 != VOIDmode && xmode0 != mode0)
1448     {
1449       xop0 = convert_modes (xmode0, mode0, xop0, unsignedp);
1450       mode0 = xmode0;
1451     }
1452
1453   mode1 = GET_MODE (xop1) != VOIDmode ? GET_MODE (xop1) : mode;
1454   if (xmode1 != VOIDmode && xmode1 != mode1)
1455     {
1456       xop1 = convert_modes (xmode1, mode1, xop1, unsignedp);
1457       mode1 = xmode1;
1458     }
1459
1460   /* If operation is commutative,
1461      try to make the first operand a register.
1462      Even better, try to make it the same as the target.
1463      Also try to make the last operand a constant.  */
1464   if (commutative_p
1465       && swap_commutative_operands_with_target (target, xop0, xop1))
1466     {
1467       swap = xop1;
1468       xop1 = xop0;
1469       xop0 = swap;
1470     }
1471
1472   /* Now, if insn's predicates don't allow our operands, put them into
1473      pseudo regs.  */
1474
1475   if (binoptab == vec_pack_trunc_optab
1476       || binoptab == vec_pack_usat_optab
1477       || binoptab == vec_pack_ssat_optab
1478       || binoptab == vec_pack_ufix_trunc_optab
1479       || binoptab == vec_pack_sfix_trunc_optab)
1480     {
1481       /* The mode of the result is different then the mode of the
1482          arguments.  */
1483       tmp_mode = insn_data[(int) icode].operand[0].mode;
1484       if (GET_MODE_NUNITS (tmp_mode) != 2 * GET_MODE_NUNITS (mode))
1485         {
1486           delete_insns_since (last);
1487           return NULL_RTX;
1488         }
1489     }
1490   else
1491     tmp_mode = mode;
1492
1493   create_output_operand (&ops[0], target, tmp_mode);
1494   create_input_operand (&ops[1], xop0, mode0);
1495   create_input_operand (&ops[2], xop1, mode1);
1496   pat = maybe_gen_insn (icode, 3, ops);
1497   if (pat)
1498     {
1499       /* If PAT is composed of more than one insn, try to add an appropriate
1500          REG_EQUAL note to it.  If we can't because TEMP conflicts with an
1501          operand, call expand_binop again, this time without a target.  */
1502       if (INSN_P (pat) && NEXT_INSN (as_a <rtx_insn *> (pat)) != NULL_RTX
1503           && ! add_equal_note (as_a <rtx_insn *> (pat), ops[0].value,
1504                                optab_to_code (binoptab),
1505                                ops[1].value, ops[2].value))
1506         {
1507           delete_insns_since (last);
1508           return expand_binop (mode, binoptab, op0, op1, NULL_RTX,
1509                                unsignedp, methods);
1510         }
1511
1512       emit_insn (pat);
1513       return ops[0].value;
1514     }
1515   delete_insns_since (last);
1516   return NULL_RTX;
1517 }
1518
1519 /* Generate code to perform an operation specified by BINOPTAB
1520    on operands OP0 and OP1, with result having machine-mode MODE.
1521
1522    UNSIGNEDP is for the case where we have to widen the operands
1523    to perform the operation.  It says to use zero-extension.
1524
1525    If TARGET is nonzero, the value
1526    is generated there, if it is convenient to do so.
1527    In all cases an rtx is returned for the locus of the value;
1528    this may or may not be TARGET.  */
1529
1530 rtx
1531 expand_binop (enum machine_mode mode, optab binoptab, rtx op0, rtx op1,
1532               rtx target, int unsignedp, enum optab_methods methods)
1533 {
1534   enum optab_methods next_methods
1535     = (methods == OPTAB_LIB || methods == OPTAB_LIB_WIDEN
1536        ? OPTAB_WIDEN : methods);
1537   enum mode_class mclass;
1538   enum machine_mode wider_mode;
1539   rtx libfunc;
1540   rtx temp;
1541   rtx_insn *entry_last = get_last_insn ();
1542   rtx_insn *last;
1543
1544   mclass = GET_MODE_CLASS (mode);
1545
1546   /* If subtracting an integer constant, convert this into an addition of
1547      the negated constant.  */
1548
1549   if (binoptab == sub_optab && CONST_INT_P (op1))
1550     {
1551       op1 = negate_rtx (mode, op1);
1552       binoptab = add_optab;
1553     }
1554
1555   /* Record where to delete back to if we backtrack.  */
1556   last = get_last_insn ();
1557
1558   /* If we can do it with a three-operand insn, do so.  */
1559
1560   if (methods != OPTAB_MUST_WIDEN
1561       && find_widening_optab_handler (binoptab, mode,
1562                                       widened_mode (mode, op0, op1), 1)
1563             != CODE_FOR_nothing)
1564     {
1565       temp = expand_binop_directly (mode, binoptab, op0, op1, target,
1566                                     unsignedp, methods, last);
1567       if (temp)
1568         return temp;
1569     }
1570
1571   /* If we were trying to rotate, and that didn't work, try rotating
1572      the other direction before falling back to shifts and bitwise-or.  */
1573   if (((binoptab == rotl_optab
1574         && optab_handler (rotr_optab, mode) != CODE_FOR_nothing)
1575        || (binoptab == rotr_optab
1576            && optab_handler (rotl_optab, mode) != CODE_FOR_nothing))
1577       && mclass == MODE_INT)
1578     {
1579       optab otheroptab = (binoptab == rotl_optab ? rotr_optab : rotl_optab);
1580       rtx newop1;
1581       unsigned int bits = GET_MODE_PRECISION (mode);
1582
1583       if (CONST_INT_P (op1))
1584         newop1 = GEN_INT (bits - INTVAL (op1));
1585       else if (targetm.shift_truncation_mask (mode) == bits - 1)
1586         newop1 = negate_rtx (GET_MODE (op1), op1);
1587       else
1588         newop1 = expand_binop (GET_MODE (op1), sub_optab,
1589                                gen_int_mode (bits, GET_MODE (op1)), op1,
1590                                NULL_RTX, unsignedp, OPTAB_DIRECT);
1591
1592       temp = expand_binop_directly (mode, otheroptab, op0, newop1,
1593                                     target, unsignedp, methods, last);
1594       if (temp)
1595         return temp;
1596     }
1597
1598   /* If this is a multiply, see if we can do a widening operation that
1599      takes operands of this mode and makes a wider mode.  */
1600
1601   if (binoptab == smul_optab
1602       && GET_MODE_2XWIDER_MODE (mode) != VOIDmode
1603       && (widening_optab_handler ((unsignedp ? umul_widen_optab
1604                                              : smul_widen_optab),
1605                                   GET_MODE_2XWIDER_MODE (mode), mode)
1606           != CODE_FOR_nothing))
1607     {
1608       temp = expand_binop (GET_MODE_2XWIDER_MODE (mode),
1609                            unsignedp ? umul_widen_optab : smul_widen_optab,
1610                            op0, op1, NULL_RTX, unsignedp, OPTAB_DIRECT);
1611
1612       if (temp != 0)
1613         {
1614           if (GET_MODE_CLASS (mode) == MODE_INT
1615               && TRULY_NOOP_TRUNCATION_MODES_P (mode, GET_MODE (temp)))
1616             return gen_lowpart (mode, temp);
1617           else
1618             return convert_to_mode (mode, temp, unsignedp);
1619         }
1620     }
1621
1622   /* If this is a vector shift by a scalar, see if we can do a vector
1623      shift by a vector.  If so, broadcast the scalar into a vector.  */
1624   if (mclass == MODE_VECTOR_INT)
1625     {
1626       optab otheroptab = unknown_optab;
1627
1628       if (binoptab == ashl_optab)
1629         otheroptab = vashl_optab;
1630       else if (binoptab == ashr_optab)
1631         otheroptab = vashr_optab;
1632       else if (binoptab == lshr_optab)
1633         otheroptab = vlshr_optab;
1634       else if (binoptab == rotl_optab)
1635         otheroptab = vrotl_optab;
1636       else if (binoptab == rotr_optab)
1637         otheroptab = vrotr_optab;
1638
1639       if (otheroptab && optab_handler (otheroptab, mode) != CODE_FOR_nothing)
1640         {
1641           rtx vop1 = expand_vector_broadcast (mode, op1);
1642           if (vop1)
1643             {
1644               temp = expand_binop_directly (mode, otheroptab, op0, vop1,
1645                                             target, unsignedp, methods, last);
1646               if (temp)
1647                 return temp;
1648             }
1649         }
1650     }
1651
1652   /* Look for a wider mode of the same class for which we think we
1653      can open-code the operation.  Check for a widening multiply at the
1654      wider mode as well.  */
1655
1656   if (CLASS_HAS_WIDER_MODES_P (mclass)
1657       && methods != OPTAB_DIRECT && methods != OPTAB_LIB)
1658     for (wider_mode = GET_MODE_WIDER_MODE (mode);
1659          wider_mode != VOIDmode;
1660          wider_mode = GET_MODE_WIDER_MODE (wider_mode))
1661       {
1662         if (optab_handler (binoptab, wider_mode) != CODE_FOR_nothing
1663             || (binoptab == smul_optab
1664                 && GET_MODE_WIDER_MODE (wider_mode) != VOIDmode
1665                 && (find_widening_optab_handler ((unsignedp
1666                                                   ? umul_widen_optab
1667                                                   : smul_widen_optab),
1668                                                  GET_MODE_WIDER_MODE (wider_mode),
1669                                                  mode, 0)
1670                     != CODE_FOR_nothing)))
1671           {
1672             rtx xop0 = op0, xop1 = op1;
1673             int no_extend = 0;
1674
1675             /* For certain integer operations, we need not actually extend
1676                the narrow operands, as long as we will truncate
1677                the results to the same narrowness.  */
1678
1679             if ((binoptab == ior_optab || binoptab == and_optab
1680                  || binoptab == xor_optab
1681                  || binoptab == add_optab || binoptab == sub_optab
1682                  || binoptab == smul_optab || binoptab == ashl_optab)
1683                 && mclass == MODE_INT)
1684               {
1685                 no_extend = 1;
1686                 xop0 = avoid_expensive_constant (mode, binoptab, 0,
1687                                                  xop0, unsignedp);
1688                 if (binoptab != ashl_optab)
1689                   xop1 = avoid_expensive_constant (mode, binoptab, 1,
1690                                                    xop1, unsignedp);
1691               }
1692
1693             xop0 = widen_operand (xop0, wider_mode, mode, unsignedp, no_extend);
1694
1695             /* The second operand of a shift must always be extended.  */
1696             xop1 = widen_operand (xop1, wider_mode, mode, unsignedp,
1697                                   no_extend && binoptab != ashl_optab);
1698
1699             temp = expand_binop (wider_mode, binoptab, xop0, xop1, NULL_RTX,
1700                                  unsignedp, OPTAB_DIRECT);
1701             if (temp)
1702               {
1703                 if (mclass != MODE_INT
1704                     || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
1705                   {
1706                     if (target == 0)
1707                       target = gen_reg_rtx (mode);
1708                     convert_move (target, temp, 0);
1709                     return target;
1710                   }
1711                 else
1712                   return gen_lowpart (mode, temp);
1713               }
1714             else
1715               delete_insns_since (last);
1716           }
1717       }
1718
1719   /* If operation is commutative,
1720      try to make the first operand a register.
1721      Even better, try to make it the same as the target.
1722      Also try to make the last operand a constant.  */
1723   if (commutative_optab_p (binoptab)
1724       && swap_commutative_operands_with_target (target, op0, op1))
1725     {
1726       temp = op1;
1727       op1 = op0;
1728       op0 = temp;
1729     }
1730
1731   /* These can be done a word at a time.  */
1732   if ((binoptab == and_optab || binoptab == ior_optab || binoptab == xor_optab)
1733       && mclass == MODE_INT
1734       && GET_MODE_SIZE (mode) > UNITS_PER_WORD
1735       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing)
1736     {
1737       int i;
1738       rtx_insn *insns;
1739
1740       /* If TARGET is the same as one of the operands, the REG_EQUAL note
1741          won't be accurate, so use a new target.  */
1742       if (target == 0
1743           || target == op0
1744           || target == op1
1745           || !valid_multiword_target_p (target))
1746         target = gen_reg_rtx (mode);
1747
1748       start_sequence ();
1749
1750       /* Do the actual arithmetic.  */
1751       for (i = 0; i < GET_MODE_BITSIZE (mode) / BITS_PER_WORD; i++)
1752         {
1753           rtx target_piece = operand_subword (target, i, 1, mode);
1754           rtx x = expand_binop (word_mode, binoptab,
1755                                 operand_subword_force (op0, i, mode),
1756                                 operand_subword_force (op1, i, mode),
1757                                 target_piece, unsignedp, next_methods);
1758
1759           if (x == 0)
1760             break;
1761
1762           if (target_piece != x)
1763             emit_move_insn (target_piece, x);
1764         }
1765
1766       insns = get_insns ();
1767       end_sequence ();
1768
1769       if (i == GET_MODE_BITSIZE (mode) / BITS_PER_WORD)
1770         {
1771           emit_insn (insns);
1772           return target;
1773         }
1774     }
1775
1776   /* Synthesize double word shifts from single word shifts.  */
1777   if ((binoptab == lshr_optab || binoptab == ashl_optab
1778        || binoptab == ashr_optab)
1779       && mclass == MODE_INT
1780       && (CONST_INT_P (op1) || optimize_insn_for_speed_p ())
1781       && GET_MODE_SIZE (mode) == 2 * UNITS_PER_WORD
1782       && GET_MODE_PRECISION (mode) == GET_MODE_BITSIZE (mode)
1783       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing
1784       && optab_handler (ashl_optab, word_mode) != CODE_FOR_nothing
1785       && optab_handler (lshr_optab, word_mode) != CODE_FOR_nothing)
1786     {
1787       unsigned HOST_WIDE_INT shift_mask, double_shift_mask;
1788       enum machine_mode op1_mode;
1789
1790       double_shift_mask = targetm.shift_truncation_mask (mode);
1791       shift_mask = targetm.shift_truncation_mask (word_mode);
1792       op1_mode = GET_MODE (op1) != VOIDmode ? GET_MODE (op1) : word_mode;
1793
1794       /* Apply the truncation to constant shifts.  */
1795       if (double_shift_mask > 0 && CONST_INT_P (op1))
1796         op1 = GEN_INT (INTVAL (op1) & double_shift_mask);
1797
1798       if (op1 == CONST0_RTX (op1_mode))
1799         return op0;
1800
1801       /* Make sure that this is a combination that expand_doubleword_shift
1802          can handle.  See the comments there for details.  */
1803       if (double_shift_mask == 0
1804           || (shift_mask == BITS_PER_WORD - 1
1805               && double_shift_mask == BITS_PER_WORD * 2 - 1))
1806         {
1807           rtx_insn *insns;
1808           rtx into_target, outof_target;
1809           rtx into_input, outof_input;
1810           int left_shift, outof_word;
1811
1812           /* If TARGET is the same as one of the operands, the REG_EQUAL note
1813              won't be accurate, so use a new target.  */
1814           if (target == 0
1815               || target == op0
1816               || target == op1
1817               || !valid_multiword_target_p (target))
1818             target = gen_reg_rtx (mode);
1819
1820           start_sequence ();
1821
1822           /* OUTOF_* is the word we are shifting bits away from, and
1823              INTO_* is the word that we are shifting bits towards, thus
1824              they differ depending on the direction of the shift and
1825              WORDS_BIG_ENDIAN.  */
1826
1827           left_shift = binoptab == ashl_optab;
1828           outof_word = left_shift ^ ! WORDS_BIG_ENDIAN;
1829
1830           outof_target = operand_subword (target, outof_word, 1, mode);
1831           into_target = operand_subword (target, 1 - outof_word, 1, mode);
1832
1833           outof_input = operand_subword_force (op0, outof_word, mode);
1834           into_input = operand_subword_force (op0, 1 - outof_word, mode);
1835
1836           if (expand_doubleword_shift (op1_mode, binoptab,
1837                                        outof_input, into_input, op1,
1838                                        outof_target, into_target,
1839                                        unsignedp, next_methods, shift_mask))
1840             {
1841               insns = get_insns ();
1842               end_sequence ();
1843
1844               emit_insn (insns);
1845               return target;
1846             }
1847           end_sequence ();
1848         }
1849     }
1850
1851   /* Synthesize double word rotates from single word shifts.  */
1852   if ((binoptab == rotl_optab || binoptab == rotr_optab)
1853       && mclass == MODE_INT
1854       && CONST_INT_P (op1)
1855       && GET_MODE_PRECISION (mode) == 2 * BITS_PER_WORD
1856       && optab_handler (ashl_optab, word_mode) != CODE_FOR_nothing
1857       && optab_handler (lshr_optab, word_mode) != CODE_FOR_nothing)
1858     {
1859       rtx_insn *insns;
1860       rtx into_target, outof_target;
1861       rtx into_input, outof_input;
1862       rtx inter;
1863       int shift_count, left_shift, outof_word;
1864
1865       /* If TARGET is the same as one of the operands, the REG_EQUAL note
1866          won't be accurate, so use a new target. Do this also if target is not
1867          a REG, first because having a register instead may open optimization
1868          opportunities, and second because if target and op0 happen to be MEMs
1869          designating the same location, we would risk clobbering it too early
1870          in the code sequence we generate below.  */
1871       if (target == 0
1872           || target == op0
1873           || target == op1
1874           || !REG_P (target)
1875           || !valid_multiword_target_p (target))
1876         target = gen_reg_rtx (mode);
1877
1878       start_sequence ();
1879
1880       shift_count = INTVAL (op1);
1881
1882       /* OUTOF_* is the word we are shifting bits away from, and
1883          INTO_* is the word that we are shifting bits towards, thus
1884          they differ depending on the direction of the shift and
1885          WORDS_BIG_ENDIAN.  */
1886
1887       left_shift = (binoptab == rotl_optab);
1888       outof_word = left_shift ^ ! WORDS_BIG_ENDIAN;
1889
1890       outof_target = operand_subword (target, outof_word, 1, mode);
1891       into_target = operand_subword (target, 1 - outof_word, 1, mode);
1892
1893       outof_input = operand_subword_force (op0, outof_word, mode);
1894       into_input = operand_subword_force (op0, 1 - outof_word, mode);
1895
1896       if (shift_count == BITS_PER_WORD)
1897         {
1898           /* This is just a word swap.  */
1899           emit_move_insn (outof_target, into_input);
1900           emit_move_insn (into_target, outof_input);
1901           inter = const0_rtx;
1902         }
1903       else
1904         {
1905           rtx into_temp1, into_temp2, outof_temp1, outof_temp2;
1906           rtx first_shift_count, second_shift_count;
1907           optab reverse_unsigned_shift, unsigned_shift;
1908
1909           reverse_unsigned_shift = (left_shift ^ (shift_count < BITS_PER_WORD)
1910                                     ? lshr_optab : ashl_optab);
1911
1912           unsigned_shift = (left_shift ^ (shift_count < BITS_PER_WORD)
1913                             ? ashl_optab : lshr_optab);
1914
1915           if (shift_count > BITS_PER_WORD)
1916             {
1917               first_shift_count = GEN_INT (shift_count - BITS_PER_WORD);
1918               second_shift_count = GEN_INT (2 * BITS_PER_WORD - shift_count);
1919             }
1920           else
1921             {
1922               first_shift_count = GEN_INT (BITS_PER_WORD - shift_count);
1923               second_shift_count = GEN_INT (shift_count);
1924             }
1925
1926           into_temp1 = expand_binop (word_mode, unsigned_shift,
1927                                      outof_input, first_shift_count,
1928                                      NULL_RTX, unsignedp, next_methods);
1929           into_temp2 = expand_binop (word_mode, reverse_unsigned_shift,
1930                                      into_input, second_shift_count,
1931                                      NULL_RTX, unsignedp, next_methods);
1932
1933           if (into_temp1 != 0 && into_temp2 != 0)
1934             inter = expand_binop (word_mode, ior_optab, into_temp1, into_temp2,
1935                                   into_target, unsignedp, next_methods);
1936           else
1937             inter = 0;
1938
1939           if (inter != 0 && inter != into_target)
1940             emit_move_insn (into_target, inter);
1941
1942           outof_temp1 = expand_binop (word_mode, unsigned_shift,
1943                                       into_input, first_shift_count,
1944                                       NULL_RTX, unsignedp, next_methods);
1945           outof_temp2 = expand_binop (word_mode, reverse_unsigned_shift,
1946                                       outof_input, second_shift_count,
1947                                       NULL_RTX, unsignedp, next_methods);
1948
1949           if (inter != 0 && outof_temp1 != 0 && outof_temp2 != 0)
1950             inter = expand_binop (word_mode, ior_optab,
1951                                   outof_temp1, outof_temp2,
1952                                   outof_target, unsignedp, next_methods);
1953
1954           if (inter != 0 && inter != outof_target)
1955             emit_move_insn (outof_target, inter);
1956         }
1957
1958       insns = get_insns ();
1959       end_sequence ();
1960
1961       if (inter != 0)
1962         {
1963           emit_insn (insns);
1964           return target;
1965         }
1966     }
1967
1968   /* These can be done a word at a time by propagating carries.  */
1969   if ((binoptab == add_optab || binoptab == sub_optab)
1970       && mclass == MODE_INT
1971       && GET_MODE_SIZE (mode) >= 2 * UNITS_PER_WORD
1972       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing)
1973     {
1974       unsigned int i;
1975       optab otheroptab = binoptab == add_optab ? sub_optab : add_optab;
1976       const unsigned int nwords = GET_MODE_BITSIZE (mode) / BITS_PER_WORD;
1977       rtx carry_in = NULL_RTX, carry_out = NULL_RTX;
1978       rtx xop0, xop1, xtarget;
1979
1980       /* We can handle either a 1 or -1 value for the carry.  If STORE_FLAG
1981          value is one of those, use it.  Otherwise, use 1 since it is the
1982          one easiest to get.  */
1983 #if STORE_FLAG_VALUE == 1 || STORE_FLAG_VALUE == -1
1984       int normalizep = STORE_FLAG_VALUE;
1985 #else
1986       int normalizep = 1;
1987 #endif
1988
1989       /* Prepare the operands.  */
1990       xop0 = force_reg (mode, op0);
1991       xop1 = force_reg (mode, op1);
1992
1993       xtarget = gen_reg_rtx (mode);
1994
1995       if (target == 0 || !REG_P (target) || !valid_multiword_target_p (target))
1996         target = xtarget;
1997
1998       /* Indicate for flow that the entire target reg is being set.  */
1999       if (REG_P (target))
2000         emit_clobber (xtarget);
2001
2002       /* Do the actual arithmetic.  */
2003       for (i = 0; i < nwords; i++)
2004         {
2005           int index = (WORDS_BIG_ENDIAN ? nwords - i - 1 : i);
2006           rtx target_piece = operand_subword (xtarget, index, 1, mode);
2007           rtx op0_piece = operand_subword_force (xop0, index, mode);
2008           rtx op1_piece = operand_subword_force (xop1, index, mode);
2009           rtx x;
2010
2011           /* Main add/subtract of the input operands.  */
2012           x = expand_binop (word_mode, binoptab,
2013                             op0_piece, op1_piece,
2014                             target_piece, unsignedp, next_methods);
2015           if (x == 0)
2016             break;
2017
2018           if (i + 1 < nwords)
2019             {
2020               /* Store carry from main add/subtract.  */
2021               carry_out = gen_reg_rtx (word_mode);
2022               carry_out = emit_store_flag_force (carry_out,
2023                                                  (binoptab == add_optab
2024                                                   ? LT : GT),
2025                                                  x, op0_piece,
2026                                                  word_mode, 1, normalizep);
2027             }
2028
2029           if (i > 0)
2030             {
2031               rtx newx;
2032
2033               /* Add/subtract previous carry to main result.  */
2034               newx = expand_binop (word_mode,
2035                                    normalizep == 1 ? binoptab : otheroptab,
2036                                    x, carry_in,
2037                                    NULL_RTX, 1, next_methods);
2038
2039               if (i + 1 < nwords)
2040                 {
2041                   /* Get out carry from adding/subtracting carry in.  */
2042                   rtx carry_tmp = gen_reg_rtx (word_mode);
2043                   carry_tmp = emit_store_flag_force (carry_tmp,
2044                                                      (binoptab == add_optab
2045                                                       ? LT : GT),
2046                                                      newx, x,
2047                                                      word_mode, 1, normalizep);
2048
2049                   /* Logical-ior the two poss. carry together.  */
2050                   carry_out = expand_binop (word_mode, ior_optab,
2051                                             carry_out, carry_tmp,
2052                                             carry_out, 0, next_methods);
2053                   if (carry_out == 0)
2054                     break;
2055                 }
2056               emit_move_insn (target_piece, newx);
2057             }
2058           else
2059             {
2060               if (x != target_piece)
2061                 emit_move_insn (target_piece, x);
2062             }
2063
2064           carry_in = carry_out;
2065         }
2066
2067       if (i == GET_MODE_BITSIZE (mode) / (unsigned) BITS_PER_WORD)
2068         {
2069           if (optab_handler (mov_optab, mode) != CODE_FOR_nothing
2070               || ! rtx_equal_p (target, xtarget))
2071             {
2072               rtx temp = emit_move_insn (target, xtarget);
2073
2074               set_dst_reg_note (temp, REG_EQUAL,
2075                                 gen_rtx_fmt_ee (optab_to_code (binoptab),
2076                                                 mode, copy_rtx (xop0),
2077                                                 copy_rtx (xop1)),
2078                                 target);
2079             }
2080           else
2081             target = xtarget;
2082
2083           return target;
2084         }
2085
2086       else
2087         delete_insns_since (last);
2088     }
2089
2090   /* Attempt to synthesize double word multiplies using a sequence of word
2091      mode multiplications.  We first attempt to generate a sequence using a
2092      more efficient unsigned widening multiply, and if that fails we then
2093      try using a signed widening multiply.  */
2094
2095   if (binoptab == smul_optab
2096       && mclass == MODE_INT
2097       && GET_MODE_SIZE (mode) == 2 * UNITS_PER_WORD
2098       && optab_handler (smul_optab, word_mode) != CODE_FOR_nothing
2099       && optab_handler (add_optab, word_mode) != CODE_FOR_nothing)
2100     {
2101       rtx product = NULL_RTX;
2102       if (widening_optab_handler (umul_widen_optab, mode, word_mode)
2103             != CODE_FOR_nothing)
2104         {
2105           product = expand_doubleword_mult (mode, op0, op1, target,
2106                                             true, methods);
2107           if (!product)
2108             delete_insns_since (last);
2109         }
2110
2111       if (product == NULL_RTX
2112           && widening_optab_handler (smul_widen_optab, mode, word_mode)
2113                 != CODE_FOR_nothing)
2114         {
2115           product = expand_doubleword_mult (mode, op0, op1, target,
2116                                             false, methods);
2117           if (!product)
2118             delete_insns_since (last);
2119         }
2120
2121       if (product != NULL_RTX)
2122         {
2123           if (optab_handler (mov_optab, mode) != CODE_FOR_nothing)
2124             {
2125               temp = emit_move_insn (target ? target : product, product);
2126               set_dst_reg_note (temp,
2127                                 REG_EQUAL,
2128                                 gen_rtx_fmt_ee (MULT, mode,
2129                                                 copy_rtx (op0),
2130                                                 copy_rtx (op1)),
2131                                 target ? target : product);
2132             }
2133           return product;
2134         }
2135     }
2136
2137   /* It can't be open-coded in this mode.
2138      Use a library call if one is available and caller says that's ok.  */
2139
2140   libfunc = optab_libfunc (binoptab, mode);
2141   if (libfunc
2142       && (methods == OPTAB_LIB || methods == OPTAB_LIB_WIDEN))
2143     {
2144       rtx_insn *insns;
2145       rtx op1x = op1;
2146       enum machine_mode op1_mode = mode;
2147       rtx value;
2148
2149       start_sequence ();
2150
2151       if (shift_optab_p (binoptab))
2152         {
2153           op1_mode = targetm.libgcc_shift_count_mode ();
2154           /* Specify unsigned here,
2155              since negative shift counts are meaningless.  */
2156           op1x = convert_to_mode (op1_mode, op1, 1);
2157         }
2158
2159       if (GET_MODE (op0) != VOIDmode
2160           && GET_MODE (op0) != mode)
2161         op0 = convert_to_mode (mode, op0, unsignedp);
2162
2163       /* Pass 1 for NO_QUEUE so we don't lose any increments
2164          if the libcall is cse'd or moved.  */
2165       value = emit_library_call_value (libfunc,
2166                                        NULL_RTX, LCT_CONST, mode, 2,
2167                                        op0, mode, op1x, op1_mode);
2168
2169       insns = get_insns ();
2170       end_sequence ();
2171
2172       target = gen_reg_rtx (mode);
2173       emit_libcall_block_1 (insns, target, value,
2174                             gen_rtx_fmt_ee (optab_to_code (binoptab),
2175                                             mode, op0, op1),
2176                             trapv_binoptab_p (binoptab));
2177
2178       return target;
2179     }
2180
2181   delete_insns_since (last);
2182
2183   /* It can't be done in this mode.  Can we do it in a wider mode?  */
2184
2185   if (! (methods == OPTAB_WIDEN || methods == OPTAB_LIB_WIDEN
2186          || methods == OPTAB_MUST_WIDEN))
2187     {
2188       /* Caller says, don't even try.  */
2189       delete_insns_since (entry_last);
2190       return 0;
2191     }
2192
2193   /* Compute the value of METHODS to pass to recursive calls.
2194      Don't allow widening to be tried recursively.  */
2195
2196   methods = (methods == OPTAB_LIB_WIDEN ? OPTAB_LIB : OPTAB_DIRECT);
2197
2198   /* Look for a wider mode of the same class for which it appears we can do
2199      the operation.  */
2200
2201   if (CLASS_HAS_WIDER_MODES_P (mclass))
2202     {
2203       for (wider_mode = GET_MODE_WIDER_MODE (mode);
2204            wider_mode != VOIDmode;
2205            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2206         {
2207           if (find_widening_optab_handler (binoptab, wider_mode, mode, 1)
2208                   != CODE_FOR_nothing
2209               || (methods == OPTAB_LIB
2210                   && optab_libfunc (binoptab, wider_mode)))
2211             {
2212               rtx xop0 = op0, xop1 = op1;
2213               int no_extend = 0;
2214
2215               /* For certain integer operations, we need not actually extend
2216                  the narrow operands, as long as we will truncate
2217                  the results to the same narrowness.  */
2218
2219               if ((binoptab == ior_optab || binoptab == and_optab
2220                    || binoptab == xor_optab
2221                    || binoptab == add_optab || binoptab == sub_optab
2222                    || binoptab == smul_optab || binoptab == ashl_optab)
2223                   && mclass == MODE_INT)
2224                 no_extend = 1;
2225
2226               xop0 = widen_operand (xop0, wider_mode, mode,
2227                                     unsignedp, no_extend);
2228
2229               /* The second operand of a shift must always be extended.  */
2230               xop1 = widen_operand (xop1, wider_mode, mode, unsignedp,
2231                                     no_extend && binoptab != ashl_optab);
2232
2233               temp = expand_binop (wider_mode, binoptab, xop0, xop1, NULL_RTX,
2234                                    unsignedp, methods);
2235               if (temp)
2236                 {
2237                   if (mclass != MODE_INT
2238                       || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
2239                     {
2240                       if (target == 0)
2241                         target = gen_reg_rtx (mode);
2242                       convert_move (target, temp, 0);
2243                       return target;
2244                     }
2245                   else
2246                     return gen_lowpart (mode, temp);
2247                 }
2248               else
2249                 delete_insns_since (last);
2250             }
2251         }
2252     }
2253
2254   delete_insns_since (entry_last);
2255   return 0;
2256 }
2257 \f
2258 /* Expand a binary operator which has both signed and unsigned forms.
2259    UOPTAB is the optab for unsigned operations, and SOPTAB is for
2260    signed operations.
2261
2262    If we widen unsigned operands, we may use a signed wider operation instead
2263    of an unsigned wider operation, since the result would be the same.  */
2264
2265 rtx
2266 sign_expand_binop (enum machine_mode mode, optab uoptab, optab soptab,
2267                    rtx op0, rtx op1, rtx target, int unsignedp,
2268                    enum optab_methods methods)
2269 {
2270   rtx temp;
2271   optab direct_optab = unsignedp ? uoptab : soptab;
2272   bool save_enable;
2273
2274   /* Do it without widening, if possible.  */
2275   temp = expand_binop (mode, direct_optab, op0, op1, target,
2276                        unsignedp, OPTAB_DIRECT);
2277   if (temp || methods == OPTAB_DIRECT)
2278     return temp;
2279
2280   /* Try widening to a signed int.  Disable any direct use of any
2281      signed insn in the current mode.  */
2282   save_enable = swap_optab_enable (soptab, mode, false);
2283
2284   temp = expand_binop (mode, soptab, op0, op1, target,
2285                        unsignedp, OPTAB_WIDEN);
2286
2287   /* For unsigned operands, try widening to an unsigned int.  */
2288   if (!temp && unsignedp)
2289     temp = expand_binop (mode, uoptab, op0, op1, target,
2290                          unsignedp, OPTAB_WIDEN);
2291   if (temp || methods == OPTAB_WIDEN)
2292     goto egress;
2293
2294   /* Use the right width libcall if that exists.  */
2295   temp = expand_binop (mode, direct_optab, op0, op1, target,
2296                        unsignedp, OPTAB_LIB);
2297   if (temp || methods == OPTAB_LIB)
2298     goto egress;
2299
2300   /* Must widen and use a libcall, use either signed or unsigned.  */
2301   temp = expand_binop (mode, soptab, op0, op1, target,
2302                        unsignedp, methods);
2303   if (!temp && unsignedp)
2304     temp = expand_binop (mode, uoptab, op0, op1, target,
2305                          unsignedp, methods);
2306
2307  egress:
2308   /* Undo the fiddling above.  */
2309   if (save_enable)
2310     swap_optab_enable (soptab, mode, true);
2311   return temp;
2312 }
2313 \f
2314 /* Generate code to perform an operation specified by UNOPPTAB
2315    on operand OP0, with two results to TARG0 and TARG1.
2316    We assume that the order of the operands for the instruction
2317    is TARG0, TARG1, OP0.
2318
2319    Either TARG0 or TARG1 may be zero, but what that means is that
2320    the result is not actually wanted.  We will generate it into
2321    a dummy pseudo-reg and discard it.  They may not both be zero.
2322
2323    Returns 1 if this operation can be performed; 0 if not.  */
2324
2325 int
2326 expand_twoval_unop (optab unoptab, rtx op0, rtx targ0, rtx targ1,
2327                     int unsignedp)
2328 {
2329   enum machine_mode mode = GET_MODE (targ0 ? targ0 : targ1);
2330   enum mode_class mclass;
2331   enum machine_mode wider_mode;
2332   rtx_insn *entry_last = get_last_insn ();
2333   rtx_insn *last;
2334
2335   mclass = GET_MODE_CLASS (mode);
2336
2337   if (!targ0)
2338     targ0 = gen_reg_rtx (mode);
2339   if (!targ1)
2340     targ1 = gen_reg_rtx (mode);
2341
2342   /* Record where to go back to if we fail.  */
2343   last = get_last_insn ();
2344
2345   if (optab_handler (unoptab, mode) != CODE_FOR_nothing)
2346     {
2347       struct expand_operand ops[3];
2348       enum insn_code icode = optab_handler (unoptab, mode);
2349
2350       create_fixed_operand (&ops[0], targ0);
2351       create_fixed_operand (&ops[1], targ1);
2352       create_convert_operand_from (&ops[2], op0, mode, unsignedp);
2353       if (maybe_expand_insn (icode, 3, ops))
2354         return 1;
2355     }
2356
2357   /* It can't be done in this mode.  Can we do it in a wider mode?  */
2358
2359   if (CLASS_HAS_WIDER_MODES_P (mclass))
2360     {
2361       for (wider_mode = GET_MODE_WIDER_MODE (mode);
2362            wider_mode != VOIDmode;
2363            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2364         {
2365           if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
2366             {
2367               rtx t0 = gen_reg_rtx (wider_mode);
2368               rtx t1 = gen_reg_rtx (wider_mode);
2369               rtx cop0 = convert_modes (wider_mode, mode, op0, unsignedp);
2370
2371               if (expand_twoval_unop (unoptab, cop0, t0, t1, unsignedp))
2372                 {
2373                   convert_move (targ0, t0, unsignedp);
2374                   convert_move (targ1, t1, unsignedp);
2375                   return 1;
2376                 }
2377               else
2378                 delete_insns_since (last);
2379             }
2380         }
2381     }
2382
2383   delete_insns_since (entry_last);
2384   return 0;
2385 }
2386 \f
2387 /* Generate code to perform an operation specified by BINOPTAB
2388    on operands OP0 and OP1, with two results to TARG1 and TARG2.
2389    We assume that the order of the operands for the instruction
2390    is TARG0, OP0, OP1, TARG1, which would fit a pattern like
2391    [(set TARG0 (operate OP0 OP1)) (set TARG1 (operate ...))].
2392
2393    Either TARG0 or TARG1 may be zero, but what that means is that
2394    the result is not actually wanted.  We will generate it into
2395    a dummy pseudo-reg and discard it.  They may not both be zero.
2396
2397    Returns 1 if this operation can be performed; 0 if not.  */
2398
2399 int
2400 expand_twoval_binop (optab binoptab, rtx op0, rtx op1, rtx targ0, rtx targ1,
2401                      int unsignedp)
2402 {
2403   enum machine_mode mode = GET_MODE (targ0 ? targ0 : targ1);
2404   enum mode_class mclass;
2405   enum machine_mode wider_mode;
2406   rtx_insn *entry_last = get_last_insn ();
2407   rtx_insn *last;
2408
2409   mclass = GET_MODE_CLASS (mode);
2410
2411   if (!targ0)
2412     targ0 = gen_reg_rtx (mode);
2413   if (!targ1)
2414     targ1 = gen_reg_rtx (mode);
2415
2416   /* Record where to go back to if we fail.  */
2417   last = get_last_insn ();
2418
2419   if (optab_handler (binoptab, mode) != CODE_FOR_nothing)
2420     {
2421       struct expand_operand ops[4];
2422       enum insn_code icode = optab_handler (binoptab, mode);
2423       enum machine_mode mode0 = insn_data[icode].operand[1].mode;
2424       enum machine_mode mode1 = insn_data[icode].operand[2].mode;
2425       rtx xop0 = op0, xop1 = op1;
2426
2427       /* If we are optimizing, force expensive constants into a register.  */
2428       xop0 = avoid_expensive_constant (mode0, binoptab, 0, xop0, unsignedp);
2429       xop1 = avoid_expensive_constant (mode1, binoptab, 1, xop1, unsignedp);
2430
2431       create_fixed_operand (&ops[0], targ0);
2432       create_convert_operand_from (&ops[1], op0, mode, unsignedp);
2433       create_convert_operand_from (&ops[2], op1, mode, unsignedp);
2434       create_fixed_operand (&ops[3], targ1);
2435       if (maybe_expand_insn (icode, 4, ops))
2436         return 1;
2437       delete_insns_since (last);
2438     }
2439
2440   /* It can't be done in this mode.  Can we do it in a wider mode?  */
2441
2442   if (CLASS_HAS_WIDER_MODES_P (mclass))
2443     {
2444       for (wider_mode = GET_MODE_WIDER_MODE (mode);
2445            wider_mode != VOIDmode;
2446            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2447         {
2448           if (optab_handler (binoptab, wider_mode) != CODE_FOR_nothing)
2449             {
2450               rtx t0 = gen_reg_rtx (wider_mode);
2451               rtx t1 = gen_reg_rtx (wider_mode);
2452               rtx cop0 = convert_modes (wider_mode, mode, op0, unsignedp);
2453               rtx cop1 = convert_modes (wider_mode, mode, op1, unsignedp);
2454
2455               if (expand_twoval_binop (binoptab, cop0, cop1,
2456                                        t0, t1, unsignedp))
2457                 {
2458                   convert_move (targ0, t0, unsignedp);
2459                   convert_move (targ1, t1, unsignedp);
2460                   return 1;
2461                 }
2462               else
2463                 delete_insns_since (last);
2464             }
2465         }
2466     }
2467
2468   delete_insns_since (entry_last);
2469   return 0;
2470 }
2471
2472 /* Expand the two-valued library call indicated by BINOPTAB, but
2473    preserve only one of the values.  If TARG0 is non-NULL, the first
2474    value is placed into TARG0; otherwise the second value is placed
2475    into TARG1.  Exactly one of TARG0 and TARG1 must be non-NULL.  The
2476    value stored into TARG0 or TARG1 is equivalent to (CODE OP0 OP1).
2477    This routine assumes that the value returned by the library call is
2478    as if the return value was of an integral mode twice as wide as the
2479    mode of OP0.  Returns 1 if the call was successful.  */
2480
2481 bool
2482 expand_twoval_binop_libfunc (optab binoptab, rtx op0, rtx op1,
2483                              rtx targ0, rtx targ1, enum rtx_code code)
2484 {
2485   enum machine_mode mode;
2486   enum machine_mode libval_mode;
2487   rtx libval;
2488   rtx_insn *insns;
2489   rtx libfunc;
2490
2491   /* Exactly one of TARG0 or TARG1 should be non-NULL.  */
2492   gcc_assert (!targ0 != !targ1);
2493
2494   mode = GET_MODE (op0);
2495   libfunc = optab_libfunc (binoptab, mode);
2496   if (!libfunc)
2497     return false;
2498
2499   /* The value returned by the library function will have twice as
2500      many bits as the nominal MODE.  */
2501   libval_mode = smallest_mode_for_size (2 * GET_MODE_BITSIZE (mode),
2502                                         MODE_INT);
2503   start_sequence ();
2504   libval = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
2505                                     libval_mode, 2,
2506                                     op0, mode,
2507                                     op1, mode);
2508   /* Get the part of VAL containing the value that we want.  */
2509   libval = simplify_gen_subreg (mode, libval, libval_mode,
2510                                 targ0 ? 0 : GET_MODE_SIZE (mode));
2511   insns = get_insns ();
2512   end_sequence ();
2513   /* Move the into the desired location.  */
2514   emit_libcall_block (insns, targ0 ? targ0 : targ1, libval,
2515                       gen_rtx_fmt_ee (code, mode, op0, op1));
2516
2517   return true;
2518 }
2519
2520 \f
2521 /* Wrapper around expand_unop which takes an rtx code to specify
2522    the operation to perform, not an optab pointer.  All other
2523    arguments are the same.  */
2524 rtx
2525 expand_simple_unop (enum machine_mode mode, enum rtx_code code, rtx op0,
2526                     rtx target, int unsignedp)
2527 {
2528   optab unop = code_to_optab (code);
2529   gcc_assert (unop);
2530
2531   return expand_unop (mode, unop, op0, target, unsignedp);
2532 }
2533
2534 /* Try calculating
2535         (clz:narrow x)
2536    as
2537         (clz:wide (zero_extend:wide x)) - ((width wide) - (width narrow)).
2538
2539    A similar operation can be used for clrsb.  UNOPTAB says which operation
2540    we are trying to expand.  */
2541 static rtx
2542 widen_leading (enum machine_mode mode, rtx op0, rtx target, optab unoptab)
2543 {
2544   enum mode_class mclass = GET_MODE_CLASS (mode);
2545   if (CLASS_HAS_WIDER_MODES_P (mclass))
2546     {
2547       enum machine_mode wider_mode;
2548       for (wider_mode = GET_MODE_WIDER_MODE (mode);
2549            wider_mode != VOIDmode;
2550            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2551         {
2552           if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
2553             {
2554               rtx xop0, temp;
2555               rtx_insn *last;
2556
2557               last = get_last_insn ();
2558
2559               if (target == 0)
2560                 target = gen_reg_rtx (mode);
2561               xop0 = widen_operand (op0, wider_mode, mode,
2562                                     unoptab != clrsb_optab, false);
2563               temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
2564                                   unoptab != clrsb_optab);
2565               if (temp != 0)
2566                 temp = expand_binop
2567                   (wider_mode, sub_optab, temp,
2568                    gen_int_mode (GET_MODE_PRECISION (wider_mode)
2569                                  - GET_MODE_PRECISION (mode),
2570                                  wider_mode),
2571                    target, true, OPTAB_DIRECT);
2572               if (temp == 0)
2573                 delete_insns_since (last);
2574
2575               return temp;
2576             }
2577         }
2578     }
2579   return 0;
2580 }
2581
2582 /* Try calculating clz of a double-word quantity as two clz's of word-sized
2583    quantities, choosing which based on whether the high word is nonzero.  */
2584 static rtx
2585 expand_doubleword_clz (enum machine_mode mode, rtx op0, rtx target)
2586 {
2587   rtx xop0 = force_reg (mode, op0);
2588   rtx subhi = gen_highpart (word_mode, xop0);
2589   rtx sublo = gen_lowpart (word_mode, xop0);
2590   rtx_code_label *hi0_label = gen_label_rtx ();
2591   rtx_code_label *after_label = gen_label_rtx ();
2592   rtx_insn *seq;
2593   rtx temp, result;
2594
2595   /* If we were not given a target, use a word_mode register, not a
2596      'mode' register.  The result will fit, and nobody is expecting
2597      anything bigger (the return type of __builtin_clz* is int).  */
2598   if (!target)
2599     target = gen_reg_rtx (word_mode);
2600
2601   /* In any case, write to a word_mode scratch in both branches of the
2602      conditional, so we can ensure there is a single move insn setting
2603      'target' to tag a REG_EQUAL note on.  */
2604   result = gen_reg_rtx (word_mode);
2605
2606   start_sequence ();
2607
2608   /* If the high word is not equal to zero,
2609      then clz of the full value is clz of the high word.  */
2610   emit_cmp_and_jump_insns (subhi, CONST0_RTX (word_mode), EQ, 0,
2611                            word_mode, true, hi0_label);
2612
2613   temp = expand_unop_direct (word_mode, clz_optab, subhi, result, true);
2614   if (!temp)
2615     goto fail;
2616
2617   if (temp != result)
2618     convert_move (result, temp, true);
2619
2620   emit_jump_insn (gen_jump (after_label));
2621   emit_barrier ();
2622
2623   /* Else clz of the full value is clz of the low word plus the number
2624      of bits in the high word.  */
2625   emit_label (hi0_label);
2626
2627   temp = expand_unop_direct (word_mode, clz_optab, sublo, 0, true);
2628   if (!temp)
2629     goto fail;
2630   temp = expand_binop (word_mode, add_optab, temp,
2631                        gen_int_mode (GET_MODE_BITSIZE (word_mode), word_mode),
2632                        result, true, OPTAB_DIRECT);
2633   if (!temp)
2634     goto fail;
2635   if (temp != result)
2636     convert_move (result, temp, true);
2637
2638   emit_label (after_label);
2639   convert_move (target, result, true);
2640
2641   seq = get_insns ();
2642   end_sequence ();
2643
2644   add_equal_note (seq, target, CLZ, xop0, 0);
2645   emit_insn (seq);
2646   return target;
2647
2648  fail:
2649   end_sequence ();
2650   return 0;
2651 }
2652
2653 /* Try calculating
2654         (bswap:narrow x)
2655    as
2656         (lshiftrt:wide (bswap:wide x) ((width wide) - (width narrow))).  */
2657 static rtx
2658 widen_bswap (enum machine_mode mode, rtx op0, rtx target)
2659 {
2660   enum mode_class mclass = GET_MODE_CLASS (mode);
2661   enum machine_mode wider_mode;
2662   rtx x;
2663   rtx_insn *last;
2664
2665   if (!CLASS_HAS_WIDER_MODES_P (mclass))
2666     return NULL_RTX;
2667
2668   for (wider_mode = GET_MODE_WIDER_MODE (mode);
2669        wider_mode != VOIDmode;
2670        wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2671     if (optab_handler (bswap_optab, wider_mode) != CODE_FOR_nothing)
2672       goto found;
2673   return NULL_RTX;
2674
2675  found:
2676   last = get_last_insn ();
2677
2678   x = widen_operand (op0, wider_mode, mode, true, true);
2679   x = expand_unop (wider_mode, bswap_optab, x, NULL_RTX, true);
2680
2681   gcc_assert (GET_MODE_PRECISION (wider_mode) == GET_MODE_BITSIZE (wider_mode)
2682               && GET_MODE_PRECISION (mode) == GET_MODE_BITSIZE (mode));
2683   if (x != 0)
2684     x = expand_shift (RSHIFT_EXPR, wider_mode, x,
2685                       GET_MODE_BITSIZE (wider_mode)
2686                       - GET_MODE_BITSIZE (mode),
2687                       NULL_RTX, true);
2688
2689   if (x != 0)
2690     {
2691       if (target == 0)
2692         target = gen_reg_rtx (mode);
2693       emit_move_insn (target, gen_lowpart (mode, x));
2694     }
2695   else
2696     delete_insns_since (last);
2697
2698   return target;
2699 }
2700
2701 /* Try calculating bswap as two bswaps of two word-sized operands.  */
2702
2703 static rtx
2704 expand_doubleword_bswap (enum machine_mode mode, rtx op, rtx target)
2705 {
2706   rtx t0, t1;
2707
2708   t1 = expand_unop (word_mode, bswap_optab,
2709                     operand_subword_force (op, 0, mode), NULL_RTX, true);
2710   t0 = expand_unop (word_mode, bswap_optab,
2711                     operand_subword_force (op, 1, mode), NULL_RTX, true);
2712
2713   if (target == 0 || !valid_multiword_target_p (target))
2714     target = gen_reg_rtx (mode);
2715   if (REG_P (target))
2716     emit_clobber (target);
2717   emit_move_insn (operand_subword (target, 0, 1, mode), t0);
2718   emit_move_insn (operand_subword (target, 1, 1, mode), t1);
2719
2720   return target;
2721 }
2722
2723 /* Try calculating (parity x) as (and (popcount x) 1), where
2724    popcount can also be done in a wider mode.  */
2725 static rtx
2726 expand_parity (enum machine_mode mode, rtx op0, rtx target)
2727 {
2728   enum mode_class mclass = GET_MODE_CLASS (mode);
2729   if (CLASS_HAS_WIDER_MODES_P (mclass))
2730     {
2731       enum machine_mode wider_mode;
2732       for (wider_mode = mode; wider_mode != VOIDmode;
2733            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2734         {
2735           if (optab_handler (popcount_optab, wider_mode) != CODE_FOR_nothing)
2736             {
2737               rtx xop0, temp;
2738               rtx_insn *last;
2739
2740               last = get_last_insn ();
2741
2742               if (target == 0)
2743                 target = gen_reg_rtx (mode);
2744               xop0 = widen_operand (op0, wider_mode, mode, true, false);
2745               temp = expand_unop (wider_mode, popcount_optab, xop0, NULL_RTX,
2746                                   true);
2747               if (temp != 0)
2748                 temp = expand_binop (wider_mode, and_optab, temp, const1_rtx,
2749                                      target, true, OPTAB_DIRECT);
2750               if (temp == 0)
2751                 delete_insns_since (last);
2752
2753               return temp;
2754             }
2755         }
2756     }
2757   return 0;
2758 }
2759
2760 /* Try calculating ctz(x) as K - clz(x & -x) ,
2761    where K is GET_MODE_PRECISION(mode) - 1.
2762
2763    Both __builtin_ctz and __builtin_clz are undefined at zero, so we
2764    don't have to worry about what the hardware does in that case.  (If
2765    the clz instruction produces the usual value at 0, which is K, the
2766    result of this code sequence will be -1; expand_ffs, below, relies
2767    on this.  It might be nice to have it be K instead, for consistency
2768    with the (very few) processors that provide a ctz with a defined
2769    value, but that would take one more instruction, and it would be
2770    less convenient for expand_ffs anyway.  */
2771
2772 static rtx
2773 expand_ctz (enum machine_mode mode, rtx op0, rtx target)
2774 {
2775   rtx_insn *seq;
2776   rtx temp;
2777
2778   if (optab_handler (clz_optab, mode) == CODE_FOR_nothing)
2779     return 0;
2780
2781   start_sequence ();
2782
2783   temp = expand_unop_direct (mode, neg_optab, op0, NULL_RTX, true);
2784   if (temp)
2785     temp = expand_binop (mode, and_optab, op0, temp, NULL_RTX,
2786                          true, OPTAB_DIRECT);
2787   if (temp)
2788     temp = expand_unop_direct (mode, clz_optab, temp, NULL_RTX, true);
2789   if (temp)
2790     temp = expand_binop (mode, sub_optab,
2791                          gen_int_mode (GET_MODE_PRECISION (mode) - 1, mode),
2792                          temp, target,
2793                          true, OPTAB_DIRECT);
2794   if (temp == 0)
2795     {
2796       end_sequence ();
2797       return 0;
2798     }
2799
2800   seq = get_insns ();
2801   end_sequence ();
2802
2803   add_equal_note (seq, temp, CTZ, op0, 0);
2804   emit_insn (seq);
2805   return temp;
2806 }
2807
2808
2809 /* Try calculating ffs(x) using ctz(x) if we have that instruction, or
2810    else with the sequence used by expand_clz.
2811
2812    The ffs builtin promises to return zero for a zero value and ctz/clz
2813    may have an undefined value in that case.  If they do not give us a
2814    convenient value, we have to generate a test and branch.  */
2815 static rtx
2816 expand_ffs (enum machine_mode mode, rtx op0, rtx target)
2817 {
2818   HOST_WIDE_INT val = 0;
2819   bool defined_at_zero = false;
2820   rtx temp;
2821   rtx_insn *seq;
2822
2823   if (optab_handler (ctz_optab, mode) != CODE_FOR_nothing)
2824     {
2825       start_sequence ();
2826
2827       temp = expand_unop_direct (mode, ctz_optab, op0, 0, true);
2828       if (!temp)
2829         goto fail;
2830
2831       defined_at_zero = (CTZ_DEFINED_VALUE_AT_ZERO (mode, val) == 2);
2832     }
2833   else if (optab_handler (clz_optab, mode) != CODE_FOR_nothing)
2834     {
2835       start_sequence ();
2836       temp = expand_ctz (mode, op0, 0);
2837       if (!temp)
2838         goto fail;
2839
2840       if (CLZ_DEFINED_VALUE_AT_ZERO (mode, val) == 2)
2841         {
2842           defined_at_zero = true;
2843           val = (GET_MODE_PRECISION (mode) - 1) - val;
2844         }
2845     }
2846   else
2847     return 0;
2848
2849   if (defined_at_zero && val == -1)
2850     /* No correction needed at zero.  */;
2851   else
2852     {
2853       /* We don't try to do anything clever with the situation found
2854          on some processors (eg Alpha) where ctz(0:mode) ==
2855          bitsize(mode).  If someone can think of a way to send N to -1
2856          and leave alone all values in the range 0..N-1 (where N is a
2857          power of two), cheaper than this test-and-branch, please add it.
2858
2859          The test-and-branch is done after the operation itself, in case
2860          the operation sets condition codes that can be recycled for this.
2861          (This is true on i386, for instance.)  */
2862
2863       rtx_code_label *nonzero_label = gen_label_rtx ();
2864       emit_cmp_and_jump_insns (op0, CONST0_RTX (mode), NE, 0,
2865                                mode, true, nonzero_label);
2866
2867       convert_move (temp, GEN_INT (-1), false);
2868       emit_label (nonzero_label);
2869     }
2870
2871   /* temp now has a value in the range -1..bitsize-1.  ffs is supposed
2872      to produce a value in the range 0..bitsize.  */
2873   temp = expand_binop (mode, add_optab, temp, gen_int_mode (1, mode),
2874                        target, false, OPTAB_DIRECT);
2875   if (!temp)
2876     goto fail;
2877
2878   seq = get_insns ();
2879   end_sequence ();
2880
2881   add_equal_note (seq, temp, FFS, op0, 0);
2882   emit_insn (seq);
2883   return temp;
2884
2885  fail:
2886   end_sequence ();
2887   return 0;
2888 }
2889
2890 /* Extract the OMODE lowpart from VAL, which has IMODE.  Under certain
2891    conditions, VAL may already be a SUBREG against which we cannot generate
2892    a further SUBREG.  In this case, we expect forcing the value into a
2893    register will work around the situation.  */
2894
2895 static rtx
2896 lowpart_subreg_maybe_copy (enum machine_mode omode, rtx val,
2897                            enum machine_mode imode)
2898 {
2899   rtx ret;
2900   ret = lowpart_subreg (omode, val, imode);
2901   if (ret == NULL)
2902     {
2903       val = force_reg (imode, val);
2904       ret = lowpart_subreg (omode, val, imode);
2905       gcc_assert (ret != NULL);
2906     }
2907   return ret;
2908 }
2909
2910 /* Expand a floating point absolute value or negation operation via a
2911    logical operation on the sign bit.  */
2912
2913 static rtx
2914 expand_absneg_bit (enum rtx_code code, enum machine_mode mode,
2915                    rtx op0, rtx target)
2916 {
2917   const struct real_format *fmt;
2918   int bitpos, word, nwords, i;
2919   enum machine_mode imode;
2920   rtx temp;
2921   rtx_insn *insns;
2922
2923   /* The format has to have a simple sign bit.  */
2924   fmt = REAL_MODE_FORMAT (mode);
2925   if (fmt == NULL)
2926     return NULL_RTX;
2927
2928   bitpos = fmt->signbit_rw;
2929   if (bitpos < 0)
2930     return NULL_RTX;
2931
2932   /* Don't create negative zeros if the format doesn't support them.  */
2933   if (code == NEG && !fmt->has_signed_zero)
2934     return NULL_RTX;
2935
2936   if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
2937     {
2938       imode = int_mode_for_mode (mode);
2939       if (imode == BLKmode)
2940         return NULL_RTX;
2941       word = 0;
2942       nwords = 1;
2943     }
2944   else
2945     {
2946       imode = word_mode;
2947
2948       if (FLOAT_WORDS_BIG_ENDIAN)
2949         word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
2950       else
2951         word = bitpos / BITS_PER_WORD;
2952       bitpos = bitpos % BITS_PER_WORD;
2953       nwords = (GET_MODE_BITSIZE (mode) + BITS_PER_WORD - 1) / BITS_PER_WORD;
2954     }
2955
2956   wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
2957   if (code == ABS)
2958     mask = ~mask;
2959
2960   if (target == 0
2961       || target == op0
2962       || (nwords > 1 && !valid_multiword_target_p (target)))
2963     target = gen_reg_rtx (mode);
2964
2965   if (nwords > 1)
2966     {
2967       start_sequence ();
2968
2969       for (i = 0; i < nwords; ++i)
2970         {
2971           rtx targ_piece = operand_subword (target, i, 1, mode);
2972           rtx op0_piece = operand_subword_force (op0, i, mode);
2973
2974           if (i == word)
2975             {
2976               temp = expand_binop (imode, code == ABS ? and_optab : xor_optab,
2977                                    op0_piece,
2978                                    immed_wide_int_const (mask, imode),
2979                                    targ_piece, 1, OPTAB_LIB_WIDEN);
2980               if (temp != targ_piece)
2981                 emit_move_insn (targ_piece, temp);
2982             }
2983           else
2984             emit_move_insn (targ_piece, op0_piece);
2985         }
2986
2987       insns = get_insns ();
2988       end_sequence ();
2989
2990       emit_insn (insns);
2991     }
2992   else
2993     {
2994       temp = expand_binop (imode, code == ABS ? and_optab : xor_optab,
2995                            gen_lowpart (imode, op0),
2996                            immed_wide_int_const (mask, imode),
2997                            gen_lowpart (imode, target), 1, OPTAB_LIB_WIDEN);
2998       target = lowpart_subreg_maybe_copy (mode, temp, imode);
2999
3000       set_dst_reg_note (get_last_insn (), REG_EQUAL,
3001                         gen_rtx_fmt_e (code, mode, copy_rtx (op0)),
3002                         target);
3003     }
3004
3005   return target;
3006 }
3007
3008 /* As expand_unop, but will fail rather than attempt the operation in a
3009    different mode or with a libcall.  */
3010 static rtx
3011 expand_unop_direct (enum machine_mode mode, optab unoptab, rtx op0, rtx target,
3012              int unsignedp)
3013 {
3014   if (optab_handler (unoptab, mode) != CODE_FOR_nothing)
3015     {
3016       struct expand_operand ops[2];
3017       enum insn_code icode = optab_handler (unoptab, mode);
3018       rtx_insn *last = get_last_insn ();
3019       rtx pat;
3020
3021       create_output_operand (&ops[0], target, mode);
3022       create_convert_operand_from (&ops[1], op0, mode, unsignedp);
3023       pat = maybe_gen_insn (icode, 2, ops);
3024       if (pat)
3025         {
3026           if (INSN_P (pat) && NEXT_INSN (as_a <rtx_insn *> (pat)) != NULL_RTX
3027               && ! add_equal_note (as_a <rtx_insn *> (pat), ops[0].value,
3028                                    optab_to_code (unoptab),
3029                                    ops[1].value, NULL_RTX))
3030             {
3031               delete_insns_since (last);
3032               return expand_unop (mode, unoptab, op0, NULL_RTX, unsignedp);
3033             }
3034
3035           emit_insn (pat);
3036
3037           return ops[0].value;
3038         }
3039     }
3040   return 0;
3041 }
3042
3043 /* Generate code to perform an operation specified by UNOPTAB
3044    on operand OP0, with result having machine-mode MODE.
3045
3046    UNSIGNEDP is for the case where we have to widen the operands
3047    to perform the operation.  It says to use zero-extension.
3048
3049    If TARGET is nonzero, the value
3050    is generated there, if it is convenient to do so.
3051    In all cases an rtx is returned for the locus of the value;
3052    this may or may not be TARGET.  */
3053
3054 rtx
3055 expand_unop (enum machine_mode mode, optab unoptab, rtx op0, rtx target,
3056              int unsignedp)
3057 {
3058   enum mode_class mclass = GET_MODE_CLASS (mode);
3059   enum machine_mode wider_mode;
3060   rtx temp;
3061   rtx libfunc;
3062
3063   temp = expand_unop_direct (mode, unoptab, op0, target, unsignedp);
3064   if (temp)
3065     return temp;
3066
3067   /* It can't be done in this mode.  Can we open-code it in a wider mode?  */
3068
3069   /* Widening (or narrowing) clz needs special treatment.  */
3070   if (unoptab == clz_optab)
3071     {
3072       temp = widen_leading (mode, op0, target, unoptab);
3073       if (temp)
3074         return temp;
3075
3076       if (GET_MODE_SIZE (mode) == 2 * UNITS_PER_WORD
3077           && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
3078         {
3079           temp = expand_doubleword_clz (mode, op0, target);
3080           if (temp)
3081             return temp;
3082         }
3083
3084       goto try_libcall;
3085     }
3086
3087   if (unoptab == clrsb_optab)
3088     {
3089       temp = widen_leading (mode, op0, target, unoptab);
3090       if (temp)
3091         return temp;
3092       goto try_libcall;
3093     }
3094
3095   /* Widening (or narrowing) bswap needs special treatment.  */
3096   if (unoptab == bswap_optab)
3097     {
3098       /* HImode is special because in this mode BSWAP is equivalent to ROTATE
3099          or ROTATERT.  First try these directly; if this fails, then try the
3100          obvious pair of shifts with allowed widening, as this will probably
3101          be always more efficient than the other fallback methods.  */
3102       if (mode == HImode)
3103         {
3104           rtx_insn *last;
3105           rtx temp1, temp2;
3106
3107           if (optab_handler (rotl_optab, mode) != CODE_FOR_nothing)
3108             {
3109               temp = expand_binop (mode, rotl_optab, op0, GEN_INT (8), target,
3110                                    unsignedp, OPTAB_DIRECT);
3111               if (temp)
3112                 return temp;
3113              }
3114
3115           if (optab_handler (rotr_optab, mode) != CODE_FOR_nothing)
3116             {
3117               temp = expand_binop (mode, rotr_optab, op0, GEN_INT (8), target,
3118                                    unsignedp, OPTAB_DIRECT);
3119               if (temp)
3120                 return temp;
3121             }
3122
3123           last = get_last_insn ();
3124
3125           temp1 = expand_binop (mode, ashl_optab, op0, GEN_INT (8), NULL_RTX,
3126                                 unsignedp, OPTAB_WIDEN);
3127           temp2 = expand_binop (mode, lshr_optab, op0, GEN_INT (8), NULL_RTX,
3128                                 unsignedp, OPTAB_WIDEN);
3129           if (temp1 && temp2)
3130             {
3131               temp = expand_binop (mode, ior_optab, temp1, temp2, target,
3132                                    unsignedp, OPTAB_WIDEN);
3133               if (temp)
3134                 return temp;
3135             }
3136
3137           delete_insns_since (last);
3138         }
3139
3140       temp = widen_bswap (mode, op0, target);
3141       if (temp)
3142         return temp;
3143
3144       if (GET_MODE_SIZE (mode) == 2 * UNITS_PER_WORD
3145           && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
3146         {
3147           temp = expand_doubleword_bswap (mode, op0, target);
3148           if (temp)
3149             return temp;
3150         }
3151
3152       goto try_libcall;
3153     }
3154
3155   if (CLASS_HAS_WIDER_MODES_P (mclass))
3156     for (wider_mode = GET_MODE_WIDER_MODE (mode);
3157          wider_mode != VOIDmode;
3158          wider_mode = GET_MODE_WIDER_MODE (wider_mode))
3159       {
3160         if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
3161           {
3162             rtx xop0 = op0;
3163             rtx_insn *last = get_last_insn ();
3164
3165             /* For certain operations, we need not actually extend
3166                the narrow operand, as long as we will truncate the
3167                results to the same narrowness.  */
3168
3169             xop0 = widen_operand (xop0, wider_mode, mode, unsignedp,
3170                                   (unoptab == neg_optab
3171                                    || unoptab == one_cmpl_optab)
3172                                   && mclass == MODE_INT);
3173
3174             temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
3175                                 unsignedp);
3176
3177             if (temp)
3178               {
3179                 if (mclass != MODE_INT
3180                     || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
3181                   {
3182                     if (target == 0)
3183                       target = gen_reg_rtx (mode);
3184                     convert_move (target, temp, 0);
3185                     return target;
3186                   }
3187                 else
3188                   return gen_lowpart (mode, temp);
3189               }
3190             else
3191               delete_insns_since (last);
3192           }
3193       }
3194
3195   /* These can be done a word at a time.  */
3196   if (unoptab == one_cmpl_optab
3197       && mclass == MODE_INT
3198       && GET_MODE_SIZE (mode) > UNITS_PER_WORD
3199       && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
3200     {
3201       int i;
3202       rtx_insn *insns;
3203
3204       if (target == 0 || target == op0 || !valid_multiword_target_p (target))
3205         target = gen_reg_rtx (mode);
3206
3207       start_sequence ();
3208
3209       /* Do the actual arithmetic.  */
3210       for (i = 0; i < GET_MODE_BITSIZE (mode) / BITS_PER_WORD; i++)
3211         {
3212           rtx target_piece = operand_subword (target, i, 1, mode);
3213           rtx x = expand_unop (word_mode, unoptab,
3214                                operand_subword_force (op0, i, mode),
3215                                target_piece, unsignedp);
3216
3217           if (target_piece != x)
3218             emit_move_insn (target_piece, x);
3219         }
3220
3221       insns = get_insns ();
3222       end_sequence ();
3223
3224       emit_insn (insns);
3225       return target;
3226     }
3227
3228   if (optab_to_code (unoptab) == NEG)
3229     {
3230       /* Try negating floating point values by flipping the sign bit.  */
3231       if (SCALAR_FLOAT_MODE_P (mode))
3232         {
3233           temp = expand_absneg_bit (NEG, mode, op0, target);
3234           if (temp)
3235             return temp;
3236         }
3237
3238       /* If there is no negation pattern, and we have no negative zero,
3239          try subtracting from zero.  */
3240       if (!HONOR_SIGNED_ZEROS (mode))
3241         {
3242           temp = expand_binop (mode, (unoptab == negv_optab
3243                                       ? subv_optab : sub_optab),
3244                                CONST0_RTX (mode), op0, target,
3245                                unsignedp, OPTAB_DIRECT);
3246           if (temp)
3247             return temp;
3248         }
3249     }
3250
3251   /* Try calculating parity (x) as popcount (x) % 2.  */
3252   if (unoptab == parity_optab)
3253     {
3254       temp = expand_parity (mode, op0, target);
3255       if (temp)
3256         return temp;
3257     }
3258
3259   /* Try implementing ffs (x) in terms of clz (x).  */
3260   if (unoptab == ffs_optab)
3261     {
3262       temp = expand_ffs (mode, op0, target);
3263       if (temp)
3264         return temp;
3265     }
3266
3267   /* Try implementing ctz (x) in terms of clz (x).  */
3268   if (unoptab == ctz_optab)
3269     {
3270       temp = expand_ctz (mode, op0, target);
3271       if (temp)
3272         return temp;
3273     }
3274
3275  try_libcall:
3276   /* Now try a library call in this mode.  */
3277   libfunc = optab_libfunc (unoptab, mode);
3278   if (libfunc)
3279     {
3280       rtx_insn *insns;
3281       rtx value;
3282       rtx eq_value;
3283       enum machine_mode outmode = mode;
3284
3285       /* All of these functions return small values.  Thus we choose to
3286          have them return something that isn't a double-word.  */
3287       if (unoptab == ffs_optab || unoptab == clz_optab || unoptab == ctz_optab
3288           || unoptab == clrsb_optab || unoptab == popcount_optab
3289           || unoptab == parity_optab)
3290         outmode
3291           = GET_MODE (hard_libcall_value (TYPE_MODE (integer_type_node),
3292                                           optab_libfunc (unoptab, mode)));
3293
3294       start_sequence ();
3295
3296       /* Pass 1 for NO_QUEUE so we don't lose any increments
3297          if the libcall is cse'd or moved.  */
3298       value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST, outmode,
3299                                        1, op0, mode);
3300       insns = get_insns ();
3301       end_sequence ();
3302
3303       target = gen_reg_rtx (outmode);
3304       eq_value = gen_rtx_fmt_e (optab_to_code (unoptab), mode, op0);
3305       if (GET_MODE_SIZE (outmode) < GET_MODE_SIZE (mode))
3306         eq_value = simplify_gen_unary (TRUNCATE, outmode, eq_value, mode);
3307       else if (GET_MODE_SIZE (outmode) > GET_MODE_SIZE (mode))
3308         eq_value = simplify_gen_unary (ZERO_EXTEND, outmode, eq_value, mode);
3309       emit_libcall_block_1 (insns, target, value, eq_value,
3310                             trapv_unoptab_p (unoptab));
3311
3312       return target;
3313     }
3314
3315   /* It can't be done in this mode.  Can we do it in a wider mode?  */
3316
3317   if (CLASS_HAS_WIDER_MODES_P (mclass))
3318     {
3319       for (wider_mode = GET_MODE_WIDER_MODE (mode);
3320            wider_mode != VOIDmode;
3321            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
3322         {
3323           if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing
3324               || optab_libfunc (unoptab, wider_mode))
3325             {
3326               rtx xop0 = op0;
3327               rtx_insn *last = get_last_insn ();
3328
3329               /* For certain operations, we need not actually extend
3330                  the narrow operand, as long as we will truncate the
3331                  results to the same narrowness.  */
3332               xop0 = widen_operand (xop0, wider_mode, mode, unsignedp,
3333                                     (unoptab == neg_optab
3334                                      || unoptab == one_cmpl_optab
3335                                      || unoptab == bswap_optab)
3336                                     && mclass == MODE_INT);
3337
3338               temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
3339                                   unsignedp);
3340
3341               /* If we are generating clz using wider mode, adjust the
3342                  result.  Similarly for clrsb.  */
3343               if ((unoptab == clz_optab || unoptab == clrsb_optab)
3344                   && temp != 0)
3345                 temp = expand_binop
3346                   (wider_mode, sub_optab, temp,
3347                    gen_int_mode (GET_MODE_PRECISION (wider_mode)
3348                                  - GET_MODE_PRECISION (mode),
3349                                  wider_mode),
3350                    target, true, OPTAB_DIRECT);
3351
3352               /* Likewise for bswap.  */
3353               if (unoptab == bswap_optab && temp != 0)
3354                 {
3355                   gcc_assert (GET_MODE_PRECISION (wider_mode)
3356                               == GET_MODE_BITSIZE (wider_mode)
3357                               && GET_MODE_PRECISION (mode)
3358                                  == GET_MODE_BITSIZE (mode));
3359
3360                   temp = expand_shift (RSHIFT_EXPR, wider_mode, temp,
3361                                        GET_MODE_BITSIZE (wider_mode)
3362                                        - GET_MODE_BITSIZE (mode),
3363                                        NULL_RTX, true);
3364                 }
3365
3366               if (temp)
3367                 {
3368                   if (mclass != MODE_INT)
3369                     {
3370                       if (target == 0)
3371                         target = gen_reg_rtx (mode);
3372                       convert_move (target, temp, 0);
3373                       return target;
3374                     }
3375                   else
3376                     return gen_lowpart (mode, temp);
3377                 }
3378               else
3379                 delete_insns_since (last);
3380             }
3381         }
3382     }
3383
3384   /* One final attempt at implementing negation via subtraction,
3385      this time allowing widening of the operand.  */
3386   if (optab_to_code (unoptab) == NEG && !HONOR_SIGNED_ZEROS (mode))
3387     {
3388       rtx temp;
3389       temp = expand_binop (mode,
3390                            unoptab == negv_optab ? subv_optab : sub_optab,
3391                            CONST0_RTX (mode), op0,
3392                            target, unsignedp, OPTAB_LIB_WIDEN);
3393       if (temp)
3394         return temp;
3395     }
3396
3397   return 0;
3398 }
3399 \f
3400 /* Emit code to compute the absolute value of OP0, with result to
3401    TARGET if convenient.  (TARGET may be 0.)  The return value says
3402    where the result actually is to be found; it is NULL_RTX when none
3403    of the jump-free strategies tried below succeeds.
3404    MODE is the mode of the operand; the mode of the result is
3405    different but can be deduced from MODE.
3406    RESULT_UNSIGNEDP nonzero selects abs_optab, neg_optab and sub_optab
3407    instead of absv_optab, negv_optab and subv_optab.  */
3408
3409 rtx
3410 expand_abs_nojump (enum machine_mode mode, rtx op0, rtx target,
3411                    int result_unsignedp)
3412 {
3413   rtx temp;
3414   /* The V optabs are only considered for integer modes when flag_trapv is set.  */
3415   if (GET_MODE_CLASS (mode) != MODE_INT
3416       || ! flag_trapv)
3417     result_unsignedp = 1;
3418
3419   /* First try to do it with a special abs instruction.  */
3420   temp = expand_unop (mode, result_unsignedp ? abs_optab : absv_optab,
3421                       op0, target, 0);
3422   if (temp != 0)
3423     return temp;
3424
3425   /* For floating point modes, try clearing the sign bit.  */
3426   if (SCALAR_FLOAT_MODE_P (mode))
3427     {
3428       temp = expand_absneg_bit (ABS, mode, op0, target);
3429       if (temp)
3430         return temp;
3431     }
3432
3433   /* If we have a MAX insn, we can do this as MAX (x, -x).  */
3434   if (optab_handler (smax_optab, mode) != CODE_FOR_nothing
3435       && !HONOR_SIGNED_ZEROS (mode))
3436     {
3437       rtx_insn *last = get_last_insn ();
3438
3439       temp = expand_unop (mode, result_unsignedp ? neg_optab : negv_optab,
3440                           op0, NULL_RTX, 0);
3441       if (temp != 0)
3442         temp = expand_binop (mode, smax_optab, op0, temp, target, 0,
3443                              OPTAB_WIDEN);
3444
3445       if (temp != 0)
3446         return temp;
3447       /* The MAX approach failed; discard anything emitted since LAST.  */
3448       delete_insns_since (last);
3449     }
3450
3451   /* If this machine has expensive jumps, we can do integer absolute
3452      value of X as (((signed) x >> (W-1)) ^ x) - ((signed) x >> (W-1)),
3453      where W is the width of MODE.  */
3454
3455   if (GET_MODE_CLASS (mode) == MODE_INT
3456       && BRANCH_COST (optimize_insn_for_speed_p (),
3457                       false) >= 2)
3458     {
3459       rtx extended = expand_shift (RSHIFT_EXPR, mode, op0,
3460                                    GET_MODE_PRECISION (mode) - 1,
3461                                    NULL_RTX, 0);
3462       /* EXTENDED is the ((signed) x >> (W-1)) term of the formula above.  */
3463       temp = expand_binop (mode, xor_optab, extended, op0, target, 0,
3464                            OPTAB_LIB_WIDEN);
3465       if (temp != 0)
3466         temp = expand_binop (mode, result_unsignedp ? sub_optab : subv_optab,
3467                              temp, extended, target, 0, OPTAB_LIB_WIDEN);
3468
3469       if (temp != 0)
3470         return temp;
3471     }
3472
3473   return NULL_RTX;
3474 }
3475 /* As expand_abs_nojump, but fall back to a compare, jump and negate.  */
3476 rtx
3477 expand_abs (enum machine_mode mode, rtx op0, rtx target,
3478             int result_unsignedp, int safe)
3479 {
3480   rtx temp;
3481   rtx_code_label *op1;
3482   /* Same adjustment of RESULT_UNSIGNEDP as expand_abs_nojump makes.  */
3483   if (GET_MODE_CLASS (mode) != MODE_INT
3484       || ! flag_trapv)
3485     result_unsignedp = 1;
3486
3487   temp = expand_abs_nojump (mode, op0, target, result_unsignedp);
3488   if (temp != 0)
3489     return temp;
3490
3491   /* If that does not win, use conditional jump and negate.  */
3492   /* TARGET is kept only if SAFE is nonzero and it passes the checks below.  */
3493   /* It is safe to use the target if it is the same
3494      as the source if this is also a pseudo register */
3495   if (op0 == target && REG_P (op0)
3496       && REGNO (op0) >= FIRST_PSEUDO_REGISTER)
3497     safe = 1;
3498   /* OP1 is the label placed just after the negation.  */
3499   op1 = gen_label_rtx ();
3500   if (target == 0 || ! safe
3501       || GET_MODE (target) != mode
3502       || (MEM_P (target) && MEM_VOLATILE_P (target))
3503       || (REG_P (target)
3504           && REGNO (target) < FIRST_PSEUDO_REGISTER))
3505     target = gen_reg_rtx (mode);
3506   /* Copy OP0 to TARGET, then jump over the negation when TARGET >= 0.  */
3507   emit_move_insn (target, op0);
3508   NO_DEFER_POP;
3509
3510   do_compare_rtx_and_jump (target, CONST0_RTX (mode), GE, 0, mode,
3511                            NULL_RTX, NULL_RTX, op1, -1);
3512   /* Negate TARGET; OP0 is reused to record where the negated value landed.  */
3513   op0 = expand_unop (mode, result_unsignedp ? neg_optab : negv_optab,
3514                      target, target, 0);
3515   if (op0 != target)
3516     emit_move_insn (target, op0);
3517   emit_label (op1);
3518   OK_DEFER_POP;
3519   return target;
3520 }
3521
3522 /* Emit code to compute the one's complement absolute value of OP0
3523    (if (OP0 < 0) OP0 = ~OP0), with result to TARGET if convenient.
3524    (TARGET may be NULL_RTX.)  The return value says where the result
3525    actually is to be found; it is NULL_RTX for floating point modes
3526    and when neither strategy tried below succeeds.
3527    MODE is the mode of the operand; the mode of the result is
3528    different but can be deduced from MODE.  */
3529
3530 rtx
3531 expand_one_cmpl_abs_nojump (enum machine_mode mode, rtx op0, rtx target)
3532 {
3533   rtx temp;
3534
3535   /* Not applicable for floating point modes.  */
3536   if (FLOAT_MODE_P (mode))
3537     return NULL_RTX;
3538
3539   /* If we have a MAX insn, we can do this as MAX (x, ~x).  */
3540   if (optab_handler (smax_optab, mode) != CODE_FOR_nothing)
3541     {
3542       rtx_insn *last = get_last_insn ();
3543
3544       temp = expand_unop (mode, one_cmpl_optab, op0, NULL_RTX, 0);
3545       if (temp != 0)
3546         temp = expand_binop (mode, smax_optab, op0, temp, target, 0,
3547                              OPTAB_WIDEN);
3548
3549       if (temp != 0)
3550         return temp;
3551       /* The MAX approach failed; discard anything emitted since LAST.  */
3552       delete_insns_since (last);
3553     }
3554
3555   /* If this machine has expensive jumps, we can do one's complement
3556      absolute value of X as (((signed) x >> (W-1)) ^ x).  */
3557
3558   if (GET_MODE_CLASS (mode) == MODE_INT
3559       && BRANCH_COST (optimize_insn_for_speed_p (),
3560                      false) >= 2)
3561     {
3562       rtx extended = expand_shift (RSHIFT_EXPR, mode, op0,
3563                                    GET_MODE_PRECISION (mode) - 1,
3564                                    NULL_RTX, 0);
3565       /* EXTENDED is the ((signed) x >> (W-1)) term of the formula above.  */
3566       temp = expand_binop (mode, xor_optab, extended, op0, target, 0,
3567                            OPTAB_LIB_WIDEN);
3568
3569       if (temp != 0)
3570         return temp;
3571     }
3572
3573   return NULL_RTX;
3574 }
3575
3576 /* A subroutine of expand_copysign, perform the copysign operation using the
3577    abs and neg primitives advertised to exist on the target.  The assumption
3578    is that we have a split register file, and leaving op0 in fp registers,
3579    and not playing with subregs so much, will help the register allocator.  */
3580
3581 static rtx
3582 expand_copysign_absneg (enum machine_mode mode, rtx op0, rtx op1, rtx target,
3583                         int bitpos, bool op0_is_abs)
3584 {
3585   enum machine_mode imode;
3586   enum insn_code icode;
3587   rtx sign;
3588   rtx_code_label *label;
3589   /* Returns NULL_RTX if no integer mode matches MODE or the abs expansion fails.  */
3590   if (target == op1)
3591     target = NULL_RTX;
3592
3593   /* Check if the back end provides an insn that handles signbit for the
3594      argument's mode. */
3595   icode = optab_handler (signbit_optab, mode);
3596   if (icode != CODE_FOR_nothing)
3597     {
3598       imode = insn_data[(int) icode].operand[0].mode;
3599       sign = gen_reg_rtx (imode);
3600       emit_unop_insn (icode, sign, op1, UNKNOWN);
3601     }
3602   else
3603     {
3604       if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
3605         {
3606           imode = int_mode_for_mode (mode);
3607           if (imode == BLKmode)
3608             return NULL_RTX;
3609           op1 = gen_lowpart (imode, op1);
3610         }
3611       else
3612         {
3613           int word;
3614           /* Only the word of OP1 that holds bit BITPOS is examined.  */
3615           imode = word_mode;
3616           if (FLOAT_WORDS_BIG_ENDIAN)
3617             word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
3618           else
3619             word = bitpos / BITS_PER_WORD;
3620           bitpos = bitpos % BITS_PER_WORD;
3621           op1 = operand_subword_force (op1, word, mode);
3622         }
3623       /* SIGN = OP1 & MASK, where MASK has only bit BITPOS set.  */
3624       wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
3625       sign = expand_binop (imode, and_optab, op1,
3626                            immed_wide_int_const (mask, imode),
3627                            NULL_RTX, 1, OPTAB_LIB_WIDEN);
3628     }
3629   /* Make TARGET hold abs (OP0), or a plain copy when OP0_IS_ABS says it already is one.  */
3630   if (!op0_is_abs)
3631     {
3632       op0 = expand_unop (mode, abs_optab, op0, target, 0);
3633       if (op0 == NULL)
3634         return NULL_RTX;
3635       target = op0;
3636     }
3637   else
3638     {
3639       if (target == NULL_RTX)
3640         target = copy_to_reg (op0);
3641       else
3642         emit_move_insn (target, op0);
3643     }
3644   /* Branch to LABEL, skipping the negation, when SIGN is zero.  */
3645   label = gen_label_rtx ();
3646   emit_cmp_and_jump_insns (sign, const0_rtx, EQ, NULL_RTX, imode, 1, label);
3647   /* Negate into TARGET; a constant OP0 is folded rather than expanded.  */
3648   if (CONST_DOUBLE_AS_FLOAT_P (op0))
3649     op0 = simplify_unary_operation (NEG, mode, op0, mode);
3650   else
3651     op0 = expand_unop (mode, neg_optab, op0, target, 0);
3652   if (op0 != target)
3653     emit_move_insn (target, op0);
3654
3655   emit_label (label);
3656
3657   return target;
3658 }
3659
3660
3661 /* A subroutine of expand_copysign, perform the entire copysign operation
3662    with integer bitmasks.  BITPOS is the position of the sign bit; OP0_IS_ABS
3663    is true if op0 is known to have its sign bit clear.  */
3664
3665 static rtx
3666 expand_copysign_bit (enum machine_mode mode, rtx op0, rtx op1, rtx target,
3667                      int bitpos, bool op0_is_abs)
3668 {
3669   enum machine_mode imode;
3670   int word, nwords, i;
3671   rtx temp;
3672   rtx_insn *insns;
3673   /* Choose IMODE, the integer mode to mask in; NULL_RTX is returned if there is none.  */
3674   if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
3675     {
3676       imode = int_mode_for_mode (mode);
3677       if (imode == BLKmode)
3678         return NULL_RTX;
3679       word = 0;
3680       nwords = 1;
3681     }
3682   else
3683     {
3684       imode = word_mode;
3685       /* WORD is the index of the word holding the sign bit; BITPOS becomes relative to it.  */
3686       if (FLOAT_WORDS_BIG_ENDIAN)
3687         word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
3688       else
3689         word = bitpos / BITS_PER_WORD;
3690       bitpos = bitpos % BITS_PER_WORD;
3691       nwords = (GET_MODE_BITSIZE (mode) + BITS_PER_WORD - 1) / BITS_PER_WORD;
3692     }
3693   /* MASK has only bit BITPOS set, in the precision of IMODE.  */
3694   wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
3695   /* Use a fresh pseudo rather than building the result over either input.  */
3696   if (target == 0
3697       || target == op0
3698       || target == op1
3699       || (nwords > 1 && !valid_multiword_target_p (target)))
3700     target = gen_reg_rtx (mode);
3701
3702   if (nwords > 1)
3703     {
3704       start_sequence ();
3705       /* Copy OP0 word by word; only word WORD gets the sign-bit treatment.  */
3706       for (i = 0; i < nwords; ++i)
3707         {
3708           rtx targ_piece = operand_subword (target, i, 1, mode);
3709           rtx op0_piece = operand_subword_force (op0, i, mode);
3710
3711           if (i == word)
3712             {
3713               if (!op0_is_abs)
3714                 op0_piece
3715                   = expand_binop (imode, and_optab, op0_piece,
3716                                   immed_wide_int_const (~mask, imode),
3717                                   NULL_RTX, 1, OPTAB_LIB_WIDEN);
3718               op1 = expand_binop (imode, and_optab,
3719                                   operand_subword_force (op1, i, mode),
3720                                   immed_wide_int_const (mask, imode),
3721                                   NULL_RTX, 1, OPTAB_LIB_WIDEN);
3722               /* (OP0 word & ~MASK) | (OP1 word & MASK).  */
3723               temp = expand_binop (imode, ior_optab, op0_piece, op1,
3724                                    targ_piece, 1, OPTAB_LIB_WIDEN);
3725               if (temp != targ_piece)
3726                 emit_move_insn (targ_piece, temp);
3727             }
3728           else
3729             emit_move_insn (targ_piece, op0_piece);
3730         }
3731
3732       insns = get_insns ();
3733       end_sequence ();
3734
3735       emit_insn (insns);
3736     }
3737   else
3738     {
3739       op1 = expand_binop (imode, and_optab, gen_lowpart (imode, op1),
3740                           immed_wide_int_const (mask, imode),
3741                           NULL_RTX, 1, OPTAB_LIB_WIDEN);
3742
3743       op0 = gen_lowpart (imode, op0);
3744       if (!op0_is_abs)
3745         op0 = expand_binop (imode, and_optab, op0,
3746                             immed_wide_int_const (~mask, imode),
3747                             NULL_RTX, 1, OPTAB_LIB_WIDEN);
3748       /* Combine in IMODE, then view the result as MODE again.  */
3749       temp = expand_binop (imode, ior_optab, op0, op1,
3750                            gen_lowpart (imode, target), 1, OPTAB_LIB_WIDEN);
3751       target = lowpart_subreg_maybe_copy (mode, temp, imode);
3752     }
3753
3754   return target;
3755 }
3756
3757 /* Expand the C99 copysign operation.  OP0 and OP1 must be the same
3758    scalar floating point mode.  Return NULL if we do not know how to
3759    expand the operation inline.  */
3760
3761 rtx
3762 expand_copysign (rtx op0, rtx op1, rtx target)
3763 {
3764   enum machine_mode mode = GET_MODE (op0);
3765   const struct real_format *fmt;
3766   bool op0_is_abs;
3767   rtx temp;
3768   /* Both mode requirements stated above are asserted, not merely assumed.  */
3769   gcc_assert (SCALAR_FLOAT_MODE_P (mode));
3770   gcc_assert (GET_MODE (op1) == mode);
3771
3772   /* First try to do it with a special instruction.  */
3773   temp = expand_binop (mode, copysign_optab, op0, op1,
3774                        target, 0, OPTAB_DIRECT);
3775   if (temp)
3776     return temp;
3777   /* Give up if MODE has no real format or the format has no signed zero.  */
3778   fmt = REAL_MODE_FORMAT (mode);
3779   if (fmt == NULL || !fmt->has_signed_zero)
3780     return NULL_RTX;
3781   /* A constant OP0 is replaced by its absolute value here, at expand time.  */
3782   op0_is_abs = false;
3783   if (CONST_DOUBLE_AS_FLOAT_P (op0))
3784     {
3785       if (real_isneg (CONST_DOUBLE_REAL_VALUE (op0)))
3786         op0 = simplify_unary_operation (ABS, mode, op0, mode);
3787       op0_is_abs = true;
3788     }
3789   /* Try abs/neg if signbit_ro is valid and OP0 is constant or both insns exist.  */
3790   if (fmt->signbit_ro >= 0
3791       && (CONST_DOUBLE_AS_FLOAT_P (op0)
3792           || (optab_handler (neg_optab, mode) != CODE_FOR_nothing
3793               && optab_handler (abs_optab, mode) != CODE_FOR_nothing)))
3794     {
3795       temp = expand_copysign_absneg (mode, op0, op1, target,
3796                                      fmt->signbit_ro, op0_is_abs);
3797       if (temp)
3798         return temp;
3799     }
3800   /* Otherwise use integer bitmasks at signbit_rw, provided that position is valid.  */
3801   if (fmt->signbit_rw < 0)
3802     return NULL_RTX;
3803   return expand_copysign_bit (mode, op0, op1, target,
3804                               fmt->signbit_rw, op0_is_abs);
3805 }
3806 \f
3807 /* Generate an instruction whose insn-code is ICODE,
3808    with two operands: an output TARGET and an input OP0.
3809    TARGET *must* be nonzero, and the output is always stored there.
3810    CODE is an rtx code such that (CODE OP0) is an rtx that describes
3811    the value that is stored into TARGET.
3812    If CODE is UNKNOWN, add_equal_note is never called for the result.
3813    Return false if expansion failed.  */
3814
3815 bool
3816 maybe_emit_unop_insn (enum insn_code icode, rtx target, rtx op0,
3817                       enum rtx_code code)
3818 {
3819   struct expand_operand ops[2];
3820   rtx pat;
3821
3822   create_output_operand (&ops[0], target, GET_MODE (target));
3823   create_input_operand (&ops[1], op0, GET_MODE (op0));
3824   pat = maybe_gen_insn (icode, 2, ops);
3825   if (!pat)
3826     return false;
3827   /* Only a multi-insn expansion gets a note describing (CODE OP0).  */
3828   if (INSN_P (pat) && NEXT_INSN (as_a <rtx_insn *> (pat)) != NULL_RTX
3829       && code != UNKNOWN)
3830     add_equal_note (as_a <rtx_insn *> (pat), ops[0].value, code, ops[1].value,
3831                     NULL_RTX);
3832
3833   emit_insn (pat);
3834   /* The output operand may have been replaced; copy its value to TARGET.  */
3835   if (ops[0].value != target)
3836     emit_move_insn (target, ops[0].value);
3837   return true;
3838 }
3839 /* Generate an instruction whose insn-code is ICODE,
3840    with two operands: an output TARGET and an input OP0.
3841    TARGET *must* be nonzero, and the output is always stored there.
3842    CODE is an rtx code such that (CODE OP0) is an rtx that describes
3843    the value that is stored into TARGET.  Success is asserted.  */
3844
3845 void
3846 emit_unop_insn (enum insn_code icode, rtx target, rtx op0, enum rtx_code code)
3847 {
3848   bool ok = maybe_emit_unop_insn (icode, target, op0, code);
3849   gcc_assert (ok);
3850 }
3851 \f
3852 struct no_conflict_data  /* Argument block for no_conflict_move_test.  */
3853 {
3854   rtx target;               /* A store overlapping this sets must_stay.  */
3855   rtx_insn *first, *insn;   /* Head of the insn list; insn being examined.  */
3856   bool must_stay;           /* Result: INSN has to stay in the list.  */
3857 };
3858
3859 /* Called via note_stores by emit_libcall_block_1.  Set P->must_stay if
3860    the currently examined clobber / store has to stay in the list of
3861    insns that constitute the actual libcall block.  */
3862 static void
3863 no_conflict_move_test (rtx dest, const_rtx set, void *p0)
3864 {
3865   struct no_conflict_data *p= (struct no_conflict_data *) p0;
3866   /* DEST is the location being stored to or clobbered; SET is the rtx doing so.  */
3867   /* If this insn directly contributes to setting the target, it must stay.  */
3868   if (reg_overlap_mentioned_p (p->target, dest))
3869     p->must_stay = true;
3870   /* If we haven't committed to keeping any other insns in the list yet,
3871      there is nothing more to check.  */
3872   else if (p->insn == p->first)
3873     return;
3874   /* If this insn sets / clobbers a register that feeds one of the insns
3875      already in the list, this insn has to stay too.  */
3876   else if (reg_overlap_mentioned_p (dest, PATTERN (p->first))
3877            || (CALL_P (p->first) && (find_reg_fusage (p->first, USE, dest)))
3878            || reg_used_between_p (dest, p->first, p->insn)
3879            /* Likewise if this insn depends on a register set by a previous
3880               insn in the list, or if it sets a result (presumably a hard
3881               register) that is set or clobbered by a previous insn.
3882               N.B. the modified_*_p (SET_DEST...) tests applied to a MEM
3883               SET_DEST perform the former check on the address, and the latter
3884               check on the MEM.  */
3885            || (GET_CODE (set) == SET
3886                && (modified_in_p (SET_SRC (set), p->first)
3887                    || modified_in_p (SET_DEST (set), p->first)
3888                    || modified_between_p (SET_SRC (set), p->first, p->insn)
3889                    || modified_between_p (SET_DEST (set), p->first, p->insn))))
3890     p->must_stay = true;
3891 }
3892
3893 \f
3894 /* Emit code to make a call to a constant function or a library call.
3895
3896    INSNS is a list containing all insns emitted in the call.
3897    These insns leave the result in RESULT.  Our job is to copy RESULT
3898    to TARGET, which is logically equivalent to EQUIV.
3899    EQUIV_MAY_TRAP is ORed with may_trap_p (EQUIV) when handling EH notes.
3900    We first emit any insns that set a pseudo on the assumption that these are
3901    loading constants into registers; doing so allows them to be safely cse'ed
3902    between blocks.  Then we emit all the other insns in the block, followed by
3903    an insn to move RESULT to TARGET.  This last insn will have a REG_EQUAL
3904    note with an operand of EQUIV.  */
3905
3906 static void
3907 emit_libcall_block_1 (rtx_insn *insns, rtx target, rtx result, rtx equiv,
3908                       bool equiv_may_trap)
3909 {
3910   rtx final_dest = target;
3911   rtx_insn *next, *last, *insn;
3912   /* FINAL_DEST keeps the caller's TARGET in case a scratch pseudo replaces it.  */
3913   /* If this is a reg with REG_USERVAR_P set, then it could possibly turn
3914      into a MEM later.  Protect the libcall block from this change.  */
3915   if (! REG_P (target) || REG_USERVAR_P (target))
3916     target = gen_reg_rtx (GET_MODE (target));
3917
3918   /* If we're using non-call exceptions, a libcall corresponding to an
3919      operation that may trap may also trap.  */
3920   /* ??? See the comment in front of make_reg_eh_region_note.  */
3921   if (cfun->can_throw_non_call_exceptions
3922       && (equiv_may_trap || may_trap_p (equiv)))
3923     {
3924       for (insn = insns; insn; insn = NEXT_INSN (insn))
3925         if (CALL_P (insn))
3926           {
3927             rtx note = find_reg_note (insn, REG_EH_REGION, NULL_RTX);
3928             if (note)
3929               {
3930                 int lp_nr = INTVAL (XEXP (note, 0));
3931                 if (lp_nr == 0 || lp_nr == INT_MIN)
3932                   remove_note (insn, note);
3933               }
3934           }
3935     }
3936   else
3937     {
3938       /* Look for any CALL_INSNs in this sequence, and attach a REG_EH_REGION
3939          reg note to indicate that this call cannot throw or execute a nonlocal
3940          goto (unless there is already a REG_EH_REGION note, in which case
3941          we update it).  */
3942       for (insn = insns; insn; insn = NEXT_INSN (insn))
3943         if (CALL_P (insn))
3944           make_reg_eh_region_note_nothrow_nononlocal (insn);
3945     }
3946
3947   /* First emit all insns that set pseudos.  Remove them from the list as
3948      we go.  Avoid insns that set pseudos which were referenced in previous
3949      insns.  These can be generated by move_by_pieces, for example,
3950      to update an address.  Similarly, avoid insns that reference things
3951      set in previous insns.  */
3952
3953   for (insn = insns; insn; insn = next)
3954     {
3955       rtx set = single_set (insn);
3956       /* Fetch NEXT now: INSN may be unlinked from the list below.  */
3957       next = NEXT_INSN (insn);
3958
3959       if (set != 0 && REG_P (SET_DEST (set))
3960           && REGNO (SET_DEST (set)) >= FIRST_PSEUDO_REGISTER)
3961         {
3962           struct no_conflict_data data;
3963           /* Ask no_conflict_move_test whether INSN must keep its place in the list.  */
3964           data.target = const0_rtx;
3965           data.first = insns;
3966           data.insn = insn;
3967           data.must_stay = 0;
3968           note_stores (PATTERN (insn), no_conflict_move_test, &data);
3969           if (! data.must_stay)
3970             {
3971               if (PREV_INSN (insn))
3972                 SET_NEXT_INSN (PREV_INSN (insn)) = next;
3973               else
3974                 insns = next;
3975
3976               if (next)
3977                 SET_PREV_INSN (next) = PREV_INSN (insn);
3978               /* INSN is now unlinked from INSNS; emit it ahead of the rest.  */
3979               add_insn (insn);
3980             }
3981         }
3982
3983       /* Some ports use a loop to copy large arguments onto the stack.
3984          Don't move anything outside such a loop.  */
3985       if (LABEL_P (insn))
3986         break;
3987     }
3988
3989   /* Write the remaining insns followed by the final copy.  */
3990   for (insn = insns; insn; insn = next)
3991     {
3992       next = NEXT_INSN (insn);
3993
3994       add_insn (insn);
3995     }
3996   /* The final copy into TARGET is the insn that gets the REG_EQUAL note.  */
3997   last = emit_move_insn (target, result);
3998   set_dst_reg_note (last, REG_EQUAL, copy_rtx (equiv), target);
3999   /* If a scratch pseudo stood in for the caller's TARGET, copy the value out.  */
4000   if (final_dest != target)
4001     emit_move_insn (final_dest, target);
4002 }
4003 /* Wrapper around emit_libcall_block_1 that passes EQUIV_MAY_TRAP as false.  */
4004 void
4005 emit_libcall_block (rtx insns, rtx target, rtx result, rtx equiv)
4006 {
4007   emit_libcall_block_1 (safe_as_a <rtx_insn *> (insns),
4008                         target, result, equiv, false);
4009 }
4010 \f
4011 /* Nonzero if we can perform a comparison of mode MODE straightforwardly.
4012    PURPOSE describes how this comparison will be used.  CODE is the rtx
4013    comparison code we will be using.
4014    MODE and then each wider mode is tried; 1 on first success, else 0.
4015    ??? Actually, CODE is slightly weaker than that.  A target is still
4016    required to implement all of the normal bcc operations, but not
4017    required to implement all (or any) of the unordered bcc operations.  */
4018
4019 int
4020 can_compare_p (enum rtx_code code, enum machine_mode mode,
4021                enum can_compare_purpose purpose)
4022 {
4023   rtx test;  /* Dummy comparison matched against the insn's operand predicate.  */
4024   test = gen_rtx_fmt_ee (code, mode, const0_rtx, const0_rtx);
4025   do
4026     {
4027       enum insn_code icode;
4028       /* Each PURPOSE consults its own optab: cbranch, cstore or cmov.  */
4029       if (purpose == ccp_jump
4030           && (icode = optab_handler (cbranch_optab, mode)) != CODE_FOR_nothing
4031           && insn_operand_matches (icode, 0, test))
4032         return 1;
4033       if (purpose == ccp_store_flag
4034           && (icode = optab_handler (cstore_optab, mode)) != CODE_FOR_nothing
4035           && insn_operand_matches (icode, 1, test))
4036         return 1;
4037       if (purpose == ccp_cmov
4038           && optab_handler (cmov_optab, mode) != CODE_FOR_nothing)
4039         return 1;
4040       /* Nothing matched in this mode; retarget TEST at the next wider one.  */
4041       mode = GET_MODE_WIDER_MODE (mode);
4042       PUT_MODE (test, mode);
4043     }
4044   while (mode != VOIDmode);
4045
4046   return 0;
4047 }
4048
4049 /* This function is called when we are going to emit a compare instruction that
4050    compares the values found in *PX and *PY, using the rtl operator COMPARISON.
4051
4052    *PMODE is the mode of the inputs (in case they are const_int).
4053    *PUNSIGNEDP nonzero says that the operands are unsigned;
4054    this matters if they need to be widened (as given by METHODS).
4055
4056    If they have mode BLKmode, then SIZE specifies the size of both operands.
4057
4058    This function performs all the setup necessary so that the caller only has
4059    to emit a single comparison insn.  This setup can involve doing a BLKmode
4060    comparison or emitting a library call to perform the comparison if no insn
4061    is available to handle it.
4062    The values which are passed in through pointers can be modified; the caller
4063    should perform the comparison on the modified values.  Constant
4064    comparisons must have already been folded.  */
4065
4066 static void
4067 prepare_cmp_insn (rtx x, rtx y, enum rtx_code comparison, rtx size,
4068                   int unsignedp, enum optab_methods methods,
4069                   rtx *ptest, enum machine_mode *pmode)
4070 {
4071   enum machine_mode mode = *pmode;
4072   rtx libfunc, test;
4073   enum machine_mode cmp_mode;
4074   enum mode_class mclass;
4075
4076   /* The other methods are not needed.  */
4077   gcc_assert (methods == OPTAB_DIRECT || methods == OPTAB_WIDEN
4078               || methods == OPTAB_LIB_WIDEN);
4079
4080   /* If we are optimizing, force expensive constants into a register.  */
4081   if (CONSTANT_P (x) && optimize
4082       && (rtx_cost (x, COMPARE, 0, optimize_insn_for_speed_p ())
4083           > COSTS_N_INSNS (1)))
4084     x = force_reg (mode, x);
4085
4086   if (CONSTANT_P (y) && optimize
4087       && (rtx_cost (y, COMPARE, 1, optimize_insn_for_speed_p ())
4088           > COSTS_N_INSNS (1)))
4089     y = force_reg (mode, y);
4090
4091 #ifdef HAVE_cc0
4092   /* Make sure if we have a canonical comparison.  The RTL
4093      documentation states that canonical comparisons are required only
4094      for targets which have cc0.  */
4095   gcc_assert (!CONSTANT_P (x) || CONSTANT_P (y));
4096 #endif
4097
4098   /* Don't let both operands fail to indicate the mode.  */
4099   if (GET_MODE (x) == VOIDmode && GET_MODE (y) == VOIDmode)
4100     x = force_reg (mode, x);
4101   if (mode == VOIDmode)
4102     mode = GET_MODE (x) != VOIDmode ? GET_MODE (x) : GET_MODE (y);
4103
4104   /* Handle all BLKmode compares.  */
4105
4106   if (mode == BLKmode)
4107     {
4108       enum machine_mode result_mode;
4109       enum insn_code cmp_code;
4110       tree length_type;
4111       rtx libfunc;
4112       rtx result;
4113       rtx opalign
4114         = GEN_INT (MIN (MEM_ALIGN (x), MEM_ALIGN (y)) / BITS_PER_UNIT);
4115
4116       gcc_assert (size);
4117
4118       /* Try to use a memory block compare insn - either cmpstr
4119          or cmpmem will do.  */
4120       for (cmp_mode = GET_CLASS_NARROWEST_MODE (MODE_INT);
4121            cmp_mode != VOIDmode;
4122            cmp_mode = GET_MODE_WIDER_MODE (cmp_mode))
4123         {
4124           cmp_code = direct_optab_handler (cmpmem_optab, cmp_mode);
4125           if (cmp_code == CODE_FOR_nothing)
4126             cmp_code = direct_optab_handler (cmpstr_optab, cmp_mode);
4127           if (cmp_code == CODE_FOR_nothing)
4128             cmp_code = direct_optab_handler (cmpstrn_optab, cmp_mode);
4129           if (cmp_code == CODE_FOR_nothing)
4130             continue;
4131
4132           /* Must make sure the size fits the insn's mode.  */
4133           if ((CONST_INT_P (size)
4134                && INTVAL (size) >= (1 << GET_MODE_BITSIZE (cmp_mode)))
4135               || (GET_MODE_BITSIZE (GET_MODE (size))
4136                   > GET_MODE_BITSIZE (cmp_mode)))
4137             continue;
4138
4139           result_mode = insn_data[cmp_code].operand[0].mode;
4140           result = gen_reg_rtx (result_mode);
4141           size = convert_to_mode (cmp_mode, size, 1);
4142           emit_insn (GEN_FCN (cmp_code) (result, x, y, size, opalign));
4143
4144           *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, result, const0_rtx);
4145           *pmode = result_mode;
4146           return;
4147         }
4148
4149       if (methods != OPTAB_LIB && methods != OPTAB_LIB_WIDEN)
4150         goto fail;
4151
4152       /* Otherwise call a library function, memcmp.  */
4153       libfunc = memcmp_libfunc;
4154       length_type = sizetype;
4155       result_mode = TYPE_MODE (integer_type_node);
4156       cmp_mode = TYPE_MODE (length_type);
4157       size = convert_to_mode (TYPE_MODE (length_type), size,
4158                               TYPE_UNSIGNED (length_type));
4159
4160       result = emit_library_call_value (libfunc, 0, LCT_PURE,
4161                                         result_mode, 3,
4162                                         XEXP (x, 0), Pmode,
4163                                         XEXP (y, 0), Pmode,
4164                                         size, cmp_mode);
4165       x = result;
4166       y = const0_rtx;
4167       mode = result_mode;
4168       methods = OPTAB_LIB_WIDEN;
4169       unsignedp = false;
4170     }
4171
4172   /* Don't allow operands to the compare to trap, as that can put the
4173      compare and branch in different basic blocks.  */
4174   if (cfun->can_throw_non_call_exceptions)
4175     {
4176       if (may_trap_p (x))
4177         x = force_reg (mode, x);
4178       if (may_trap_p (y))
4179         y = force_reg (mode, y);
4180     }
4181
4182   if (GET_MODE_CLASS (mode) == MODE_CC)
4183     {
4184       gcc_assert (can_compare_p (comparison, CCmode, ccp_jump));
4185       *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, x, y);
4186       return;
4187     }
4188
4189   mclass = GET_MODE_CLASS (mode);
4190   test = gen_rtx_fmt_ee (comparison, VOIDmode, x, y);
4191   cmp_mode = mode;
4192   do
4193    {
4194       enum insn_code icode;
4195       icode = optab_handler (cbranch_optab, cmp_mode);
4196       if (icode != CODE_FOR_nothing
4197           && insn_operand_matches (icode, 0, test))
4198         {
4199           rtx_insn *last = get_last_insn ();
4200           rtx op0 = prepare_operand (icode, x, 1, mode, cmp_mode, unsignedp);
4201           rtx op1 = prepare_operand (icode, y, 2, mode, cmp_mode, unsignedp);
4202           if (op0 && op1
4203               && insn_operand_matches (icode, 1, op0)
4204               && insn_operand_matches (icode, 2, op1))
4205             {
4206               XEXP (test, 0) = op0;
4207               XEXP (test, 1) = op1;
4208               *ptest = test;
4209               *pmode = cmp_mode;
4210               return;
4211             }
4212           delete_insns_since (last);
4213         }
4214
4215       if (methods == OPTAB_DIRECT || !CLASS_HAS_WIDER_MODES_P (mclass))
4216         break;
4217       cmp_mode = GET_MODE_WIDER_MODE (cmp_mode);
4218     }
4219   while (cmp_mode != VOIDmode);
4220
4221   if (methods != OPTAB_LIB_WIDEN)
4222     goto fail;
4223
4224   if (!SCALAR_FLOAT_MODE_P (mode))
4225     {
4226       rtx result;
4227       enum machine_mode ret_mode;
4228
4229       /* Handle a libcall just for the mode we are using.  */
4230       libfunc = optab_libfunc (cmp_optab, mode);
4231       gcc_assert (libfunc);
4232
4233       /* If we want unsigned, and this mode has a distinct unsigned
4234          comparison routine, use that.  */
4235       if (unsignedp)
4236         {
4237           rtx ulibfunc = optab_libfunc (ucmp_optab, mode);
4238           if (ulibfunc)
4239             libfunc = ulibfunc;
4240         }
4241
4242       ret_mode = targetm.libgcc_cmp_return_mode ();
4243       result = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
4244                                         ret_mode, 2, x, mode, y, mode);
4245
4246       /* There are two kinds of comparison routines. Biased routines
4247          return 0/1/2, and unbiased routines return -1/0/1. Other parts
4248          of gcc expect that the comparison operation is equivalent
4249          to the modified comparison. For signed comparisons compare the
4250          result against 1 in the biased case, and zero in the unbiased
4251          case. For unsigned comparisons always compare against 1 after
4252          biasing the unbiased result by adding 1. This gives us a way to
4253          represent LTU.
4254          The comparisons in the fixed-point helper library are always
4255          biased.  */
4256       x = result;
4257       y = const1_rtx;
4258
4259       if (!TARGET_LIB_INT_CMP_BIASED && !ALL_FIXED_POINT_MODE_P (mode))
4260         {
4261           if (unsignedp)
4262             x = plus_constant (ret_mode, result, 1);
4263           else
4264             y = const0_rtx;
4265         }
4266
4267       *pmode = word_mode;
4268       prepare_cmp_insn (x, y, comparison, NULL_RTX, unsignedp, methods,
4269                         ptest, pmode);
4270     }
4271   else
4272     prepare_float_lib_cmp (x, y, comparison, ptest, pmode);
4273
4274   return;
4275
4276  fail:
4277   *ptest = NULL_RTX;
4278 }
4279
4280 /* Before emitting an insn with code ICODE, make sure that X, which is going
4281    to be used for operand OPNUM of the insn, is converted from mode MODE to
4282    WIDER_MODE (UNSIGNEDP determines whether it is an unsigned conversion), and
4283    that it is accepted by the operand predicate.  Return the new value.  */
4284
4285 rtx
4286 prepare_operand (enum insn_code icode, rtx x, int opnum, enum machine_mode mode,
4287                  enum machine_mode wider_mode, int unsignedp)
4288 {
4289   if (mode != wider_mode)
4290     x = convert_modes (wider_mode, mode, x, unsignedp);
4291
4292   if (!insn_operand_matches (icode, opnum, x))
4293     {
4294       if (reload_completed)
4295         return NULL_RTX;
4296       x = copy_to_mode_reg (insn_data[(int) icode].operand[opnum].mode, x);
4297     }
4298
4299   return x;
4300 }
4301
4302 /* Subroutine of emit_cmp_and_jump_insns; this function is called when we know
4303    we can do the branch.  */
4304
4305 static void
4306 emit_cmp_and_jump_insn_1 (rtx test, enum machine_mode mode, rtx label, int prob)
4307 {
4308   enum machine_mode optab_mode;
4309   enum mode_class mclass;
4310   enum insn_code icode;
4311   rtx_insn *insn;
4312
4313   mclass = GET_MODE_CLASS (mode);
4314   optab_mode = (mclass == MODE_CC) ? CCmode : mode;
4315   icode = optab_handler (cbranch_optab, optab_mode);
4316
4317   gcc_assert (icode != CODE_FOR_nothing);
4318   gcc_assert (insn_operand_matches (icode, 0, test));
4319   insn = emit_jump_insn (GEN_FCN (icode) (test, XEXP (test, 0),
4320                                           XEXP (test, 1), label));
4321   if (prob != -1
4322       && profile_status_for_fn (cfun) != PROFILE_ABSENT
4323       && insn
4324       && JUMP_P (insn)
4325       && any_condjump_p (insn)
4326       && !find_reg_note (insn, REG_BR_PROB, 0))
4327     add_int_reg_note (insn, REG_BR_PROB, prob);
4328 }
4329
4330 /* Generate code to compare X with Y so that the condition codes are
4331    set and to jump to LABEL if the condition is true.  If X is a
4332    constant and Y is not a constant, then the comparison is swapped to
4333    ensure that the comparison RTL has the canonical form.
4334
4335    UNSIGNEDP nonzero says that X and Y are unsigned; this matters if they
4336    need to be widened.  UNSIGNEDP is also used to select the proper
4337    branch condition code.
4338
4339    If X and Y have mode BLKmode, then SIZE specifies the size of both X and Y.
4340
4341    MODE is the mode of the inputs (in case they are const_int).
4342
4343    COMPARISON is the rtl operator to compare with (EQ, NE, GT, etc.).
4344    It will be potentially converted into an unsigned variant based on
4345    UNSIGNEDP to select a proper jump instruction.
4346
4347    PROB is the probability of jumping to LABEL.  */
4348
4349 void
4350 emit_cmp_and_jump_insns (rtx x, rtx y, enum rtx_code comparison, rtx size,
4351                          enum machine_mode mode, int unsignedp, rtx label,
4352                          int prob)
4353 {
4354   rtx op0 = x, op1 = y;
4355   rtx test;
4356
4357   /* Swap operands and condition to ensure canonical RTL.  */
4358   if (swap_commutative_operands_p (x, y)
4359       && can_compare_p (swap_condition (comparison), mode, ccp_jump))
4360     {
4361       op0 = y, op1 = x;
4362       comparison = swap_condition (comparison);
4363     }
4364
4365   /* If OP0 is still a constant, then both X and Y must be constants
4366      or the opposite comparison is not supported.  Force X into a register
4367      to create canonical RTL.  */
4368   if (CONSTANT_P (op0))
4369     op0 = force_reg (mode, op0);
4370
4371   if (unsignedp)
4372     comparison = unsigned_condition (comparison);
4373
4374   prepare_cmp_insn (op0, op1, comparison, size, unsignedp, OPTAB_LIB_WIDEN,
4375                     &test, &mode);
4376   emit_cmp_and_jump_insn_1 (test, mode, label, prob);
4377 }
4378
4379 \f
4380 /* Emit a library call comparison between floating point X and Y.
4381    COMPARISON is the rtl operator to compare with (EQ, NE, GT, etc.).  */
4382
4383 static void
4384 prepare_float_lib_cmp (rtx x, rtx y, enum rtx_code comparison,
4385                        rtx *ptest, enum machine_mode *pmode)
4386 {
4387   enum rtx_code swapped = swap_condition (comparison);
4388   enum rtx_code reversed = reverse_condition_maybe_unordered (comparison);
4389   enum machine_mode orig_mode = GET_MODE (x);
4390   enum machine_mode mode, cmp_mode;
4391   rtx true_rtx, false_rtx;
4392   rtx value, target, equiv;
4393   rtx_insn *insns;
4394   rtx libfunc = 0;
4395   bool reversed_p = false;
4396   cmp_mode = targetm.libgcc_cmp_return_mode ();
4397
4398   for (mode = orig_mode;
4399        mode != VOIDmode;
4400        mode = GET_MODE_WIDER_MODE (mode))
4401     {
4402       if (code_to_optab (comparison)
4403           && (libfunc = optab_libfunc (code_to_optab (comparison), mode)))
4404         break;
4405
4406       if (code_to_optab (swapped)
4407           && (libfunc = optab_libfunc (code_to_optab (swapped), mode)))
4408         {
4409           rtx tmp;
4410           tmp = x; x = y; y = tmp;
4411           comparison = swapped;
4412           break;
4413         }
4414
4415       if (code_to_optab (reversed)
4416           && (libfunc = optab_libfunc (code_to_optab (reversed), mode)))
4417         {
4418           comparison = reversed;
4419           reversed_p = true;
4420           break;
4421         }
4422     }
4423
4424   gcc_assert (mode != VOIDmode);
4425
4426   if (mode != orig_mode)
4427     {
4428       x = convert_to_mode (mode, x, 0);
4429       y = convert_to_mode (mode, y, 0);
4430     }
4431
4432   /* Attach a REG_EQUAL note describing the semantics of the libcall to
4433      the RTL.  The allows the RTL optimizers to delete the libcall if the
4434      condition can be determined at compile-time.  */
4435   if (comparison == UNORDERED
4436       || FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison))
4437     {
4438       true_rtx = const_true_rtx;
4439       false_rtx = const0_rtx;
4440     }
4441   else
4442     {
4443       switch (comparison)
4444         {
4445         case EQ:
4446           true_rtx = const0_rtx;
4447           false_rtx = const_true_rtx;
4448           break;
4449
4450         case NE:
4451           true_rtx = const_true_rtx;
4452           false_rtx = const0_rtx;
4453           break;
4454
4455         case GT:
4456           true_rtx = const1_rtx;
4457           false_rtx = const0_rtx;
4458           break;
4459
4460         case GE:
4461           true_rtx = const0_rtx;
4462           false_rtx = constm1_rtx;
4463           break;
4464
4465         case LT:
4466           true_rtx = constm1_rtx;
4467           false_rtx = const0_rtx;
4468           break;
4469
4470         case LE:
4471           true_rtx = const0_rtx;
4472           false_rtx = const1_rtx;
4473           break;
4474
4475         default:
4476           gcc_unreachable ();
4477         }
4478     }
4479
4480   if (comparison == UNORDERED)
4481     {
4482       rtx temp = simplify_gen_relational (NE, cmp_mode, mode, x, x);
4483       equiv = simplify_gen_relational (NE, cmp_mode, mode, y, y);
4484       equiv = simplify_gen_ternary (IF_THEN_ELSE, cmp_mode, cmp_mode,
4485                                     temp, const_true_rtx, equiv);
4486     }
4487   else
4488     {
4489       equiv = simplify_gen_relational (comparison, cmp_mode, mode, x, y);
4490       if (! FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison))
4491         equiv = simplify_gen_ternary (IF_THEN_ELSE, cmp_mode, cmp_mode,
4492                                       equiv, true_rtx, false_rtx);
4493     }
4494
4495   start_sequence ();
4496   value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
4497                                    cmp_mode, 2, x, mode, y, mode);
4498   insns = get_insns ();
4499   end_sequence ();
4500
4501   target = gen_reg_rtx (cmp_mode);
4502   emit_libcall_block (insns, target, value, equiv);
4503
4504   if (comparison == UNORDERED
4505       || FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison)
4506       || reversed_p)
4507     *ptest = gen_rtx_fmt_ee (reversed_p ? EQ : NE, VOIDmode, target, false_rtx);
4508   else
4509     *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, target, const0_rtx);
4510
4511   *pmode = cmp_mode;
4512 }
4513 \f
4514 /* Generate code to indirectly jump to a location given in the rtx LOC.  */
4515
4516 void
4517 emit_indirect_jump (rtx loc)
4518 {
4519   struct expand_operand ops[1];
4520
4521   create_address_operand (&ops[0], loc);
4522   expand_jump_insn (CODE_FOR_indirect_jump, 1, ops);
4523   emit_barrier ();
4524 }
4525 \f
4526 #ifdef HAVE_conditional_move
4527
4528 /* Emit a conditional move instruction if the machine supports one for that
4529    condition and machine mode.
4530
4531    OP0 and OP1 are the operands that should be compared using CODE.  CMODE is
4532    the mode to use should they be constants.  If it is VOIDmode, they cannot
4533    both be constants.
4534
4535    OP2 should be stored in TARGET if the comparison is true, otherwise OP3
4536    should be stored there.  MODE is the mode to use should they be constants.
4537    If it is VOIDmode, they cannot both be constants.
4538
4539    The result is either TARGET (perhaps modified) or NULL_RTX if the operation
4540    is not supported.  */
4541
4542 rtx
4543 emit_conditional_move (rtx target, enum rtx_code code, rtx op0, rtx op1,
4544                        enum machine_mode cmode, rtx op2, rtx op3,
4545                        enum machine_mode mode, int unsignedp)
4546 {
4547   rtx tem, comparison;
4548   rtx_insn *last;
4549   enum insn_code icode;
4550   enum rtx_code reversed;
4551
4552   /* If one operand is constant, make it the second one.  Only do this
4553      if the other operand is not constant as well.  */
4554
4555   if (swap_commutative_operands_p (op0, op1))
4556     {
4557       tem = op0;
4558       op0 = op1;
4559       op1 = tem;
4560       code = swap_condition (code);
4561     }
4562
4563   /* get_condition will prefer to generate LT and GT even if the old
4564      comparison was against zero, so undo that canonicalization here since
4565      comparisons against zero are cheaper.  */
4566   if (code == LT && op1 == const1_rtx)
4567     code = LE, op1 = const0_rtx;
4568   else if (code == GT && op1 == constm1_rtx)
4569     code = GE, op1 = const0_rtx;
4570
4571   if (cmode == VOIDmode)
4572     cmode = GET_MODE (op0);
4573
4574   if (swap_commutative_operands_p (op2, op3)
4575       && ((reversed = reversed_comparison_code_parts (code, op0, op1, NULL))
4576           != UNKNOWN))
4577     {
4578       tem = op2;
4579       op2 = op3;
4580       op3 = tem;
4581       code = reversed;
4582     }
4583
4584   if (mode == VOIDmode)
4585     mode = GET_MODE (op2);
4586
4587   icode = direct_optab_handler (movcc_optab, mode);
4588
4589   if (icode == CODE_FOR_nothing)
4590     return 0;
4591
4592   if (!target)
4593     target = gen_reg_rtx (mode);
4594
4595   code = unsignedp ? unsigned_condition (code) : code;
4596   comparison = simplify_gen_relational (code, VOIDmode, cmode, op0, op1);
4597
4598   /* We can get const0_rtx or const_true_rtx in some circumstances.  Just
4599      return NULL and let the caller figure out how best to deal with this
4600      situation.  */
4601   if (!COMPARISON_P (comparison))
4602     return NULL_RTX;
4603
4604   saved_pending_stack_adjust save;
4605   save_pending_stack_adjust (&save);
4606   last = get_last_insn ();
4607   do_pending_stack_adjust ();
4608   prepare_cmp_insn (XEXP (comparison, 0), XEXP (comparison, 1),
4609                     GET_CODE (comparison), NULL_RTX, unsignedp, OPTAB_WIDEN,
4610                     &comparison, &cmode);
4611   if (comparison)
4612     {
4613       struct expand_operand ops[4];
4614
4615       create_output_operand (&ops[0], target, mode);
4616       create_fixed_operand (&ops[1], comparison);
4617       create_input_operand (&ops[2], op2, mode);
4618       create_input_operand (&ops[3], op3, mode);
4619       if (maybe_expand_insn (icode, 4, ops))
4620         {
4621           if (ops[0].value != target)
4622             convert_move (target, ops[0].value, false);
4623           return target;
4624         }
4625     }
4626   delete_insns_since (last);
4627   restore_pending_stack_adjust (&save);
4628   return NULL_RTX;
4629 }
4630
4631 /* Return nonzero if a conditional move of mode MODE is supported.
4632
4633    This function is for combine so it can tell whether an insn that looks
4634    like a conditional move is actually supported by the hardware.  If we
4635    guess wrong we lose a bit on optimization, but that's it.  */
4636 /* ??? sparc64 supports conditionally moving integers values based on fp
4637    comparisons, and vice versa.  How do we handle them?  */
4638
4639 int
4640 can_conditionally_move_p (enum machine_mode mode)
4641 {
4642   if (direct_optab_handler (movcc_optab, mode) != CODE_FOR_nothing)
4643     return 1;
4644
4645   return 0;
4646 }
4647
4648 #endif /* HAVE_conditional_move */
4649
4650 /* Emit a conditional addition instruction if the machine supports one for that
4651    condition and machine mode.
4652
4653    OP0 and OP1 are the operands that should be compared using CODE.  CMODE is
4654    the mode to use should they be constants.  If it is VOIDmode, they cannot
4655    both be constants.
4656
4657    OP2 should be stored in TARGET if the comparison is false, otherwise OP2+OP3
4658    should be stored there.  MODE is the mode to use should they be constants.
4659    If it is VOIDmode, they cannot both be constants.
4660
4661    The result is either TARGET (perhaps modified) or NULL_RTX if the operation
4662    is not supported.  */
4663
4664 rtx
4665 emit_conditional_add (rtx target, enum rtx_code code, rtx op0, rtx op1,
4666                       enum machine_mode cmode, rtx op2, rtx op3,
4667                       enum machine_mode mode, int unsignedp)
4668 {
4669   rtx tem, comparison;
4670   rtx_insn *last;
4671   enum insn_code icode;
4672
4673   /* If one operand is constant, make it the second one.  Only do this
4674      if the other operand is not constant as well.  */
4675
4676   if (swap_commutative_operands_p (op0, op1))
4677     {
4678       tem = op0;
4679       op0 = op1;
4680       op1 = tem;
4681       code = swap_condition (code);
4682     }
4683
4684   /* get_condition will prefer to generate LT and GT even if the old
4685      comparison was against zero, so undo that canonicalization here since
4686      comparisons against zero are cheaper.  */
4687   if (code == LT && op1 == const1_rtx)
4688     code = LE, op1 = const0_rtx;
4689   else if (code == GT && op1 == constm1_rtx)
4690     code = GE, op1 = const0_rtx;
4691
4692   if (cmode == VOIDmode)
4693     cmode = GET_MODE (op0);
4694
4695   if (mode == VOIDmode)
4696     mode = GET_MODE (op2);
4697
4698   icode = optab_handler (addcc_optab, mode);
4699
4700   if (icode == CODE_FOR_nothing)
4701     return 0;
4702
4703   if (!target)
4704     target = gen_reg_rtx (mode);
4705
4706   code = unsignedp ? unsigned_condition (code) : code;
4707   comparison = simplify_gen_relational (code, VOIDmode, cmode, op0, op1);
4708
4709   /* We can get const0_rtx or const_true_rtx in some circumstances.  Just
4710      return NULL and let the caller figure out how best to deal with this
4711      situation.  */
4712   if (!COMPARISON_P (comparison))
4713     return NULL_RTX;
4714
4715   do_pending_stack_adjust ();
4716   last = get_last_insn ();
4717   prepare_cmp_insn (XEXP (comparison, 0), XEXP (comparison, 1),
4718                     GET_CODE (comparison), NULL_RTX, unsignedp, OPTAB_WIDEN,
4719                     &comparison, &cmode);
4720   if (comparison)
4721     {
4722       struct expand_operand ops[4];
4723
4724       create_output_operand (&ops[0], target, mode);
4725       create_fixed_operand (&ops[1], comparison);
4726       create_input_operand (&ops[2], op2, mode);
4727       create_input_operand (&ops[3], op3, mode);
4728       if (maybe_expand_insn (icode, 4, ops))
4729         {
4730           if (ops[0].value != target)
4731             convert_move (target, ops[0].value, false);
4732           return target;
4733         }
4734     }
4735   delete_insns_since (last);
4736   return NULL_RTX;
4737 }
4738 \f
4739 /* These functions attempt to generate an insn body, rather than
4740    emitting the insn, but if the gen function already emits them, we
4741    make no attempt to turn them back into naked patterns.  */
4742
4743 /* Generate and return an insn body to add Y to X.  */
4744
4745 rtx
4746 gen_add2_insn (rtx x, rtx y)
4747 {
4748   enum insn_code icode = optab_handler (add_optab, GET_MODE (x));
4749
4750   gcc_assert (insn_operand_matches (icode, 0, x));
4751   gcc_assert (insn_operand_matches (icode, 1, x));
4752   gcc_assert (insn_operand_matches (icode, 2, y));
4753
4754   return GEN_FCN (icode) (x, x, y);
4755 }
4756
4757 /* Generate and return an insn body to add r1 and c,
4758    storing the result in r0.  */
4759
4760 rtx
4761 gen_add3_insn (rtx r0, rtx r1, rtx c)
4762 {
4763   enum insn_code icode = optab_handler (add_optab, GET_MODE (r0));
4764
4765   if (icode == CODE_FOR_nothing
4766       || !insn_operand_matches (icode, 0, r0)
4767       || !insn_operand_matches (icode, 1, r1)
4768       || !insn_operand_matches (icode, 2, c))
4769     return NULL_RTX;
4770
4771   return GEN_FCN (icode) (r0, r1, c);
4772 }
4773
4774 int
4775 have_add2_insn (rtx x, rtx y)
4776 {
4777   enum insn_code icode;
4778
4779   gcc_assert (GET_MODE (x) != VOIDmode);
4780
4781   icode = optab_handler (add_optab, GET_MODE (x));
4782
4783   if (icode == CODE_FOR_nothing)
4784     return 0;
4785
4786   if (!insn_operand_matches (icode, 0, x)
4787       || !insn_operand_matches (icode, 1, x)
4788       || !insn_operand_matches (icode, 2, y))
4789     return 0;
4790
4791   return 1;
4792 }
4793
4794 /* Generate and return an insn body to add Y to X.  */
4795
4796 rtx
4797 gen_addptr3_insn (rtx x, rtx y, rtx z)
4798 {
4799   enum insn_code icode = optab_handler (addptr3_optab, GET_MODE (x));
4800
4801   gcc_assert (insn_operand_matches (icode, 0, x));
4802   gcc_assert (insn_operand_matches (icode, 1, y));
4803   gcc_assert (insn_operand_matches (icode, 2, z));
4804
4805   return GEN_FCN (icode) (x, y, z);
4806 }
4807
4808 /* Return true if the target implements an addptr pattern and X, Y,
4809    and Z are valid for the pattern predicates.  */
4810
4811 int
4812 have_addptr3_insn (rtx x, rtx y, rtx z)
4813 {
4814   enum insn_code icode;
4815
4816   gcc_assert (GET_MODE (x) != VOIDmode);
4817
4818   icode = optab_handler (addptr3_optab, GET_MODE (x));
4819
4820   if (icode == CODE_FOR_nothing)
4821     return 0;
4822
4823   if (!insn_operand_matches (icode, 0, x)
4824       || !insn_operand_matches (icode, 1, y)
4825       || !insn_operand_matches (icode, 2, z))
4826     return 0;
4827
4828   return 1;
4829 }
4830
4831 /* Generate and return an insn body to subtract Y from X.  */
4832
4833 rtx
4834 gen_sub2_insn (rtx x, rtx y)
4835 {
4836   enum insn_code icode = optab_handler (sub_optab, GET_MODE (x));
4837
4838   gcc_assert (insn_operand_matches (icode, 0, x));
4839   gcc_assert (insn_operand_matches (icode, 1, x));
4840   gcc_assert (insn_operand_matches (icode, 2, y));
4841
4842   return GEN_FCN (icode) (x, x, y);
4843 }
4844
4845 /* Generate and return an insn body to subtract r1 and c,
4846    storing the result in r0.  */
4847
4848 rtx
4849 gen_sub3_insn (rtx r0, rtx r1, rtx c)
4850 {
4851   enum insn_code icode = optab_handler (sub_optab, GET_MODE (r0));
4852
4853   if (icode == CODE_FOR_nothing
4854       || !insn_operand_matches (icode, 0, r0)
4855       || !insn_operand_matches (icode, 1, r1)
4856       || !insn_operand_matches (icode, 2, c))
4857     return NULL_RTX;
4858
4859   return GEN_FCN (icode) (r0, r1, c);
4860 }
4861
4862 int
4863 have_sub2_insn (rtx x, rtx y)
4864 {
4865   enum insn_code icode;
4866
4867   gcc_assert (GET_MODE (x) != VOIDmode);
4868
4869   icode = optab_handler (sub_optab, GET_MODE (x));
4870
4871   if (icode == CODE_FOR_nothing)
4872     return 0;
4873
4874   if (!insn_operand_matches (icode, 0, x)
4875       || !insn_operand_matches (icode, 1, x)
4876       || !insn_operand_matches (icode, 2, y))
4877     return 0;
4878
4879   return 1;
4880 }
4881
4882 /* Generate the body of an instruction to copy Y into X.
4883    It may be a list of insns, if one insn isn't enough.  */
4884
4885 rtx
4886 gen_move_insn (rtx x, rtx y)
4887 {
4888   rtx_insn *seq;
4889
4890   start_sequence ();
4891   emit_move_insn_1 (x, y);
4892   seq = get_insns ();
4893   end_sequence ();
4894   return seq;
4895 }
4896 \f
4897 /* Return the insn code used to extend FROM_MODE to TO_MODE.
4898    UNSIGNEDP specifies zero-extension instead of sign-extension.  If
4899    no such operation exists, CODE_FOR_nothing will be returned.  */
4900
4901 enum insn_code
4902 can_extend_p (enum machine_mode to_mode, enum machine_mode from_mode,
4903               int unsignedp)
4904 {
4905   convert_optab tab;
4906 #ifdef HAVE_ptr_extend
4907   if (unsignedp < 0)
4908     return CODE_FOR_ptr_extend;
4909 #endif
4910
4911   tab = unsignedp ? zext_optab : sext_optab;
4912   return convert_optab_handler (tab, to_mode, from_mode);
4913 }
4914
4915 /* Generate the body of an insn to extend Y (with mode MFROM)
4916    into X (with mode MTO).  Do zero-extension if UNSIGNEDP is nonzero.  */
4917
4918 rtx
4919 gen_extend_insn (rtx x, rtx y, enum machine_mode mto,
4920                  enum machine_mode mfrom, int unsignedp)
4921 {
4922   enum insn_code icode = can_extend_p (mto, mfrom, unsignedp);
4923   return GEN_FCN (icode) (x, y);
4924 }
4925 \f
4926 /* can_fix_p and can_float_p say whether the target machine
4927    can directly convert a given fixed point type to
4928    a given floating point type, or vice versa.
4929    The returned value is the CODE_FOR_... value to use,
4930    or CODE_FOR_nothing if these modes cannot be directly converted.
4931
4932    *TRUNCP_PTR is set to 1 if it is necessary to output
4933    an explicit FTRUNC insn before the fix insn; otherwise 0.  */
4934
4935 static enum insn_code
4936 can_fix_p (enum machine_mode fixmode, enum machine_mode fltmode,
4937            int unsignedp, int *truncp_ptr)
4938 {
4939   convert_optab tab;
4940   enum insn_code icode;
4941
4942   tab = unsignedp ? ufixtrunc_optab : sfixtrunc_optab;
4943   icode = convert_optab_handler (tab, fixmode, fltmode);
4944   if (icode != CODE_FOR_nothing)
4945     {
4946       *truncp_ptr = 0;
4947       return icode;
4948     }
4949
4950   /* FIXME: This requires a port to define both FIX and FTRUNC pattern
4951      for this to work. We need to rework the fix* and ftrunc* patterns
4952      and documentation.  */
4953   tab = unsignedp ? ufix_optab : sfix_optab;
4954   icode = convert_optab_handler (tab, fixmode, fltmode);
4955   if (icode != CODE_FOR_nothing
4956       && optab_handler (ftrunc_optab, fltmode) != CODE_FOR_nothing)
4957     {
4958       *truncp_ptr = 1;
4959       return icode;
4960     }
4961
4962   *truncp_ptr = 0;
4963   return CODE_FOR_nothing;
4964 }
4965
4966 enum insn_code
4967 can_float_p (enum machine_mode fltmode, enum machine_mode fixmode,
4968              int unsignedp)
4969 {
4970   convert_optab tab;
4971
4972   tab = unsignedp ? ufloat_optab : sfloat_optab;
4973   return convert_optab_handler (tab, fltmode, fixmode);
4974 }
4975
4976 /* Function supportable_convert_operation
4977
4978    Check whether an operation represented by the code CODE is a
4979    convert operation that is supported by the target platform in
4980    vector form (i.e., when operating on arguments of type VECTYPE_IN
4981    producing a result of type VECTYPE_OUT).
4982
4983    Convert operations we currently support directly are FIX_TRUNC and FLOAT.
4984    This function checks if these operations are supported
4985    by the target platform either directly (via vector tree-codes), or via
4986    target builtins.
4987
4988    Output:
4989    - CODE1 is code of vector operation to be used when
4990    vectorizing the operation, if available.
4991    - DECL is decl of target builtin functions to be used
4992    when vectorizing the operation, if available.  In this case,
4993    CODE1 is CALL_EXPR.  */
4994
4995 bool
4996 supportable_convert_operation (enum tree_code code,
4997                                     tree vectype_out, tree vectype_in,
4998                                     tree *decl, enum tree_code *code1)
4999 {
5000   enum machine_mode m1,m2;
5001   int truncp;
5002
5003   m1 = TYPE_MODE (vectype_out);
5004   m2 = TYPE_MODE (vectype_in);
5005
5006   /* First check if we can done conversion directly.  */
5007   if ((code == FIX_TRUNC_EXPR
5008        && can_fix_p (m1,m2,TYPE_UNSIGNED (vectype_out), &truncp)
5009           != CODE_FOR_nothing)
5010       || (code == FLOAT_EXPR
5011           && can_float_p (m1,m2,TYPE_UNSIGNED (vectype_in))
5012              != CODE_FOR_nothing))
5013     {
5014       *code1 = code;
5015       return true;
5016     }
5017
5018   /* Now check for builtin.  */
5019   if (targetm.vectorize.builtin_conversion
5020       && targetm.vectorize.builtin_conversion (code, vectype_out, vectype_in))
5021     {
5022       *code1 = CALL_EXPR;
5023       *decl = targetm.vectorize.builtin_conversion (code, vectype_out, vectype_in);
5024       return true;
5025     }
5026   return false;
5027 }
5028
5029 \f
5030 /* Generate code to convert FROM to floating point
5031    and store in TO.  FROM must be fixed point and not VOIDmode.
5032    UNSIGNEDP nonzero means regard FROM as unsigned.
5033    Normally this is done by correcting the final value
5034    if it is negative.  */
5035
5036 void
5037 expand_float (rtx to, rtx from, int unsignedp)
5038 {
5039   enum insn_code icode;
5040   rtx target = to;
5041   enum machine_mode fmode, imode;
5042   bool can_do_signed = false;
5043
5044   /* Crash now, because we won't be able to decide which mode to use.  */
5045   gcc_assert (GET_MODE (from) != VOIDmode);
5046
5047   /* Look for an insn to do the conversion.  Do it in the specified
5048      modes if possible; otherwise convert either input, output or both to
5049      wider mode.  If the integer mode is wider than the mode of FROM,
5050      we can do the conversion signed even if the input is unsigned.  */
5051
5052   for (fmode = GET_MODE (to); fmode != VOIDmode;
5053        fmode = GET_MODE_WIDER_MODE (fmode))
5054     for (imode = GET_MODE (from); imode != VOIDmode;
5055          imode = GET_MODE_WIDER_MODE (imode))
5056       {
5057         int doing_unsigned = unsignedp;
5058
5059         if (fmode != GET_MODE (to)
5060             && significand_size (fmode) < GET_MODE_PRECISION (GET_MODE (from)))
5061           continue;
5062
5063         icode = can_float_p (fmode, imode, unsignedp);
5064         if (icode == CODE_FOR_nothing && unsignedp)
5065           {
5066             enum insn_code scode = can_float_p (fmode, imode, 0);
5067             if (scode != CODE_FOR_nothing)
5068               can_do_signed = true;
5069             if (imode != GET_MODE (from))
5070               icode = scode, doing_unsigned = 0;
5071           }
5072
5073         if (icode != CODE_FOR_nothing)
5074           {
5075             if (imode != GET_MODE (from))
5076               from = convert_to_mode (imode, from, unsignedp);
5077
5078             if (fmode != GET_MODE (to))
5079               target = gen_reg_rtx (fmode);
5080
5081             emit_unop_insn (icode, target, from,
5082                             doing_unsigned ? UNSIGNED_FLOAT : FLOAT);
5083
5084             if (target != to)
5085               convert_move (to, target, 0);
5086             return;
5087           }
5088       }
5089
5090   /* Unsigned integer, and no way to convert directly.  Convert as signed,
5091      then unconditionally adjust the result.  */
5092   if (unsignedp && can_do_signed)
5093     {
5094       rtx_code_label *label = gen_label_rtx ();
5095       rtx temp;
5096       REAL_VALUE_TYPE offset;
5097
5098       /* Look for a usable floating mode FMODE wider than the source and at
5099          least as wide as the target.  Using FMODE will avoid rounding woes
5100          with unsigned values greater than the signed maximum value.  */
5101
5102       for (fmode = GET_MODE (to);  fmode != VOIDmode;
5103            fmode = GET_MODE_WIDER_MODE (fmode))
5104         if (GET_MODE_PRECISION (GET_MODE (from)) < GET_MODE_BITSIZE (fmode)
5105             && can_float_p (fmode, GET_MODE (from), 0) != CODE_FOR_nothing)
5106           break;
5107
5108       if (fmode == VOIDmode)
5109         {
5110           /* There is no such mode.  Pretend the target is wide enough.  */
5111           fmode = GET_MODE (to);
5112
5113           /* Avoid double-rounding when TO is narrower than FROM.  */
5114           if ((significand_size (fmode) + 1)
5115               < GET_MODE_PRECISION (GET_MODE (from)))
5116             {
5117               rtx temp1;
5118               rtx_code_label *neglabel = gen_label_rtx ();
5119
5120               /* Don't use TARGET if it isn't a register, is a hard register,
5121                  or is the wrong mode.  */
5122               if (!REG_P (target)
5123                   || REGNO (target) < FIRST_PSEUDO_REGISTER
5124                   || GET_MODE (target) != fmode)
5125                 target = gen_reg_rtx (fmode);
5126
5127               imode = GET_MODE (from);
5128               do_pending_stack_adjust ();
5129
5130               /* Test whether the sign bit is set.  */
5131               emit_cmp_and_jump_insns (from, const0_rtx, LT, NULL_RTX, imode,
5132                                        0, neglabel);
5133
5134               /* The sign bit is not set.  Convert as signed.  */
5135               expand_float (target, from, 0);
5136               emit_jump_insn (gen_jump (label));
5137               emit_barrier ();
5138
5139               /* The sign bit is set.
5140                  Convert to a usable (positive signed) value by shifting right
5141                  one bit, while remembering if a nonzero bit was shifted
5142                  out; i.e., compute  (from & 1) | (from >> 1).  */
5143
5144               emit_label (neglabel);
5145               temp = expand_binop (imode, and_optab, from, const1_rtx,
5146                                    NULL_RTX, 1, OPTAB_LIB_WIDEN);
5147               temp1 = expand_shift (RSHIFT_EXPR, imode, from, 1, NULL_RTX, 1);
5148               temp = expand_binop (imode, ior_optab, temp, temp1, temp, 1,
5149                                    OPTAB_LIB_WIDEN);
5150               expand_float (target, temp, 0);
5151
5152               /* Multiply by 2 to undo the shift above.  */
5153               temp = expand_binop (fmode, add_optab, target, target,
5154                                    target, 0, OPTAB_LIB_WIDEN);
5155               if (temp != target)
5156                 emit_move_insn (target, temp);
5157
5158               do_pending_stack_adjust ();
5159               emit_label (label);
5160               goto done;
5161             }
5162         }
5163
5164       /* If we are about to do some arithmetic to correct for an
5165          unsigned operand, do it in a pseudo-register.  */
5166
5167       if (GET_MODE (to) != fmode
5168           || !REG_P (to) || REGNO (to) < FIRST_PSEUDO_REGISTER)
5169         target = gen_reg_rtx (fmode);
5170
5171       /* Convert as signed integer to floating.  */
5172       expand_float (target, from, 0);
5173
5174       /* If FROM is negative (and therefore TO is negative),
5175          correct its value by 2**bitwidth.  */
5176
5177       do_pending_stack_adjust ();
5178       emit_cmp_and_jump_insns (from, const0_rtx, GE, NULL_RTX, GET_MODE (from),
5179                                0, label);
5180
5181
5182       real_2expN (&offset, GET_MODE_PRECISION (GET_MODE (from)), fmode);
5183       temp = expand_binop (fmode, add_optab, target,
5184                            CONST_DOUBLE_FROM_REAL_VALUE (offset, fmode),
5185                            target, 0, OPTAB_LIB_WIDEN);
5186       if (temp != target)
5187         emit_move_insn (target, temp);
5188
5189       do_pending_stack_adjust ();
5190       emit_label (label);
5191       goto done;
5192     }
5193
5194   /* No hardware instruction available; call a library routine.  */
5195     {
5196       rtx libfunc;
5197       rtx_insn *insns;
5198       rtx value;
5199       convert_optab tab = unsignedp ? ufloat_optab : sfloat_optab;
5200
5201       if (GET_MODE_PRECISION (GET_MODE (from)) < GET_MODE_PRECISION (SImode))
5202         from = convert_to_mode (SImode, from, unsignedp);
5203
5204       libfunc = convert_optab_libfunc (tab, GET_MODE (to), GET_MODE (from));
5205       gcc_assert (libfunc);
5206
5207       start_sequence ();
5208
5209       value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
5210                                        GET_MODE (to), 1, from,
5211                                        GET_MODE (from));
5212       insns = get_insns ();
5213       end_sequence ();
5214
5215       emit_libcall_block (insns, target, value,
5216                           gen_rtx_fmt_e (unsignedp ? UNSIGNED_FLOAT : FLOAT,
5217                                          GET_MODE (to), from));
5218     }
5219
5220  done:
5221
5222   /* Copy result to requested destination
5223      if we have been computing in a temp location.  */
5224
5225   if (target != to)
5226     {
5227       if (GET_MODE (target) == GET_MODE (to))
5228         emit_move_insn (to, target);
5229       else
5230         convert_move (to, target, 0);
5231     }
5232 }
5233 \f
5234 /* Generate code to convert FROM to fixed point and store in TO.  FROM
5235    must be floating point.  */
5236
5237 void
5238 expand_fix (rtx to, rtx from, int unsignedp)
5239 {
5240   enum insn_code icode;
5241   rtx target = to;
5242   enum machine_mode fmode, imode;
5243   int must_trunc = 0;
5244
5245   /* We first try to find a pair of modes, one real and one integer, at
5246      least as wide as FROM and TO, respectively, in which we can open-code
5247      this conversion.  If the integer mode is wider than the mode of TO,
5248      we can do the conversion either signed or unsigned.  */
5249
5250   for (fmode = GET_MODE (from); fmode != VOIDmode;
5251        fmode = GET_MODE_WIDER_MODE (fmode))
5252     for (imode = GET_MODE (to); imode != VOIDmode;
5253          imode = GET_MODE_WIDER_MODE (imode))
5254       {
5255         int doing_unsigned = unsignedp;
5256
5257         icode = can_fix_p (imode, fmode, unsignedp, &must_trunc);
5258         if (icode == CODE_FOR_nothing && imode != GET_MODE (to) && unsignedp)
5259           icode = can_fix_p (imode, fmode, 0, &must_trunc), doing_unsigned = 0;
5260
5261         if (icode != CODE_FOR_nothing)
5262           {
5263             rtx_insn *last = get_last_insn ();
5264             if (fmode != GET_MODE (from))
5265               from = convert_to_mode (fmode, from, 0);
5266
5267             if (must_trunc)
5268               {
5269                 rtx temp = gen_reg_rtx (GET_MODE (from));
5270                 from = expand_unop (GET_MODE (from), ftrunc_optab, from,
5271                                     temp, 0);
5272               }
5273
5274             if (imode != GET_MODE (to))
5275               target = gen_reg_rtx (imode);
5276
5277             if (maybe_emit_unop_insn (icode, target, from,
5278                                       doing_unsigned ? UNSIGNED_FIX : FIX))
5279               {
5280                 if (target != to)
5281                   convert_move (to, target, unsignedp);
5282                 return;
5283               }
5284             delete_insns_since (last);
5285           }
5286       }
5287
5288   /* For an unsigned conversion, there is one more way to do it.
5289      If we have a signed conversion, we generate code that compares
5290      the real value to the largest representable positive number.  If if
5291      is smaller, the conversion is done normally.  Otherwise, subtract
5292      one plus the highest signed number, convert, and add it back.
5293
5294      We only need to check all real modes, since we know we didn't find
5295      anything with a wider integer mode.
5296
5297      This code used to extend FP value into mode wider than the destination.
5298      This is needed for decimal float modes which cannot accurately
5299      represent one plus the highest signed number of the same size, but
5300      not for binary modes.  Consider, for instance conversion from SFmode
5301      into DImode.
5302
5303      The hot path through the code is dealing with inputs smaller than 2^63
5304      and doing just the conversion, so there is no bits to lose.
5305
5306      In the other path we know the value is positive in the range 2^63..2^64-1
5307      inclusive.  (as for other input overflow happens and result is undefined)
5308      So we know that the most important bit set in mantissa corresponds to
5309      2^63.  The subtraction of 2^63 should not generate any rounding as it
5310      simply clears out that bit.  The rest is trivial.  */
5311
5312   if (unsignedp && GET_MODE_PRECISION (GET_MODE (to)) <= HOST_BITS_PER_WIDE_INT)
5313     for (fmode = GET_MODE (from); fmode != VOIDmode;
5314          fmode = GET_MODE_WIDER_MODE (fmode))
5315       if (CODE_FOR_nothing != can_fix_p (GET_MODE (to), fmode, 0, &must_trunc)
5316           && (!DECIMAL_FLOAT_MODE_P (fmode)
5317               || GET_MODE_BITSIZE (fmode) > GET_MODE_PRECISION (GET_MODE (to))))
5318         {
5319           int bitsize;
5320           REAL_VALUE_TYPE offset;
5321           rtx limit;
5322           rtx_code_label *lab1, *lab2;
5323           rtx_insn *insn;
5324
5325           bitsize = GET_MODE_PRECISION (GET_MODE (to));
5326           real_2expN (&offset, bitsize - 1, fmode);
5327           limit = CONST_DOUBLE_FROM_REAL_VALUE (offset, fmode);
5328           lab1 = gen_label_rtx ();
5329           lab2 = gen_label_rtx ();
5330
5331           if (fmode != GET_MODE (from))
5332             from = convert_to_mode (fmode, from, 0);
5333
5334           /* See if we need to do the subtraction.  */
5335           do_pending_stack_adjust ();
5336           emit_cmp_and_jump_insns (from, limit, GE, NULL_RTX, GET_MODE (from),
5337                                    0, lab1);
5338
5339           /* If not, do the signed "fix" and branch around fixup code.  */
5340           expand_fix (to, from, 0);
5341           emit_jump_insn (gen_jump (lab2));
5342           emit_barrier ();
5343
5344           /* Otherwise, subtract 2**(N-1), convert to signed number,
5345              then add 2**(N-1).  Do the addition using XOR since this
5346              will often generate better code.  */
5347           emit_label (lab1);
5348           target = expand_binop (GET_MODE (from), sub_optab, from, limit,
5349                                  NULL_RTX, 0, OPTAB_LIB_WIDEN);
5350           expand_fix (to, target, 0);
5351           target = expand_binop (GET_MODE (to), xor_optab, to,
5352                                  gen_int_mode
5353                                  ((HOST_WIDE_INT) 1 << (bitsize - 1),
5354                                   GET_MODE (to)),
5355                                  to, 1, OPTAB_LIB_WIDEN);
5356
5357           if (target != to)
5358             emit_move_insn (to, target);
5359
5360           emit_label (lab2);
5361
5362           if (optab_handler (mov_optab, GET_MODE (to)) != CODE_FOR_nothing)
5363             {
5364               /* Make a place for a REG_NOTE and add it.  */
5365               insn = emit_move_insn (to, to);
5366               set_dst_reg_note (insn, REG_EQUAL,
5367                                 gen_rtx_fmt_e (UNSIGNED_FIX, GET_MODE (to),
5368                                                copy_rtx (from)),
5369                                 to);
5370             }
5371
5372           return;
5373         }
5374
5375   /* We can't do it with an insn, so use a library call.  But first ensure
5376      that the mode of TO is at least as wide as SImode, since those are the
5377      only library calls we know about.  */
5378
5379   if (GET_MODE_PRECISION (GET_MODE (to)) < GET_MODE_PRECISION (SImode))
5380     {
5381       target = gen_reg_rtx (SImode);
5382
5383       expand_fix (target, from, unsignedp);
5384     }
5385   else
5386     {
5387       rtx_insn *insns;
5388       rtx value;
5389       rtx libfunc;
5390
5391       convert_optab tab = unsignedp ? ufix_optab : sfix_optab;
5392       libfunc = convert_optab_libfunc (tab, GET_MODE (to), GET_MODE (from));
5393       gcc_assert (libfunc);
5394
5395       start_sequence ();
5396
5397       value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
5398                                        GET_MODE (to), 1, from,
5399                                        GET_MODE (from));
5400       insns = get_insns ();
5401       end_sequence ();
5402
5403       emit_libcall_block (insns, target, value,
5404                           gen_rtx_fmt_e (unsignedp ? UNSIGNED_FIX : FIX,
5405                                          GET_MODE (to), from));
5406     }
5407
5408   if (target != to)
5409     {
5410       if (GET_MODE (to) == GET_MODE (target))
5411         emit_move_insn (to, target);
5412       else
5413         convert_move (to, target, 0);
5414     }
5415 }
5416
5417 /* Generate code to convert FROM or TO a fixed-point.
5418    If UINTP is true, either TO or FROM is an unsigned integer.
5419    If SATP is true, we need to saturate the result.  */
5420
5421 void
5422 expand_fixed_convert (rtx to, rtx from, int uintp, int satp)
5423 {
5424   enum machine_mode to_mode = GET_MODE (to);
5425   enum machine_mode from_mode = GET_MODE (from);
5426   convert_optab tab;
5427   enum rtx_code this_code;
5428   enum insn_code code;
5429   rtx_insn *insns;
5430   rtx value;
5431   rtx libfunc;
5432
5433   if (to_mode == from_mode)
5434     {
5435       emit_move_insn (to, from);
5436       return;
5437     }
5438
5439   if (uintp)
5440     {
5441       tab = satp ? satfractuns_optab : fractuns_optab;
5442       this_code = satp ? UNSIGNED_SAT_FRACT : UNSIGNED_FRACT_CONVERT;
5443     }
5444   else
5445     {
5446       tab = satp ? satfract_optab : fract_optab;
5447       this_code = satp ? SAT_FRACT : FRACT_CONVERT;
5448     }
5449   code = convert_optab_handler (tab, to_mode, from_mode);
5450   if (code != CODE_FOR_nothing)
5451     {
5452       emit_unop_insn (code, to, from, this_code);
5453       return;
5454     }
5455
5456   libfunc = convert_optab_libfunc (tab, to_mode, from_mode);
5457   gcc_assert (libfunc);
5458
5459   start_sequence ();
5460   value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST, to_mode,
5461                                    1, from, from_mode);
5462   insns = get_insns ();
5463   end_sequence ();
5464
5465   emit_libcall_block (insns, to, value,
5466                       gen_rtx_fmt_e (optab_to_code (tab), to_mode, from));
5467 }
5468
5469 /* Generate code to convert FROM to fixed point and store in TO.  FROM
5470    must be floating point, TO must be signed.  Use the conversion optab
5471    TAB to do the conversion.  */
5472
5473 bool
5474 expand_sfix_optab (rtx to, rtx from, convert_optab tab)
5475 {
5476   enum insn_code icode;
5477   rtx target = to;
5478   enum machine_mode fmode, imode;
5479
5480   /* We first try to find a pair of modes, one real and one integer, at
5481      least as wide as FROM and TO, respectively, in which we can open-code
5482      this conversion.  If the integer mode is wider than the mode of TO,
5483      we can do the conversion either signed or unsigned.  */
5484
5485   for (fmode = GET_MODE (from); fmode != VOIDmode;
5486        fmode = GET_MODE_WIDER_MODE (fmode))
5487     for (imode = GET_MODE (to); imode != VOIDmode;
5488          imode = GET_MODE_WIDER_MODE (imode))
5489       {
5490         icode = convert_optab_handler (tab, imode, fmode);
5491         if (icode != CODE_FOR_nothing)
5492           {
5493             rtx_insn *last = get_last_insn ();
5494             if (fmode != GET_MODE (from))
5495               from = convert_to_mode (fmode, from, 0);
5496
5497             if (imode != GET_MODE (to))
5498               target = gen_reg_rtx (imode);
5499
5500             if (!maybe_emit_unop_insn (icode, target, from, UNKNOWN))
5501               {
5502                 delete_insns_since (last);
5503                 continue;
5504               }
5505             if (target != to)
5506               convert_move (to, target, 0);
5507             return true;
5508           }
5509       }
5510
5511   return false;
5512 }
5513 \f
5514 /* Report whether we have an instruction to perform the operation
5515    specified by CODE on operands of mode MODE.  */
5516 int
5517 have_insn_for (enum rtx_code code, enum machine_mode mode)
5518 {
5519   return (code_to_optab (code)
5520           && (optab_handler (code_to_optab (code), mode)
5521               != CODE_FOR_nothing));
5522 }
5523
5524 /* Initialize the libfunc fields of an entire group of entries in some
5525    optab.  Each entry is set equal to a string consisting of a leading
5526    pair of underscores followed by a generic operation name followed by
5527    a mode name (downshifted to lowercase) followed by a single character
5528    representing the number of operands for the given operation (which is
5529    usually one of the characters '2', '3', or '4').
5530
5531    OPTABLE is the table in which libfunc fields are to be initialized.
5532    OPNAME is the generic (string) name of the operation.
5533    SUFFIX is the character which specifies the number of operands for
5534      the given generic operation.
5535    MODE is the mode to generate for.
5536 */
5537
5538 static void
5539 gen_libfunc (optab optable, const char *opname, int suffix,
5540              enum machine_mode mode)
5541 {
5542   unsigned opname_len = strlen (opname);
5543   const char *mname = GET_MODE_NAME (mode);
5544   unsigned mname_len = strlen (mname);
5545   int prefix_len = targetm.libfunc_gnu_prefix ? 6 : 2;
5546   int len = prefix_len + opname_len + mname_len + 1 + 1;
5547   char *libfunc_name = XALLOCAVEC (char, len);
5548   char *p;
5549   const char *q;
5550
5551   p = libfunc_name;
5552   *p++ = '_';
5553   *p++ = '_';
5554   if (targetm.libfunc_gnu_prefix)
5555     {
5556       *p++ = 'g';
5557       *p++ = 'n';
5558       *p++ = 'u';
5559       *p++ = '_';
5560     }
5561   for (q = opname; *q; )
5562     *p++ = *q++;
5563   for (q = mname; *q; q++)
5564     *p++ = TOLOWER (*q);
5565   *p++ = suffix;
5566   *p = '\0';
5567
5568   set_optab_libfunc (optable, mode,
5569                      ggc_alloc_string (libfunc_name, p - libfunc_name));
5570 }
5571
5572 /* Like gen_libfunc, but verify that integer operation is involved.  */
5573
5574 void
5575 gen_int_libfunc (optab optable, const char *opname, char suffix,
5576                  enum machine_mode mode)
5577 {
5578   int maxsize = 2 * BITS_PER_WORD;
5579   int minsize = BITS_PER_WORD;
5580
5581   if (GET_MODE_CLASS (mode) != MODE_INT)
5582     return;
5583   if (maxsize < LONG_LONG_TYPE_SIZE)
5584     maxsize = LONG_LONG_TYPE_SIZE;
5585   if (minsize > INT_TYPE_SIZE
5586       && (trapv_binoptab_p (optable)
5587           || trapv_unoptab_p (optable)))
5588     minsize = INT_TYPE_SIZE;
5589   if (GET_MODE_BITSIZE (mode) < minsize
5590       || GET_MODE_BITSIZE (mode) > maxsize)
5591     return;
5592   gen_libfunc (optable, opname, suffix, mode);
5593 }
5594
5595 /* Like gen_libfunc, but verify that FP and set decimal prefix if needed.  */
5596
5597 void
5598 gen_fp_libfunc (optab optable, const char *opname, char suffix,
5599                 enum machine_mode mode)
5600 {
5601   char *dec_opname;
5602
5603   if (GET_MODE_CLASS (mode) == MODE_FLOAT)
5604     gen_libfunc (optable, opname, suffix, mode);
5605   if (DECIMAL_FLOAT_MODE_P (mode))
5606     {
5607       dec_opname = XALLOCAVEC (char, sizeof (DECIMAL_PREFIX) + strlen (opname));
5608       /* For BID support, change the name to have either a bid_ or dpd_ prefix
5609          depending on the low level floating format used.  */
5610       memcpy (dec_opname, DECIMAL_PREFIX, sizeof (DECIMAL_PREFIX) - 1);
5611       strcpy (dec_opname + sizeof (DECIMAL_PREFIX) - 1, opname);
5612       gen_libfunc (optable, dec_opname, suffix, mode);
5613     }
5614 }
5615
5616 /* Like gen_libfunc, but verify that fixed-point operation is involved.  */
5617
5618 void
5619 gen_fixed_libfunc (optab optable, const char *opname, char suffix,
5620                    enum machine_mode mode)
5621 {
5622   if (!ALL_FIXED_POINT_MODE_P (mode))
5623     return;
5624   gen_libfunc (optable, opname, suffix, mode);
5625 }
5626
5627 /* Like gen_libfunc, but verify that signed fixed-point operation is
5628    involved.  */
5629
5630 void
5631 gen_signed_fixed_libfunc (optab optable, const char *opname, char suffix,
5632                           enum machine_mode mode)
5633 {
5634   if (!SIGNED_FIXED_POINT_MODE_P (mode))
5635     return;
5636   gen_libfunc (optable, opname, suffix, mode);
5637 }
5638
5639 /* Like gen_libfunc, but verify that unsigned fixed-point operation is
5640    involved.  */
5641
5642 void
5643 gen_unsigned_fixed_libfunc (optab optable, const char *opname, char suffix,
5644                             enum machine_mode mode)
5645 {
5646   if (!UNSIGNED_FIXED_POINT_MODE_P (mode))
5647     return;
5648   gen_libfunc (optable, opname, suffix, mode);
5649 }
5650
5651 /* Like gen_libfunc, but verify that FP or INT operation is involved.  */
5652
5653 void
5654 gen_int_fp_libfunc (optab optable, const char *name, char suffix,
5655                     enum machine_mode mode)
5656 {
5657   if (DECIMAL_FLOAT_MODE_P (mode) || GET_MODE_CLASS (mode) == MODE_FLOAT)
5658     gen_fp_libfunc (optable, name, suffix, mode);
5659   if (INTEGRAL_MODE_P (mode))
5660     gen_int_libfunc (optable, name, suffix, mode);
5661 }
5662
5663 /* Like gen_libfunc, but verify that FP or INT operation is involved
5664    and add 'v' suffix for integer operation.  */
5665
5666 void
5667 gen_intv_fp_libfunc (optab optable, const char *name, char suffix,
5668                      enum machine_mode mode)
5669 {
5670   if (DECIMAL_FLOAT_MODE_P (mode) || GET_MODE_CLASS (mode) == MODE_FLOAT)
5671     gen_fp_libfunc (optable, name, suffix, mode);
5672   if (GET_MODE_CLASS (mode) == MODE_INT)
5673     {
5674       int len = strlen (name);
5675       char *v_name = XALLOCAVEC (char, len + 2);
5676       strcpy (v_name, name);
5677       v_name[len] = 'v';
5678       v_name[len + 1] = 0;
5679       gen_int_libfunc (optable, v_name, suffix, mode);
5680     }
5681 }
5682
5683 /* Like gen_libfunc, but verify that FP or INT or FIXED operation is
5684    involved.  */
5685
5686 void
5687 gen_int_fp_fixed_libfunc (optab optable, const char *name, char suffix,
5688                           enum machine_mode mode)
5689 {
5690   if (DECIMAL_FLOAT_MODE_P (mode) || GET_MODE_CLASS (mode) == MODE_FLOAT)
5691     gen_fp_libfunc (optable, name, suffix, mode);
5692   if (INTEGRAL_MODE_P (mode))
5693     gen_int_libfunc (optable, name, suffix, mode);
5694   if (ALL_FIXED_POINT_MODE_P (mode))
5695     gen_fixed_libfunc (optable, name, suffix, mode);
5696 }
5697
5698 /* Like gen_libfunc, but verify that FP or INT or signed FIXED operation is
5699    involved.  */
5700
5701 void
5702 gen_int_fp_signed_fixed_libfunc (optab optable, const char *name, char suffix,
5703                                  enum machine_mode mode)
5704 {
5705   if (DECIMAL_FLOAT_MODE_P (mode) || GET_MODE_CLASS (mode) == MODE_FLOAT)
5706     gen_fp_libfunc (optable, name, suffix, mode);
5707   if (INTEGRAL_MODE_P (mode))
5708     gen_int_libfunc (optable, name, suffix, mode);
5709   if (SIGNED_FIXED_POINT_MODE_P (mode))
5710     gen_signed_fixed_libfunc (optable, name, suffix, mode);
5711 }
5712
5713 /* Like gen_libfunc, but verify that INT or FIXED operation is
5714    involved.  */
5715
5716 void
5717 gen_int_fixed_libfunc (optab optable, const char *name, char suffix,
5718                        enum machine_mode mode)
5719 {
5720   if (INTEGRAL_MODE_P (mode))
5721     gen_int_libfunc (optable, name, suffix, mode);
5722   if (ALL_FIXED_POINT_MODE_P (mode))
5723     gen_fixed_libfunc (optable, name, suffix, mode);
5724 }
5725
5726 /* Like gen_libfunc, but verify that INT or signed FIXED operation is
5727    involved.  */
5728
5729 void
5730 gen_int_signed_fixed_libfunc (optab optable, const char *name, char suffix,
5731                               enum machine_mode mode)
5732 {
5733   if (INTEGRAL_MODE_P (mode))
5734     gen_int_libfunc (optable, name, suffix, mode);
5735   if (SIGNED_FIXED_POINT_MODE_P (mode))
5736     gen_signed_fixed_libfunc (optable, name, suffix, mode);
5737 }
5738
5739 /* Like gen_libfunc, but verify that INT or unsigned FIXED operation is
5740    involved.  */
5741
5742 void
5743 gen_int_unsigned_fixed_libfunc (optab optable, const char *name, char suffix,
5744                                 enum machine_mode mode)
5745 {
5746   if (INTEGRAL_MODE_P (mode))
5747     gen_int_libfunc (optable, name, suffix, mode);
5748   if (UNSIGNED_FIXED_POINT_MODE_P (mode))
5749     gen_unsigned_fixed_libfunc (optable, name, suffix, mode);
5750 }
5751
5752 /* Initialize the libfunc fields of an entire group of entries of an
5753    inter-mode-class conversion optab.  The string formation rules are
5754    similar to the ones for init_libfuncs, above, but instead of having
5755    a mode name and an operand count these functions have two mode names
5756    and no operand count.  */
5757
5758 void
5759 gen_interclass_conv_libfunc (convert_optab tab,
5760                              const char *opname,
5761                              enum machine_mode tmode,
5762                              enum machine_mode fmode)
5763 {
5764   size_t opname_len = strlen (opname);
5765   size_t mname_len = 0;
5766
5767   const char *fname, *tname;
5768   const char *q;
5769   int prefix_len = targetm.libfunc_gnu_prefix ? 6 : 2;
5770   char *libfunc_name, *suffix;
5771   char *nondec_name, *dec_name, *nondec_suffix, *dec_suffix;
5772   char *p;
5773
5774   /* If this is a decimal conversion, add the current BID vs. DPD prefix that
5775      depends on which underlying decimal floating point format is used.  */
5776   const size_t dec_len = sizeof (DECIMAL_PREFIX) - 1;
5777
5778   mname_len = strlen (GET_MODE_NAME (tmode)) + strlen (GET_MODE_NAME (fmode));
5779
5780   nondec_name = XALLOCAVEC (char, prefix_len + opname_len + mname_len + 1 + 1);
5781   nondec_name[0] = '_';
5782   nondec_name[1] = '_';
5783   if (targetm.libfunc_gnu_prefix)
5784     {
5785       nondec_name[2] = 'g';
5786       nondec_name[3] = 'n';
5787       nondec_name[4] = 'u';
5788       nondec_name[5] = '_';
5789     }
5790
5791   memcpy (&nondec_name[prefix_len], opname, opname_len);
5792   nondec_suffix = nondec_name + opname_len + prefix_len;
5793
5794   dec_name = XALLOCAVEC (char, 2 + dec_len + opname_len + mname_len + 1 + 1);
5795   dec_name[0] = '_';
5796   dec_name[1] = '_';
5797   memcpy (&dec_name[2], DECIMAL_PREFIX, dec_len);
5798   memcpy (&dec_name[2+dec_len], opname, opname_len);
5799   dec_suffix = dec_name + dec_len + opname_len + 2;
5800
5801   fname = GET_MODE_NAME (fmode);
5802   tname = GET_MODE_NAME (tmode);
5803
5804   if (DECIMAL_FLOAT_MODE_P (fmode) || DECIMAL_FLOAT_MODE_P (tmode))
5805     {
5806       libfunc_name = dec_name;
5807       suffix = dec_suffix;
5808     }
5809   else
5810     {
5811       libfunc_name = nondec_name;
5812       suffix = nondec_suffix;
5813     }
5814
5815   p = suffix;
5816   for (q = fname; *q; p++, q++)
5817     *p = TOLOWER (*q);
5818   for (q = tname; *q; p++, q++)
5819     *p = TOLOWER (*q);
5820
5821   *p = '\0';
5822
5823   set_conv_libfunc (tab, tmode, fmode,
5824                     ggc_alloc_string (libfunc_name, p - libfunc_name));
5825 }
5826
5827 /* Same as gen_interclass_conv_libfunc but verify that we are producing
5828    int->fp conversion.  */
5829
5830 void
5831 gen_int_to_fp_conv_libfunc (convert_optab tab,
5832                             const char *opname,
5833                             enum machine_mode tmode,
5834                             enum machine_mode fmode)
5835 {
5836   if (GET_MODE_CLASS (fmode) != MODE_INT)
5837     return;
5838   if (GET_MODE_CLASS (tmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (tmode))
5839     return;
5840   gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
5841 }
5842
5843 /* ufloat_optab is special by using floatun for FP and floatuns decimal fp
5844    naming scheme.  */
5845
5846 void
5847 gen_ufloat_conv_libfunc (convert_optab tab,
5848                          const char *opname ATTRIBUTE_UNUSED,
5849                          enum machine_mode tmode,
5850                          enum machine_mode fmode)
5851 {
5852   if (DECIMAL_FLOAT_MODE_P (tmode))
5853     gen_int_to_fp_conv_libfunc (tab, "floatuns", tmode, fmode);
5854   else
5855     gen_int_to_fp_conv_libfunc (tab, "floatun", tmode, fmode);
5856 }
5857
5858 /* Same as gen_interclass_conv_libfunc but verify that we are producing
5859    fp->int conversion.  */
5860
5861 void
5862 gen_int_to_fp_nondecimal_conv_libfunc (convert_optab tab,
5863                                        const char *opname,
5864                                        enum machine_mode tmode,
5865                                        enum machine_mode fmode)
5866 {
5867   if (GET_MODE_CLASS (fmode) != MODE_INT)
5868     return;
5869   if (GET_MODE_CLASS (tmode) != MODE_FLOAT)
5870     return;
5871   gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
5872 }
5873
5874 /* Same as gen_interclass_conv_libfunc but verify that we are producing
5875    fp->int conversion with no decimal floating point involved.  */
5876
5877 void
5878 gen_fp_to_int_conv_libfunc (convert_optab tab,
5879                             const char *opname,
5880                             enum machine_mode tmode,
5881                             enum machine_mode fmode)
5882 {
5883   if (GET_MODE_CLASS (fmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (fmode))
5884     return;
5885   if (GET_MODE_CLASS (tmode) != MODE_INT)
5886     return;
5887   gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
5888 }
5889
5890 /* Initialize the libfunc fields of an of an intra-mode-class conversion optab.
5891    The string formation rules are
5892    similar to the ones for init_libfunc, above.  */
5893
5894 void
5895 gen_intraclass_conv_libfunc (convert_optab tab, const char *opname,
5896                              enum machine_mode tmode, enum machine_mode fmode)
5897 {
5898   size_t opname_len = strlen (opname);
5899   size_t mname_len = 0;
5900
5901   const char *fname, *tname;
5902   const char *q;
5903   int prefix_len = targetm.libfunc_gnu_prefix ? 6 : 2;
5904   char *nondec_name, *dec_name, *nondec_suffix, *dec_suffix;
5905   char *libfunc_name, *suffix;
5906   char *p;
5907
5908   /* If this is a decimal conversion, add the current BID vs. DPD prefix that
5909      depends on which underlying decimal floating point format is used.  */
5910   const size_t dec_len = sizeof (DECIMAL_PREFIX) - 1;
5911
5912   mname_len = strlen (GET_MODE_NAME (tmode)) + strlen (GET_MODE_NAME (fmode));
5913
5914   nondec_name = XALLOCAVEC (char, 2 + opname_len + mname_len + 1 + 1);
5915   nondec_name[0] = '_';
5916   nondec_name[1] = '_';
5917   if (targetm.libfunc_gnu_prefix)
5918     {
5919       nondec_name[2] = 'g';
5920       nondec_name[3] = 'n';
5921       nondec_name[4] = 'u';
5922       nondec_name[5] = '_';
5923     }
5924   memcpy (&nondec_name[prefix_len], opname, opname_len);
5925   nondec_suffix = nondec_name + opname_len + prefix_len;
5926
5927   dec_name = XALLOCAVEC (char, 2 + dec_len + opname_len + mname_len + 1 + 1);
5928   dec_name[0] = '_';
5929   dec_name[1] = '_';
5930   memcpy (&dec_name[2], DECIMAL_PREFIX, dec_len);
5931   memcpy (&dec_name[2 + dec_len], opname, opname_len);
5932   dec_suffix = dec_name + dec_len + opname_len + 2;
5933
5934   fname = GET_MODE_NAME (fmode);
5935   tname = GET_MODE_NAME (tmode);
5936
5937   if (DECIMAL_FLOAT_MODE_P (fmode) || DECIMAL_FLOAT_MODE_P (tmode))
5938     {
5939       libfunc_name = dec_name;
5940       suffix = dec_suffix;
5941     }
5942   else
5943     {
5944       libfunc_name = nondec_name;
5945       suffix = nondec_suffix;
5946     }
5947
5948   p = suffix;
5949   for (q = fname; *q; p++, q++)
5950     *p = TOLOWER (*q);
5951   for (q = tname; *q; p++, q++)
5952     *p = TOLOWER (*q);
5953
5954   *p++ = '2';
5955   *p = '\0';
5956
5957   set_conv_libfunc (tab, tmode, fmode,
5958                     ggc_alloc_string (libfunc_name, p - libfunc_name));
5959 }
5960
5961 /* Pick proper libcall for trunc_optab.  We need to chose if we do
5962    truncation or extension and interclass or intraclass.  */
5963
5964 void
5965 gen_trunc_conv_libfunc (convert_optab tab,
5966                          const char *opname,
5967                          enum machine_mode tmode,
5968                          enum machine_mode fmode)
5969 {
5970   if (GET_MODE_CLASS (tmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (tmode))
5971     return;
5972   if (GET_MODE_CLASS (fmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (fmode))
5973     return;
5974   if (tmode == fmode)
5975     return;
5976
5977   if ((GET_MODE_CLASS (tmode) == MODE_FLOAT && DECIMAL_FLOAT_MODE_P (fmode))
5978       || (GET_MODE_CLASS (fmode) == MODE_FLOAT && DECIMAL_FLOAT_MODE_P (tmode)))
5979      gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
5980
5981   if (GET_MODE_PRECISION (fmode) <= GET_MODE_PRECISION (tmode))
5982     return;
5983
5984   if ((GET_MODE_CLASS (tmode) == MODE_FLOAT
5985        && GET_MODE_CLASS (fmode) == MODE_FLOAT)
5986       || (DECIMAL_FLOAT_MODE_P (fmode) && DECIMAL_FLOAT_MODE_P (tmode)))
5987     gen_intraclass_conv_libfunc (tab, opname, tmode, fmode);
5988 }
5989
5990 /* Pick proper libcall for extend_optab.  We need to chose if we do
5991    truncation or extension and interclass or intraclass.  */
5992
5993 void
5994 gen_extend_conv_libfunc (convert_optab tab,
5995                          const char *opname ATTRIBUTE_UNUSED,
5996                          enum machine_mode tmode,
5997                          enum machine_mode fmode)
5998 {
5999   if (GET_MODE_CLASS (tmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (tmode))
6000     return;
6001   if (GET_MODE_CLASS (fmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (fmode))
6002     return;
6003   if (tmode == fmode)
6004     return;
6005
6006   if ((GET_MODE_CLASS (tmode) == MODE_FLOAT && DECIMAL_FLOAT_MODE_P (fmode))
6007       || (GET_MODE_CLASS (fmode) == MODE_FLOAT && DECIMAL_FLOAT_MODE_P (tmode)))
6008      gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
6009
6010   if (GET_MODE_PRECISION (fmode) > GET_MODE_PRECISION (tmode))
6011     return;
6012
6013   if ((GET_MODE_CLASS (tmode) == MODE_FLOAT
6014        && GET_MODE_CLASS (fmode) == MODE_FLOAT)
6015       || (DECIMAL_FLOAT_MODE_P (fmode) && DECIMAL_FLOAT_MODE_P (tmode)))
6016     gen_intraclass_conv_libfunc (tab, opname, tmode, fmode);
6017 }
6018
6019 /* Pick proper libcall for fract_optab.  We need to chose if we do
6020    interclass or intraclass.  */
6021
6022 void
6023 gen_fract_conv_libfunc (convert_optab tab,
6024                         const char *opname,
6025                         enum machine_mode tmode,
6026                         enum machine_mode fmode)
6027 {
6028   if (tmode == fmode)
6029     return;
6030   if (!(ALL_FIXED_POINT_MODE_P (tmode) || ALL_FIXED_POINT_MODE_P (fmode)))
6031     return;
6032
6033   if (GET_MODE_CLASS (tmode) == GET_MODE_CLASS (fmode))
6034     gen_intraclass_conv_libfunc (tab, opname, tmode, fmode);
6035   else
6036     gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
6037 }
6038
6039 /* Pick proper libcall for fractuns_optab.  */
6040
6041 void
6042 gen_fractuns_conv_libfunc (convert_optab tab,
6043                            const char *opname,
6044                            enum machine_mode tmode,
6045                            enum machine_mode fmode)
6046 {
6047   if (tmode == fmode)
6048     return;
6049   /* One mode must be a fixed-point mode, and the other must be an integer
6050      mode. */
6051   if (!((ALL_FIXED_POINT_MODE_P (tmode) && GET_MODE_CLASS (fmode) == MODE_INT)
6052         || (ALL_FIXED_POINT_MODE_P (fmode)
6053             && GET_MODE_CLASS (tmode) == MODE_INT)))
6054     return;
6055
6056   gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
6057 }
6058
6059 /* Pick proper libcall for satfract_optab.  We need to chose if we do
6060    interclass or intraclass.  */
6061
6062 void
6063 gen_satfract_conv_libfunc (convert_optab tab,
6064                            const char *opname,
6065                            enum machine_mode tmode,
6066                            enum machine_mode fmode)
6067 {
6068   if (tmode == fmode)
6069     return;
6070   /* TMODE must be a fixed-point mode.  */
6071   if (!ALL_FIXED_POINT_MODE_P (tmode))
6072     return;
6073
6074   if (GET_MODE_CLASS (tmode) == GET_MODE_CLASS (fmode))
6075     gen_intraclass_conv_libfunc (tab, opname, tmode, fmode);
6076   else
6077     gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
6078 }
6079
6080 /* Pick proper libcall for satfractuns_optab.  */
6081
6082 void
6083 gen_satfractuns_conv_libfunc (convert_optab tab,
6084                               const char *opname,
6085                               enum machine_mode tmode,
6086                               enum machine_mode fmode)
6087 {
6088   if (tmode == fmode)
6089     return;
6090   /* TMODE must be a fixed-point mode, and FMODE must be an integer mode. */
6091   if (!(ALL_FIXED_POINT_MODE_P (tmode) && GET_MODE_CLASS (fmode) == MODE_INT))
6092     return;
6093
6094   gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
6095 }
6096
6097 /* Hashtable callbacks for libfunc_decls.  */
6098
6099 struct libfunc_decl_hasher : ggc_hasher<tree>
6100 {
6101   static hashval_t
6102   hash (tree entry)
6103   {
6104     return IDENTIFIER_HASH_VALUE (DECL_NAME (entry));
6105   }
6106
6107   static bool
6108   equal (tree decl, tree name)
6109   {
6110     return DECL_NAME (decl) == name;
6111   }
6112 };
6113
6114 /* A table of previously-created libfuncs, hashed by name.  */
6115 static GTY (()) hash_table<libfunc_decl_hasher> *libfunc_decls;
6116
6117 /* Build a decl for a libfunc named NAME. */
6118
6119 tree
6120 build_libfunc_function (const char *name)
6121 {
6122   tree decl = build_decl (UNKNOWN_LOCATION, FUNCTION_DECL,
6123                           get_identifier (name),
6124                           build_function_type (integer_type_node, NULL_TREE));
6125   /* ??? We don't have any type information except for this is
6126      a function.  Pretend this is "int foo()".  */
6127   DECL_ARTIFICIAL (decl) = 1;
6128   DECL_EXTERNAL (decl) = 1;
6129   TREE_PUBLIC (decl) = 1;
6130   gcc_assert (DECL_ASSEMBLER_NAME (decl));
6131
6132   /* Zap the nonsensical SYMBOL_REF_DECL for this.  What we're left with
6133      are the flags assigned by targetm.encode_section_info.  */
6134   SET_SYMBOL_REF_DECL (XEXP (DECL_RTL (decl), 0), NULL);
6135
6136   return decl;
6137 }
6138
6139 rtx
6140 init_one_libfunc (const char *name)
6141 {
6142   tree id, decl;
6143   hashval_t hash;
6144
6145   if (libfunc_decls == NULL)
6146     libfunc_decls = hash_table<libfunc_decl_hasher>::create_ggc (37);
6147
6148   /* See if we have already created a libfunc decl for this function.  */
6149   id = get_identifier (name);
6150   hash = IDENTIFIER_HASH_VALUE (id);
6151   tree *slot = libfunc_decls->find_slot_with_hash (id, hash, INSERT);
6152   decl = *slot;
6153   if (decl == NULL)
6154     {
6155       /* Create a new decl, so that it can be passed to
6156          targetm.encode_section_info.  */
6157       decl = build_libfunc_function (name);
6158       *slot = decl;
6159     }
6160   return XEXP (DECL_RTL (decl), 0);
6161 }
6162
6163 /* Adjust the assembler name of libfunc NAME to ASMSPEC.  */
6164
6165 rtx
6166 set_user_assembler_libfunc (const char *name, const char *asmspec)
6167 {
6168   tree id, decl;
6169   hashval_t hash;
6170
6171   id = get_identifier (name);
6172   hash = IDENTIFIER_HASH_VALUE (id);
6173   tree *slot = libfunc_decls->find_slot_with_hash (id, hash, NO_INSERT);
6174   gcc_assert (slot);
6175   decl = (tree) *slot;
6176   set_user_assembler_name (decl, asmspec);
6177   return XEXP (DECL_RTL (decl), 0);
6178 }
6179
6180 /* Call this to reset the function entry for one optab (OPTABLE) in mode
6181    MODE to NAME, which should be either 0 or a string constant.  */
6182 void
6183 set_optab_libfunc (optab op, enum machine_mode mode, const char *name)
6184 {
6185   rtx val;
6186   struct libfunc_entry e;
6187   struct libfunc_entry **slot;
6188
6189   e.op = op;
6190   e.mode1 = mode;
6191   e.mode2 = VOIDmode;
6192
6193   if (name)
6194     val = init_one_libfunc (name);
6195   else
6196     val = 0;
6197   slot = libfunc_hash->find_slot (&e, INSERT);
6198   if (*slot == NULL)
6199     *slot = ggc_alloc<libfunc_entry> ();
6200   (*slot)->op = op;
6201   (*slot)->mode1 = mode;
6202   (*slot)->mode2 = VOIDmode;
6203   (*slot)->libfunc = val;
6204 }
6205
6206 /* Call this to reset the function entry for one conversion optab
6207    (OPTABLE) from mode FMODE to mode TMODE to NAME, which should be
6208    either 0 or a string constant.  */
6209 void
6210 set_conv_libfunc (convert_optab optab, enum machine_mode tmode,
6211                   enum machine_mode fmode, const char *name)
6212 {
6213   rtx val;
6214   struct libfunc_entry e;
6215   struct libfunc_entry **slot;
6216
6217   e.op = optab;
6218   e.mode1 = tmode;
6219   e.mode2 = fmode;
6220
6221   if (name)
6222     val = init_one_libfunc (name);
6223   else
6224     val = 0;
6225   slot = libfunc_hash->find_slot (&e, INSERT);
6226   if (*slot == NULL)
6227     *slot = ggc_alloc<libfunc_entry> ();
6228   (*slot)->op = optab;
6229   (*slot)->mode1 = tmode;
6230   (*slot)->mode2 = fmode;
6231   (*slot)->libfunc = val;
6232 }
6233
6234 /* Call this to initialize the contents of the optabs
6235    appropriately for the current target machine.  */
6236
6237 void
6238 init_optabs (void)
6239 {
6240   if (libfunc_hash)
6241     libfunc_hash->empty ();
6242   else
6243     libfunc_hash = hash_table<libfunc_hasher>::create_ggc (10);
6244
6245   /* Fill in the optabs with the insns we support.  */
6246   init_all_optabs (this_fn_optabs);
6247
6248   /* The ffs function operates on `int'.  Fall back on it if we do not
6249      have a libgcc2 function for that width.  */
6250   if (INT_TYPE_SIZE < BITS_PER_WORD)
6251     set_optab_libfunc (ffs_optab, mode_for_size (INT_TYPE_SIZE, MODE_INT, 0),
6252                        "ffs");
6253
6254   /* Explicitly initialize the bswap libfuncs since we need them to be
6255      valid for things other than word_mode.  */
6256   if (targetm.libfunc_gnu_prefix)
6257     {
6258       set_optab_libfunc (bswap_optab, SImode, "__gnu_bswapsi2");
6259       set_optab_libfunc (bswap_optab, DImode, "__gnu_bswapdi2");
6260     }
6261   else
6262     {
6263       set_optab_libfunc (bswap_optab, SImode, "__bswapsi2");
6264       set_optab_libfunc (bswap_optab, DImode, "__bswapdi2");
6265     }
6266
6267   /* Use cabs for double complex abs, since systems generally have cabs.
6268      Don't define any libcall for float complex, so that cabs will be used.  */
6269   if (complex_double_type_node)
6270     set_optab_libfunc (abs_optab, TYPE_MODE (complex_double_type_node),
6271                        "cabs");
6272
6273   abort_libfunc = init_one_libfunc ("abort");
6274   memcpy_libfunc = init_one_libfunc ("memcpy");
6275   memmove_libfunc = init_one_libfunc ("memmove");
6276   memcmp_libfunc = init_one_libfunc ("memcmp");
6277   memset_libfunc = init_one_libfunc ("memset");
6278   setbits_libfunc = init_one_libfunc ("__setbits");
6279
6280 #ifndef DONT_USE_BUILTIN_SETJMP
6281   setjmp_libfunc = init_one_libfunc ("__builtin_setjmp");
6282   longjmp_libfunc = init_one_libfunc ("__builtin_longjmp");
6283 #else
6284   setjmp_libfunc = init_one_libfunc ("setjmp");
6285   longjmp_libfunc = init_one_libfunc ("longjmp");
6286 #endif
6287   unwind_sjlj_register_libfunc = init_one_libfunc ("_Unwind_SjLj_Register");
6288   unwind_sjlj_unregister_libfunc
6289     = init_one_libfunc ("_Unwind_SjLj_Unregister");
6290
6291   /* For function entry/exit instrumentation.  */
6292   profile_function_entry_libfunc
6293     = init_one_libfunc ("__cyg_profile_func_enter");
6294   profile_function_exit_libfunc
6295     = init_one_libfunc ("__cyg_profile_func_exit");
6296
6297   gcov_flush_libfunc = init_one_libfunc ("__gcov_flush");
6298
6299   /* Allow the target to add more libcalls or rename some, etc.  */
6300   targetm.init_libfuncs ();
6301 }
6302
6303 /* Use the current target and options to initialize
6304    TREE_OPTIMIZATION_OPTABS (OPTNODE).  */
6305
6306 void
6307 init_tree_optimization_optabs (tree optnode)
6308 {
6309   /* Quick exit if we have already computed optabs for this target.  */
6310   if (TREE_OPTIMIZATION_BASE_OPTABS (optnode) == this_target_optabs)
6311     return;
6312
6313   /* Forget any previous information and set up for the current target.  */
6314   TREE_OPTIMIZATION_BASE_OPTABS (optnode) = this_target_optabs;
6315   struct target_optabs *tmp_optabs = (struct target_optabs *)
6316     TREE_OPTIMIZATION_OPTABS (optnode);
6317   if (tmp_optabs)
6318     memset (tmp_optabs, 0, sizeof (struct target_optabs));
6319   else
6320     tmp_optabs = ggc_alloc<target_optabs> ();
6321
6322   /* Generate a new set of optabs into tmp_optabs.  */
6323   init_all_optabs (tmp_optabs);
6324
6325   /* If the optabs changed, record it.  */
6326   if (memcmp (tmp_optabs, this_target_optabs, sizeof (struct target_optabs)))
6327     TREE_OPTIMIZATION_OPTABS (optnode) = tmp_optabs;
6328   else
6329     {
6330       TREE_OPTIMIZATION_OPTABS (optnode) = NULL;
6331       ggc_free (tmp_optabs);
6332     }
6333 }
6334
6335 /* A helper function for init_sync_libfuncs.  Using the basename BASE,
6336    install libfuncs into TAB for BASE_N for 1 <= N <= MAX.  */
6337
6338 static void
6339 init_sync_libfuncs_1 (optab tab, const char *base, int max)
6340 {
6341   enum machine_mode mode;
6342   char buf[64];
6343   size_t len = strlen (base);
6344   int i;
6345
6346   gcc_assert (max <= 8);
6347   gcc_assert (len + 3 < sizeof (buf));
6348
6349   memcpy (buf, base, len);
6350   buf[len] = '_';
6351   buf[len + 1] = '0';
6352   buf[len + 2] = '\0';
6353
6354   mode = QImode;
6355   for (i = 1; i <= max; i *= 2)
6356     {
6357       buf[len + 1] = '0' + i;
6358       set_optab_libfunc (tab, mode, buf);
6359       mode = GET_MODE_2XWIDER_MODE (mode);
6360     }
6361 }
6362
6363 void
6364 init_sync_libfuncs (int max)
6365 {
6366   if (!flag_sync_libcalls)
6367     return;
6368
6369   init_sync_libfuncs_1 (sync_compare_and_swap_optab,
6370                         "__sync_val_compare_and_swap", max);
6371   init_sync_libfuncs_1 (sync_lock_test_and_set_optab,
6372                         "__sync_lock_test_and_set", max);
6373
6374   init_sync_libfuncs_1 (sync_old_add_optab, "__sync_fetch_and_add", max);
6375   init_sync_libfuncs_1 (sync_old_sub_optab, "__sync_fetch_and_sub", max);
6376   init_sync_libfuncs_1 (sync_old_ior_optab, "__sync_fetch_and_or", max);
6377   init_sync_libfuncs_1 (sync_old_and_optab, "__sync_fetch_and_and", max);
6378   init_sync_libfuncs_1 (sync_old_xor_optab, "__sync_fetch_and_xor", max);
6379   init_sync_libfuncs_1 (sync_old_nand_optab, "__sync_fetch_and_nand", max);
6380
6381   init_sync_libfuncs_1 (sync_new_add_optab, "__sync_add_and_fetch", max);
6382   init_sync_libfuncs_1 (sync_new_sub_optab, "__sync_sub_and_fetch", max);
6383   init_sync_libfuncs_1 (sync_new_ior_optab, "__sync_or_and_fetch", max);
6384   init_sync_libfuncs_1 (sync_new_and_optab, "__sync_and_and_fetch", max);
6385   init_sync_libfuncs_1 (sync_new_xor_optab, "__sync_xor_and_fetch", max);
6386   init_sync_libfuncs_1 (sync_new_nand_optab, "__sync_nand_and_fetch", max);
6387 }
6388
6389 /* Print information about the current contents of the optabs on
6390    STDERR.  */
6391
6392 DEBUG_FUNCTION void
6393 debug_optab_libfuncs (void)
6394 {
6395   int i, j, k;
6396
6397   /* Dump the arithmetic optabs.  */
6398   for (i = FIRST_NORM_OPTAB; i <= LAST_NORMLIB_OPTAB; ++i)
6399     for (j = 0; j < NUM_MACHINE_MODES; ++j)
6400       {
6401         rtx l = optab_libfunc ((optab) i, (enum machine_mode) j);
6402         if (l)
6403           {
6404             gcc_assert (GET_CODE (l) == SYMBOL_REF);
6405             fprintf (stderr, "%s\t%s:\t%s\n",
6406                      GET_RTX_NAME (optab_to_code ((optab) i)),
6407                      GET_MODE_NAME (j),
6408                      XSTR (l, 0));
6409           }
6410       }
6411
6412   /* Dump the conversion optabs.  */
6413   for (i = FIRST_CONV_OPTAB; i <= LAST_CONVLIB_OPTAB; ++i)
6414     for (j = 0; j < NUM_MACHINE_MODES; ++j)
6415       for (k = 0; k < NUM_MACHINE_MODES; ++k)
6416         {
6417           rtx l = convert_optab_libfunc ((optab) i, (enum machine_mode) j,
6418                                          (enum machine_mode) k);
6419           if (l)
6420             {
6421               gcc_assert (GET_CODE (l) == SYMBOL_REF);
6422               fprintf (stderr, "%s\t%s\t%s:\t%s\n",
6423                        GET_RTX_NAME (optab_to_code ((optab) i)),
6424                        GET_MODE_NAME (j),
6425                        GET_MODE_NAME (k),
6426                        XSTR (l, 0));
6427             }
6428         }
6429 }
6430
6431 \f
6432 /* Generate insns to trap with code TCODE if OP1 and OP2 satisfy condition
6433    CODE.  Return 0 on failure.  */
6434
6435 rtx
6436 gen_cond_trap (enum rtx_code code, rtx op1, rtx op2, rtx tcode)
6437 {
6438   enum machine_mode mode = GET_MODE (op1);
6439   enum insn_code icode;
6440   rtx insn;
6441   rtx trap_rtx;
6442
6443   if (mode == VOIDmode)
6444     return 0;
6445
6446   icode = optab_handler (ctrap_optab, mode);
6447   if (icode == CODE_FOR_nothing)
6448     return 0;
6449
6450   /* Some targets only accept a zero trap code.  */
6451   if (!insn_operand_matches (icode, 3, tcode))
6452     return 0;
6453
6454   do_pending_stack_adjust ();
6455   start_sequence ();
6456   prepare_cmp_insn (op1, op2, code, NULL_RTX, false, OPTAB_DIRECT,
6457                     &trap_rtx, &mode);
6458   if (!trap_rtx)
6459     insn = NULL_RTX;
6460   else
6461     insn = GEN_FCN (icode) (trap_rtx, XEXP (trap_rtx, 0), XEXP (trap_rtx, 1),
6462                             tcode);
6463
6464   /* If that failed, then give up.  */
6465   if (insn == 0)
6466     {
6467       end_sequence ();
6468       return 0;
6469     }
6470
6471   emit_insn (insn);
6472   insn = get_insns ();
6473   end_sequence ();
6474   return insn;
6475 }
6476
6477 /* Return rtx code for TCODE. Use UNSIGNEDP to select signed
6478    or unsigned operation code.  */
6479
6480 static enum rtx_code
6481 get_rtx_code (enum tree_code tcode, bool unsignedp)
6482 {
6483   enum rtx_code code;
6484   switch (tcode)
6485     {
6486     case EQ_EXPR:
6487       code = EQ;
6488       break;
6489     case NE_EXPR:
6490       code = NE;
6491       break;
6492     case LT_EXPR:
6493       code = unsignedp ? LTU : LT;
6494       break;
6495     case LE_EXPR:
6496       code = unsignedp ? LEU : LE;
6497       break;
6498     case GT_EXPR:
6499       code = unsignedp ? GTU : GT;
6500       break;
6501     case GE_EXPR:
6502       code = unsignedp ? GEU : GE;
6503       break;
6504
6505     case UNORDERED_EXPR:
6506       code = UNORDERED;
6507       break;
6508     case ORDERED_EXPR:
6509       code = ORDERED;
6510       break;
6511     case UNLT_EXPR:
6512       code = UNLT;
6513       break;
6514     case UNLE_EXPR:
6515       code = UNLE;
6516       break;
6517     case UNGT_EXPR:
6518       code = UNGT;
6519       break;
6520     case UNGE_EXPR:
6521       code = UNGE;
6522       break;
6523     case UNEQ_EXPR:
6524       code = UNEQ;
6525       break;
6526     case LTGT_EXPR:
6527       code = LTGT;
6528       break;
6529
6530     default:
6531       gcc_unreachable ();
6532     }
6533   return code;
6534 }
6535
6536 /* Return comparison rtx for COND. Use UNSIGNEDP to select signed or
6537    unsigned operators. Do not generate compare instruction.  */
6538
6539 static rtx
6540 vector_compare_rtx (enum tree_code tcode, tree t_op0, tree t_op1,
6541                     bool unsignedp, enum insn_code icode)
6542 {
6543   struct expand_operand ops[2];
6544   rtx rtx_op0, rtx_op1;
6545   enum rtx_code rcode = get_rtx_code (tcode, unsignedp);
6546
6547   gcc_assert (TREE_CODE_CLASS (tcode) == tcc_comparison);
6548
6549   /* Expand operands.  */
6550   rtx_op0 = expand_expr (t_op0, NULL_RTX, TYPE_MODE (TREE_TYPE (t_op0)),
6551                          EXPAND_STACK_PARM);
6552   rtx_op1 = expand_expr (t_op1, NULL_RTX, TYPE_MODE (TREE_TYPE (t_op1)),
6553                          EXPAND_STACK_PARM);
6554
6555   create_input_operand (&ops[0], rtx_op0, GET_MODE (rtx_op0));
6556   create_input_operand (&ops[1], rtx_op1, GET_MODE (rtx_op1));
6557   if (!maybe_legitimize_operands (icode, 4, 2, ops))
6558     gcc_unreachable ();
6559   return gen_rtx_fmt_ee (rcode, VOIDmode, ops[0].value, ops[1].value);
6560 }
6561
6562 /* Return true if VEC_PERM_EXPR can be expanded using SIMD extensions
6563    of the CPU.  SEL may be NULL, which stands for an unknown constant.  */
6564
6565 bool
6566 can_vec_perm_p (enum machine_mode mode, bool variable,
6567                 const unsigned char *sel)
6568 {
6569   enum machine_mode qimode;
6570
6571   /* If the target doesn't implement a vector mode for the vector type,
6572      then no operations are supported.  */
6573   if (!VECTOR_MODE_P (mode))
6574     return false;
6575
6576   if (!variable)
6577     {
6578       if (direct_optab_handler (vec_perm_const_optab, mode) != CODE_FOR_nothing
6579           && (sel == NULL
6580               || targetm.vectorize.vec_perm_const_ok == NULL
6581               || targetm.vectorize.vec_perm_const_ok (mode, sel)))
6582         return true;
6583     }
6584
6585   if (direct_optab_handler (vec_perm_optab, mode) != CODE_FOR_nothing)
6586     return true;
6587
6588   /* We allow fallback to a QI vector mode, and adjust the mask.  */
6589   if (GET_MODE_INNER (mode) == QImode)
6590     return false;
6591   qimode = mode_for_vector (QImode, GET_MODE_SIZE (mode));
6592   if (!VECTOR_MODE_P (qimode))
6593     return false;
6594
6595   /* ??? For completeness, we ought to check the QImode version of
6596       vec_perm_const_optab.  But all users of this implicit lowering
6597       feature implement the variable vec_perm_optab.  */
6598   if (direct_optab_handler (vec_perm_optab, qimode) == CODE_FOR_nothing)
6599     return false;
6600
6601   /* In order to support the lowering of variable permutations,
6602      we need to support shifts and adds.  */
6603   if (variable)
6604     {
6605       if (GET_MODE_UNIT_SIZE (mode) > 2
6606           && optab_handler (ashl_optab, mode) == CODE_FOR_nothing
6607           && optab_handler (vashl_optab, mode) == CODE_FOR_nothing)
6608         return false;
6609       if (optab_handler (add_optab, qimode) == CODE_FOR_nothing)
6610         return false;
6611     }
6612
6613   return true;
6614 }
6615
6616 /* A subroutine of expand_vec_perm for expanding one vec_perm insn.  */
6617
6618 static rtx
6619 expand_vec_perm_1 (enum insn_code icode, rtx target,
6620                    rtx v0, rtx v1, rtx sel)
6621 {
6622   enum machine_mode tmode = GET_MODE (target);
6623   enum machine_mode smode = GET_MODE (sel);
6624   struct expand_operand ops[4];
6625
6626   create_output_operand (&ops[0], target, tmode);
6627   create_input_operand (&ops[3], sel, smode);
6628
6629   /* Make an effort to preserve v0 == v1.  The target expander is able to
6630      rely on this to determine if we're permuting a single input operand.  */
6631   if (rtx_equal_p (v0, v1))
6632     {
6633       if (!insn_operand_matches (icode, 1, v0))
6634         v0 = force_reg (tmode, v0);
6635       gcc_checking_assert (insn_operand_matches (icode, 1, v0));
6636       gcc_checking_assert (insn_operand_matches (icode, 2, v0));
6637
6638       create_fixed_operand (&ops[1], v0);
6639       create_fixed_operand (&ops[2], v0);
6640     }
6641   else
6642     {
6643       create_input_operand (&ops[1], v0, tmode);
6644       create_input_operand (&ops[2], v1, tmode);
6645     }
6646
6647   if (maybe_expand_insn (icode, 4, ops))
6648     return ops[0].value;
6649   return NULL_RTX;
6650 }
6651
6652 /* Generate instructions for vec_perm optab given its mode
6653    and three operands.  */
6654
6655 rtx
6656 expand_vec_perm (enum machine_mode mode, rtx v0, rtx v1, rtx sel, rtx target)
6657 {
6658   enum insn_code icode;
6659   enum machine_mode qimode;
6660   unsigned int i, w, e, u;
6661   rtx tmp, sel_qi = NULL;
6662   rtvec vec;
6663
6664   if (!target || GET_MODE (target) != mode)
6665     target = gen_reg_rtx (mode);
6666
6667   w = GET_MODE_SIZE (mode);
6668   e = GET_MODE_NUNITS (mode);
6669   u = GET_MODE_UNIT_SIZE (mode);
6670
6671   /* Set QIMODE to a different vector mode with byte elements.
6672      If no such mode, or if MODE already has byte elements, use VOIDmode.  */
6673   qimode = VOIDmode;
6674   if (GET_MODE_INNER (mode) != QImode)
6675     {
6676       qimode = mode_for_vector (QImode, w);
6677       if (!VECTOR_MODE_P (qimode))
6678         qimode = VOIDmode;
6679     }
6680
6681   /* If the input is a constant, expand it specially.  */
6682   gcc_assert (GET_MODE_CLASS (GET_MODE (sel)) == MODE_VECTOR_INT);
6683   if (GET_CODE (sel) == CONST_VECTOR)
6684     {
6685       icode = direct_optab_handler (vec_perm_const_optab, mode);
6686       if (icode != CODE_FOR_nothing)
6687         {
6688           tmp = expand_vec_perm_1 (icode, target, v0, v1, sel);
6689           if (tmp)
6690             return tmp;
6691         }
6692
6693       /* Fall back to a constant byte-based permutation.  */
6694       if (qimode != VOIDmode)
6695         {
6696           vec = rtvec_alloc (w);
6697           for (i = 0; i < e; ++i)
6698             {
6699               unsigned int j, this_e;
6700
6701               this_e = INTVAL (CONST_VECTOR_ELT (sel, i));
6702               this_e &= 2 * e - 1;
6703               this_e *= u;
6704
6705               for (j = 0; j < u; ++j)
6706                 RTVEC_ELT (vec, i * u + j) = GEN_INT (this_e + j);
6707             }
6708           sel_qi = gen_rtx_CONST_VECTOR (qimode, vec);
6709
6710           icode = direct_optab_handler (vec_perm_const_optab, qimode);
6711           if (icode != CODE_FOR_nothing)
6712             {
6713               tmp = mode != qimode ? gen_reg_rtx (qimode) : target;
6714               tmp = expand_vec_perm_1 (icode, tmp, gen_lowpart (qimode, v0),
6715                                        gen_lowpart (qimode, v1), sel_qi);
6716               if (tmp)
6717                 return gen_lowpart (mode, tmp);
6718             }
6719         }
6720     }
6721
6722   /* Otherwise expand as a fully variable permuation.  */
6723   icode = direct_optab_handler (vec_perm_optab, mode);
6724   if (icode != CODE_FOR_nothing)
6725     {
6726       tmp = expand_vec_perm_1 (icode, target, v0, v1, sel);
6727       if (tmp)
6728         return tmp;
6729     }
6730
6731   /* As a special case to aid several targets, lower the element-based
6732      permutation to a byte-based permutation and try again.  */
6733   if (qimode == VOIDmode)
6734     return NULL_RTX;
6735   icode = direct_optab_handler (vec_perm_optab, qimode);
6736   if (icode == CODE_FOR_nothing)
6737     return NULL_RTX;
6738
6739   if (sel_qi == NULL)
6740     {
6741       /* Multiply each element by its byte size.  */
6742       enum machine_mode selmode = GET_MODE (sel);
6743       if (u == 2)
6744         sel = expand_simple_binop (selmode, PLUS, sel, sel,
6745                                    sel, 0, OPTAB_DIRECT);
6746       else
6747         sel = expand_simple_binop (selmode, ASHIFT, sel,
6748                                    GEN_INT (exact_log2 (u)),
6749                                    sel, 0, OPTAB_DIRECT);
6750       gcc_assert (sel != NULL);
6751
6752       /* Broadcast the low byte each element into each of its bytes.  */
6753       vec = rtvec_alloc (w);
6754       for (i = 0; i < w; ++i)
6755         {
6756           int this_e = i / u * u;
6757           if (BYTES_BIG_ENDIAN)
6758             this_e += u - 1;
6759           RTVEC_ELT (vec, i) = GEN_INT (this_e);
6760         }
6761       tmp = gen_rtx_CONST_VECTOR (qimode, vec);
6762       sel = gen_lowpart (qimode, sel);
6763       sel = expand_vec_perm (qimode, sel, sel, tmp, NULL);
6764       gcc_assert (sel != NULL);
6765
6766       /* Add the byte offset to each byte element.  */
6767       /* Note that the definition of the indicies here is memory ordering,
6768          so there should be no difference between big and little endian.  */
6769       vec = rtvec_alloc (w);
6770       for (i = 0; i < w; ++i)
6771         RTVEC_ELT (vec, i) = GEN_INT (i % u);
6772       tmp = gen_rtx_CONST_VECTOR (qimode, vec);
6773       sel_qi = expand_simple_binop (qimode, PLUS, sel, tmp,
6774                                     sel, 0, OPTAB_DIRECT);
6775       gcc_assert (sel_qi != NULL);
6776     }
6777
6778   tmp = mode != qimode ? gen_reg_rtx (qimode) : target;
6779   tmp = expand_vec_perm_1 (icode, tmp, gen_lowpart (qimode, v0),
6780                            gen_lowpart (qimode, v1), sel_qi);
6781   if (tmp)
6782     tmp = gen_lowpart (mode, tmp);
6783   return tmp;
6784 }
6785
6786 /* Return insn code for a conditional operator with a comparison in
6787    mode CMODE, unsigned if UNS is true, resulting in a value of mode VMODE.  */
6788
6789 static inline enum insn_code
6790 get_vcond_icode (enum machine_mode vmode, enum machine_mode cmode, bool uns)
6791 {
6792   enum insn_code icode = CODE_FOR_nothing;
6793   if (uns)
6794     icode = convert_optab_handler (vcondu_optab, vmode, cmode);
6795   else
6796     icode = convert_optab_handler (vcond_optab, vmode, cmode);
6797   return icode;
6798 }
6799
6800 /* Return TRUE iff, appropriate vector insns are available
6801    for vector cond expr with vector type VALUE_TYPE and a comparison
6802    with operand vector types in CMP_OP_TYPE.  */
6803
6804 bool
6805 expand_vec_cond_expr_p (tree value_type, tree cmp_op_type)
6806 {
6807   enum machine_mode value_mode = TYPE_MODE (value_type);
6808   enum machine_mode cmp_op_mode = TYPE_MODE (cmp_op_type);
6809   if (GET_MODE_SIZE (value_mode) != GET_MODE_SIZE (cmp_op_mode)
6810       || GET_MODE_NUNITS (value_mode) != GET_MODE_NUNITS (cmp_op_mode)
6811       || get_vcond_icode (TYPE_MODE (value_type), TYPE_MODE (cmp_op_type),
6812                           TYPE_UNSIGNED (cmp_op_type)) == CODE_FOR_nothing)
6813     return false;
6814   return true;
6815 }
6816
6817 /* Generate insns for a VEC_COND_EXPR, given its TYPE and its
6818    three operands.  */
6819
6820 rtx
6821 expand_vec_cond_expr (tree vec_cond_type, tree op0, tree op1, tree op2,
6822                       rtx target)
6823 {
6824   struct expand_operand ops[6];
6825   enum insn_code icode;
6826   rtx comparison, rtx_op1, rtx_op2;
6827   enum machine_mode mode = TYPE_MODE (vec_cond_type);
6828   enum machine_mode cmp_op_mode;
6829   bool unsignedp;
6830   tree op0a, op0b;
6831   enum tree_code tcode;
6832
6833   if (COMPARISON_CLASS_P (op0))
6834     {
6835       op0a = TREE_OPERAND (op0, 0);
6836       op0b = TREE_OPERAND (op0, 1);
6837       tcode = TREE_CODE (op0);
6838     }
6839   else
6840     {
6841       /* Fake op0 < 0.  */
6842       gcc_assert (!TYPE_UNSIGNED (TREE_TYPE (op0)));
6843       op0a = op0;
6844       op0b = build_zero_cst (TREE_TYPE (op0));
6845       tcode = LT_EXPR;
6846     }
6847   unsignedp = TYPE_UNSIGNED (TREE_TYPE (op0a));
6848   cmp_op_mode = TYPE_MODE (TREE_TYPE (op0a));
6849
6850
6851   gcc_assert (GET_MODE_SIZE (mode) == GET_MODE_SIZE (cmp_op_mode)
6852               && GET_MODE_NUNITS (mode) == GET_MODE_NUNITS (cmp_op_mode));
6853
6854   icode = get_vcond_icode (mode, cmp_op_mode, unsignedp);
6855   if (icode == CODE_FOR_nothing)
6856     return 0;
6857
6858   comparison = vector_compare_rtx (tcode, op0a, op0b, unsignedp, icode);
6859   rtx_op1 = expand_normal (op1);
6860   rtx_op2 = expand_normal (op2);
6861
6862   create_output_operand (&ops[0], target, mode);
6863   create_input_operand (&ops[1], rtx_op1, mode);
6864   create_input_operand (&ops[2], rtx_op2, mode);
6865   create_fixed_operand (&ops[3], comparison);
6866   create_fixed_operand (&ops[4], XEXP (comparison, 0));
6867   create_fixed_operand (&ops[5], XEXP (comparison, 1));
6868   expand_insn (icode, 6, ops);
6869   return ops[0].value;
6870 }
6871
6872 /* Return non-zero if a highpart multiply is supported of can be synthisized.
6873    For the benefit of expand_mult_highpart, the return value is 1 for direct,
6874    2 for even/odd widening, and 3 for hi/lo widening.  */
6875
6876 int
6877 can_mult_highpart_p (enum machine_mode mode, bool uns_p)
6878 {
6879   optab op;
6880   unsigned char *sel;
6881   unsigned i, nunits;
6882
6883   op = uns_p ? umul_highpart_optab : smul_highpart_optab;
6884   if (optab_handler (op, mode) != CODE_FOR_nothing)
6885     return 1;
6886
6887   /* If the mode is an integral vector, synth from widening operations.  */
6888   if (GET_MODE_CLASS (mode) != MODE_VECTOR_INT)
6889     return 0;
6890
6891   nunits = GET_MODE_NUNITS (mode);
6892   sel = XALLOCAVEC (unsigned char, nunits);
6893
6894   op = uns_p ? vec_widen_umult_even_optab : vec_widen_smult_even_optab;
6895   if (optab_handler (op, mode) != CODE_FOR_nothing)
6896     {
6897       op = uns_p ? vec_widen_umult_odd_optab : vec_widen_smult_odd_optab;
6898       if (optab_handler (op, mode) != CODE_FOR_nothing)
6899         {
6900           for (i = 0; i < nunits; ++i)
6901             sel[i] = !BYTES_BIG_ENDIAN + (i & ~1) + ((i & 1) ? nunits : 0);
6902           if (can_vec_perm_p (mode, false, sel))
6903             return 2;
6904         }
6905     }
6906
6907   op = uns_p ? vec_widen_umult_hi_optab : vec_widen_smult_hi_optab;
6908   if (optab_handler (op, mode) != CODE_FOR_nothing)
6909     {
6910       op = uns_p ? vec_widen_umult_lo_optab : vec_widen_smult_lo_optab;
6911       if (optab_handler (op, mode) != CODE_FOR_nothing)
6912         {
6913           for (i = 0; i < nunits; ++i)
6914             sel[i] = 2 * i + (BYTES_BIG_ENDIAN ? 0 : 1);
6915           if (can_vec_perm_p (mode, false, sel))
6916             return 3;
6917         }
6918     }
6919
6920   return 0;
6921 }
6922
6923 /* Expand a highpart multiply.  */
6924
6925 rtx
6926 expand_mult_highpart (enum machine_mode mode, rtx op0, rtx op1,
6927                       rtx target, bool uns_p)
6928 {
6929   struct expand_operand eops[3];
6930   enum insn_code icode;
6931   int method, i, nunits;
6932   enum machine_mode wmode;
6933   rtx m1, m2, perm;
6934   optab tab1, tab2;
6935   rtvec v;
6936
6937   method = can_mult_highpart_p (mode, uns_p);
6938   switch (method)
6939     {
6940     case 0:
6941       return NULL_RTX;
6942     case 1:
6943       tab1 = uns_p ? umul_highpart_optab : smul_highpart_optab;
6944       return expand_binop (mode, tab1, op0, op1, target, uns_p,
6945                            OPTAB_LIB_WIDEN);
6946     case 2:
6947       tab1 = uns_p ? vec_widen_umult_even_optab : vec_widen_smult_even_optab;
6948       tab2 = uns_p ? vec_widen_umult_odd_optab : vec_widen_smult_odd_optab;
6949       break;
6950     case 3:
6951       tab1 = uns_p ? vec_widen_umult_lo_optab : vec_widen_smult_lo_optab;
6952       tab2 = uns_p ? vec_widen_umult_hi_optab : vec_widen_smult_hi_optab;
6953       if (BYTES_BIG_ENDIAN)
6954         {
6955           optab t = tab1;
6956           tab1 = tab2;
6957           tab2 = t;
6958         }
6959       break;
6960     default:
6961       gcc_unreachable ();
6962     }
6963
6964   icode = optab_handler (tab1, mode);
6965   nunits = GET_MODE_NUNITS (mode);
6966   wmode = insn_data[icode].operand[0].mode;
6967   gcc_checking_assert (2 * GET_MODE_NUNITS (wmode) == nunits);
6968   gcc_checking_assert (GET_MODE_SIZE (wmode) == GET_MODE_SIZE (mode));
6969
6970   create_output_operand (&eops[0], gen_reg_rtx (wmode), wmode);
6971   create_input_operand (&eops[1], op0, mode);
6972   create_input_operand (&eops[2], op1, mode);
6973   expand_insn (icode, 3, eops);
6974   m1 = gen_lowpart (mode, eops[0].value);
6975
6976   create_output_operand (&eops[0], gen_reg_rtx (wmode), wmode);
6977   create_input_operand (&eops[1], op0, mode);
6978   create_input_operand (&eops[2], op1, mode);
6979   expand_insn (optab_handler (tab2, mode), 3, eops);
6980   m2 = gen_lowpart (mode, eops[0].value);
6981
6982   v = rtvec_alloc (nunits);
6983   if (method == 2)
6984     {
6985       for (i = 0; i < nunits; ++i)
6986         RTVEC_ELT (v, i) = GEN_INT (!BYTES_BIG_ENDIAN + (i & ~1)
6987                                     + ((i & 1) ? nunits : 0));
6988     }
6989   else
6990     {
6991       for (i = 0; i < nunits; ++i)
6992         RTVEC_ELT (v, i) = GEN_INT (2 * i + (BYTES_BIG_ENDIAN ? 0 : 1));
6993     }
6994   perm = gen_rtx_CONST_VECTOR (mode, v);
6995
6996   return expand_vec_perm (mode, m1, m2, perm, target);
6997 }
6998
6999 /* Return true if target supports vector masked load/store for mode.  */
7000 bool
7001 can_vec_mask_load_store_p (enum machine_mode mode, bool is_load)
7002 {
7003   optab op = is_load ? maskload_optab : maskstore_optab;
7004   enum machine_mode vmode;
7005   unsigned int vector_sizes;
7006
7007   /* If mode is vector mode, check it directly.  */
7008   if (VECTOR_MODE_P (mode))
7009     return optab_handler (op, mode) != CODE_FOR_nothing;
7010
7011   /* Otherwise, return true if there is some vector mode with
7012      the mask load/store supported.  */
7013
7014   /* See if there is any chance the mask load or store might be
7015      vectorized.  If not, punt.  */
7016   vmode = targetm.vectorize.preferred_simd_mode (mode);
7017   if (!VECTOR_MODE_P (vmode))
7018     return false;
7019
7020   if (optab_handler (op, vmode) != CODE_FOR_nothing)
7021     return true;
7022
7023   vector_sizes = targetm.vectorize.autovectorize_vector_sizes ();
7024   while (vector_sizes != 0)
7025     {
7026       unsigned int cur = 1 << floor_log2 (vector_sizes);
7027       vector_sizes &= ~cur;
7028       if (cur <= GET_MODE_SIZE (mode))
7029         continue;
7030       vmode = mode_for_vector (mode, cur / GET_MODE_SIZE (mode));
7031       if (VECTOR_MODE_P (vmode)
7032           && optab_handler (op, vmode) != CODE_FOR_nothing)
7033         return true;
7034     }
7035   return false;
7036 }
7037 \f
7038 /* Return true if there is a compare_and_swap pattern.  */
7039
7040 bool
7041 can_compare_and_swap_p (enum machine_mode mode, bool allow_libcall)
7042 {
7043   enum insn_code icode;
7044
7045   /* Check for __atomic_compare_and_swap.  */
7046   icode = direct_optab_handler (atomic_compare_and_swap_optab, mode);
7047   if (icode != CODE_FOR_nothing)
7048     return true;
7049
7050   /* Check for __sync_compare_and_swap.  */
7051   icode = optab_handler (sync_compare_and_swap_optab, mode);
7052   if (icode != CODE_FOR_nothing)
7053     return true;
7054   if (allow_libcall && optab_libfunc (sync_compare_and_swap_optab, mode))
7055     return true;
7056
7057   /* No inline compare and swap.  */
7058   return false;
7059 }
7060
7061 /* Return true if an atomic exchange can be performed.  */
7062
7063 bool
7064 can_atomic_exchange_p (enum machine_mode mode, bool allow_libcall)
7065 {
7066   enum insn_code icode;
7067
7068   /* Check for __atomic_exchange.  */
7069   icode = direct_optab_handler (atomic_exchange_optab, mode);
7070   if (icode != CODE_FOR_nothing)
7071     return true;
7072
7073   /* Don't check __sync_test_and_set, as on some platforms that
7074      has reduced functionality.  Targets that really do support
7075      a proper exchange should simply be updated to the __atomics.  */
7076
7077   return can_compare_and_swap_p (mode, allow_libcall);
7078 }
7079
7080
7081 /* Helper function to find the MODE_CC set in a sync_compare_and_swap
7082    pattern.  */
7083
7084 static void
7085 find_cc_set (rtx x, const_rtx pat, void *data)
7086 {
7087   if (REG_P (x) && GET_MODE_CLASS (GET_MODE (x)) == MODE_CC
7088       && GET_CODE (pat) == SET)
7089     {
7090       rtx *p_cc_reg = (rtx *) data;
7091       gcc_assert (!*p_cc_reg);
7092       *p_cc_reg = x;
7093     }
7094 }
7095
7096 /* This is a helper function for the other atomic operations.  This function
7097    emits a loop that contains SEQ that iterates until a compare-and-swap
7098    operation at the end succeeds.  MEM is the memory to be modified.  SEQ is
7099    a set of instructions that takes a value from OLD_REG as an input and
7100    produces a value in NEW_REG as an output.  Before SEQ, OLD_REG will be
7101    set to the current contents of MEM.  After SEQ, a compare-and-swap will
7102    attempt to update MEM with NEW_REG.  The function returns true when the
7103    loop was generated successfully.  */
7104
7105 static bool
7106 expand_compare_and_swap_loop (rtx mem, rtx old_reg, rtx new_reg, rtx seq)
7107 {
7108   enum machine_mode mode = GET_MODE (mem);
7109   rtx_code_label *label;
7110   rtx cmp_reg, success, oldval;
7111
7112   /* The loop we want to generate looks like
7113
7114         cmp_reg = mem;
7115       label:
7116         old_reg = cmp_reg;
7117         seq;
7118         (success, cmp_reg) = compare-and-swap(mem, old_reg, new_reg)
7119         if (success)
7120           goto label;
7121
7122      Note that we only do the plain load from memory once.  Subsequent
7123      iterations use the value loaded by the compare-and-swap pattern.  */
7124
7125   label = gen_label_rtx ();
7126   cmp_reg = gen_reg_rtx (mode);
7127
7128   emit_move_insn (cmp_reg, mem);
7129   emit_label (label);
7130   emit_move_insn (old_reg, cmp_reg);
7131   if (seq)
7132     emit_insn (seq);
7133
7134   success = NULL_RTX;
7135   oldval = cmp_reg;
7136   if (!expand_atomic_compare_and_swap (&success, &oldval, mem, old_reg,
7137                                        new_reg, false, MEMMODEL_SEQ_CST,
7138                                        MEMMODEL_RELAXED))
7139     return false;
7140
7141   if (oldval != cmp_reg)
7142     emit_move_insn (cmp_reg, oldval);
7143
7144   /* Mark this jump predicted not taken.  */
7145   emit_cmp_and_jump_insns (success, const0_rtx, EQ, const0_rtx,
7146                            GET_MODE (success), 1, label, 0);
7147   return true;
7148 }
7149
7150
7151 /* This function tries to emit an atomic_exchange intruction.  VAL is written
7152    to *MEM using memory model MODEL. The previous contents of *MEM are returned,
7153    using TARGET if possible.  */
7154
7155 static rtx
7156 maybe_emit_atomic_exchange (rtx target, rtx mem, rtx val, enum memmodel model)
7157 {
7158   enum machine_mode mode = GET_MODE (mem);
7159   enum insn_code icode;
7160
7161   /* If the target supports the exchange directly, great.  */
7162   icode = direct_optab_handler (atomic_exchange_optab, mode);
7163   if (icode != CODE_FOR_nothing)
7164     {
7165       struct expand_operand ops[4];
7166
7167       create_output_operand (&ops[0], target, mode);
7168       create_fixed_operand (&ops[1], mem);
7169       create_input_operand (&ops[2], val, mode);
7170       create_integer_operand (&ops[3], model);
7171       if (maybe_expand_insn (icode, 4, ops))
7172         return ops[0].value;
7173     }
7174
7175   return NULL_RTX;
7176 }
7177
7178 /* This function tries to implement an atomic exchange operation using
7179    __sync_lock_test_and_set. VAL is written to *MEM using memory model MODEL.
7180    The previous contents of *MEM are returned, using TARGET if possible.
7181    Since this instructionn is an acquire barrier only, stronger memory
7182    models may require additional barriers to be emitted.  */
7183
7184 static rtx
7185 maybe_emit_sync_lock_test_and_set (rtx target, rtx mem, rtx val,
7186                                    enum memmodel model)
7187 {
7188   enum machine_mode mode = GET_MODE (mem);
7189   enum insn_code icode;
7190   rtx_insn *last_insn = get_last_insn ();
7191
7192   icode = optab_handler (sync_lock_test_and_set_optab, mode);
7193
7194   /* Legacy sync_lock_test_and_set is an acquire barrier.  If the pattern
7195      exists, and the memory model is stronger than acquire, add a release
7196      barrier before the instruction.  */
7197
7198   if ((model & MEMMODEL_MASK) == MEMMODEL_SEQ_CST
7199       || (model & MEMMODEL_MASK) == MEMMODEL_RELEASE
7200       || (model & MEMMODEL_MASK) == MEMMODEL_ACQ_REL)
7201     expand_mem_thread_fence (model);
7202
7203   if (icode != CODE_FOR_nothing)
7204     {
7205       struct expand_operand ops[3];
7206       create_output_operand (&ops[0], target, mode);
7207       create_fixed_operand (&ops[1], mem);
7208       create_input_operand (&ops[2], val, mode);
7209       if (maybe_expand_insn (icode, 3, ops))
7210         return ops[0].value;
7211     }
7212
7213   /* If an external test-and-set libcall is provided, use that instead of
7214      any external compare-and-swap that we might get from the compare-and-
7215      swap-loop expansion later.  */
7216   if (!can_compare_and_swap_p (mode, false))
7217     {
7218       rtx libfunc = optab_libfunc (sync_lock_test_and_set_optab, mode);
7219       if (libfunc != NULL)
7220         {
7221           rtx addr;
7222
7223           addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
7224           return emit_library_call_value (libfunc, NULL_RTX, LCT_NORMAL,
7225                                           mode, 2, addr, ptr_mode,
7226                                           val, mode);
7227         }
7228     }
7229
7230   /* If the test_and_set can't be emitted, eliminate any barrier that might
7231      have been emitted.  */
7232   delete_insns_since (last_insn);
7233   return NULL_RTX;
7234 }
7235
7236 /* This function tries to implement an atomic exchange operation using a
7237    compare_and_swap loop. VAL is written to *MEM.  The previous contents of
7238    *MEM are returned, using TARGET if possible.  No memory model is required
7239    since a compare_and_swap loop is seq-cst.  */
7240
7241 static rtx
7242 maybe_emit_compare_and_swap_exchange_loop (rtx target, rtx mem, rtx val)
7243 {
7244   enum machine_mode mode = GET_MODE (mem);
7245
7246   if (can_compare_and_swap_p (mode, true))
7247     {
7248       if (!target || !register_operand (target, mode))
7249         target = gen_reg_rtx (mode);
7250       if (expand_compare_and_swap_loop (mem, target, val, NULL_RTX))
7251         return target;
7252     }
7253
7254   return NULL_RTX;
7255 }
7256
7257 /* This function tries to implement an atomic test-and-set operation
7258    using the atomic_test_and_set instruction pattern.  A boolean value
7259    is returned from the operation, using TARGET if possible.  */
7260
7261 #ifndef HAVE_atomic_test_and_set
7262 #define HAVE_atomic_test_and_set 0
7263 #define CODE_FOR_atomic_test_and_set CODE_FOR_nothing
7264 #endif
7265
7266 static rtx
7267 maybe_emit_atomic_test_and_set (rtx target, rtx mem, enum memmodel model)
7268 {
7269   enum machine_mode pat_bool_mode;
7270   struct expand_operand ops[3];
7271
7272   if (!HAVE_atomic_test_and_set)
7273     return NULL_RTX;
7274
7275   /* While we always get QImode from __atomic_test_and_set, we get
7276      other memory modes from __sync_lock_test_and_set.  Note that we
7277      use no endian adjustment here.  This matches the 4.6 behavior
7278      in the Sparc backend.  */
7279   gcc_checking_assert
7280     (insn_data[CODE_FOR_atomic_test_and_set].operand[1].mode == QImode);
7281   if (GET_MODE (mem) != QImode)
7282     mem = adjust_address_nv (mem, QImode, 0);
7283
7284   pat_bool_mode = insn_data[CODE_FOR_atomic_test_and_set].operand[0].mode;
7285   create_output_operand (&ops[0], target, pat_bool_mode);
7286   create_fixed_operand (&ops[1], mem);
7287   create_integer_operand (&ops[2], model);
7288
7289   if (maybe_expand_insn (CODE_FOR_atomic_test_and_set, 3, ops))
7290     return ops[0].value;
7291   return NULL_RTX;
7292 }
7293
7294 /* This function expands the legacy _sync_lock test_and_set operation which is
7295    generally an atomic exchange.  Some limited targets only allow the
7296    constant 1 to be stored.  This is an ACQUIRE operation.
7297
7298    TARGET is an optional place to stick the return value.
7299    MEM is where VAL is stored.  */
7300
7301 rtx
7302 expand_sync_lock_test_and_set (rtx target, rtx mem, rtx val)
7303 {
7304   rtx ret;
7305
7306   /* Try an atomic_exchange first.  */
7307   ret = maybe_emit_atomic_exchange (target, mem, val, MEMMODEL_ACQUIRE);
7308   if (ret)
7309     return ret;
7310
7311   ret = maybe_emit_sync_lock_test_and_set (target, mem, val, MEMMODEL_ACQUIRE);
7312   if (ret)
7313     return ret;
7314
7315   ret = maybe_emit_compare_and_swap_exchange_loop (target, mem, val);
7316   if (ret)
7317     return ret;
7318
7319   /* If there are no other options, try atomic_test_and_set if the value
7320      being stored is 1.  */
7321   if (val == const1_rtx)
7322     ret = maybe_emit_atomic_test_and_set (target, mem, MEMMODEL_ACQUIRE);
7323
7324   return ret;
7325 }
7326
7327 /* This function expands the atomic test_and_set operation:
7328    atomically store a boolean TRUE into MEM and return the previous value.
7329
7330    MEMMODEL is the memory model variant to use.
7331    TARGET is an optional place to stick the return value.  */
7332
7333 rtx
7334 expand_atomic_test_and_set (rtx target, rtx mem, enum memmodel model)
7335 {
7336   enum machine_mode mode = GET_MODE (mem);
7337   rtx ret, trueval, subtarget;
7338
7339   ret = maybe_emit_atomic_test_and_set (target, mem, model);
7340   if (ret)
7341     return ret;
7342
7343   /* Be binary compatible with non-default settings of trueval, and different
7344      cpu revisions.  E.g. one revision may have atomic-test-and-set, but
7345      another only has atomic-exchange.  */
7346   if (targetm.atomic_test_and_set_trueval == 1)
7347     {
7348       trueval = const1_rtx;
7349       subtarget = target ? target : gen_reg_rtx (mode);
7350     }
7351   else
7352     {
7353       trueval = gen_int_mode (targetm.atomic_test_and_set_trueval, mode);
7354       subtarget = gen_reg_rtx (mode);
7355     }
7356
7357   /* Try the atomic-exchange optab...  */
7358   ret = maybe_emit_atomic_exchange (subtarget, mem, trueval, model);
7359
7360   /* ... then an atomic-compare-and-swap loop ... */
7361   if (!ret)
7362     ret = maybe_emit_compare_and_swap_exchange_loop (subtarget, mem, trueval);
7363
7364   /* ... before trying the vaguely defined legacy lock_test_and_set. */
7365   if (!ret)
7366     ret = maybe_emit_sync_lock_test_and_set (subtarget, mem, trueval, model);
7367
7368   /* Recall that the legacy lock_test_and_set optab was allowed to do magic
7369      things with the value 1.  Thus we try again without trueval.  */
7370   if (!ret && targetm.atomic_test_and_set_trueval != 1)
7371     ret = maybe_emit_sync_lock_test_and_set (subtarget, mem, const1_rtx, model);
7372
7373   /* Failing all else, assume a single threaded environment and simply
7374      perform the operation.  */
7375   if (!ret)
7376     {
7377       /* If the result is ignored skip the move to target.  */
7378       if (subtarget != const0_rtx)
7379         emit_move_insn (subtarget, mem);
7380
7381       emit_move_insn (mem, trueval);
7382       ret = subtarget;
7383     }
7384
7385   /* Recall that have to return a boolean value; rectify if trueval
7386      is not exactly one.  */
7387   if (targetm.atomic_test_and_set_trueval != 1)
7388     ret = emit_store_flag_force (target, NE, ret, const0_rtx, mode, 0, 1);
7389
7390   return ret;
7391 }
7392
7393 /* This function expands the atomic exchange operation:
7394    atomically store VAL in MEM and return the previous value in MEM.
7395
7396    MEMMODEL is the memory model variant to use.
7397    TARGET is an optional place to stick the return value.  */
7398
7399 rtx
7400 expand_atomic_exchange (rtx target, rtx mem, rtx val, enum memmodel model)
7401 {
7402   rtx ret;
7403
7404   ret = maybe_emit_atomic_exchange (target, mem, val, model);
7405
7406   /* Next try a compare-and-swap loop for the exchange.  */
7407   if (!ret)
7408     ret = maybe_emit_compare_and_swap_exchange_loop (target, mem, val);
7409
7410   return ret;
7411 }
7412
7413 /* This function expands the atomic compare exchange operation:
7414
7415    *PTARGET_BOOL is an optional place to store the boolean success/failure.
7416    *PTARGET_OVAL is an optional place to store the old value from memory.
7417    Both target parameters may be NULL to indicate that we do not care about
7418    that return value.  Both target parameters are updated on success to
7419    the actual location of the corresponding result.
7420
7421    MEMMODEL is the memory model variant to use.
7422
7423    The return value of the function is true for success.  */
7424
7425 bool
7426 expand_atomic_compare_and_swap (rtx *ptarget_bool, rtx *ptarget_oval,
7427                                 rtx mem, rtx expected, rtx desired,
7428                                 bool is_weak, enum memmodel succ_model,
7429                                 enum memmodel fail_model)
7430 {
7431   enum machine_mode mode = GET_MODE (mem);
7432   struct expand_operand ops[8];
7433   enum insn_code icode;
7434   rtx target_oval, target_bool = NULL_RTX;
7435   rtx libfunc;
7436
7437   /* Load expected into a register for the compare and swap.  */
7438   if (MEM_P (expected))
7439     expected = copy_to_reg (expected);
7440
7441   /* Make sure we always have some place to put the return oldval.
7442      Further, make sure that place is distinct from the input expected,
7443      just in case we need that path down below.  */
7444   if (ptarget_oval == NULL
7445       || (target_oval = *ptarget_oval) == NULL
7446       || reg_overlap_mentioned_p (expected, target_oval))
7447     target_oval = gen_reg_rtx (mode);
7448
7449   icode = direct_optab_handler (atomic_compare_and_swap_optab, mode);
7450   if (icode != CODE_FOR_nothing)
7451     {
7452       enum machine_mode bool_mode = insn_data[icode].operand[0].mode;
7453
7454       /* Make sure we always have a place for the bool operand.  */
7455       if (ptarget_bool == NULL
7456           || (target_bool = *ptarget_bool) == NULL
7457           || GET_MODE (target_bool) != bool_mode)
7458         target_bool = gen_reg_rtx (bool_mode);
7459
7460       /* Emit the compare_and_swap.  */
7461       create_output_operand (&ops[0], target_bool, bool_mode);
7462       create_output_operand (&ops[1], target_oval, mode);
7463       create_fixed_operand (&ops[2], mem);
7464       create_input_operand (&ops[3], expected, mode);
7465       create_input_operand (&ops[4], desired, mode);
7466       create_integer_operand (&ops[5], is_weak);
7467       create_integer_operand (&ops[6], succ_model);
7468       create_integer_operand (&ops[7], fail_model);
7469       if (maybe_expand_insn (icode, 8, ops))
7470         {
7471           /* Return success/failure.  */
7472           target_bool = ops[0].value;
7473           target_oval = ops[1].value;
7474           goto success;
7475         }
7476     }
7477
7478   /* Otherwise fall back to the original __sync_val_compare_and_swap
7479      which is always seq-cst.  */
7480   icode = optab_handler (sync_compare_and_swap_optab, mode);
7481   if (icode != CODE_FOR_nothing)
7482     {
7483       rtx cc_reg;
7484
7485       create_output_operand (&ops[0], target_oval, mode);
7486       create_fixed_operand (&ops[1], mem);
7487       create_input_operand (&ops[2], expected, mode);
7488       create_input_operand (&ops[3], desired, mode);
7489       if (!maybe_expand_insn (icode, 4, ops))
7490         return false;
7491
7492       target_oval = ops[0].value;
7493
7494       /* If the caller isn't interested in the boolean return value,
7495          skip the computation of it.  */
7496       if (ptarget_bool == NULL)
7497         goto success;
7498
7499       /* Otherwise, work out if the compare-and-swap succeeded.  */
7500       cc_reg = NULL_RTX;
7501       if (have_insn_for (COMPARE, CCmode))
7502         note_stores (PATTERN (get_last_insn ()), find_cc_set, &cc_reg);
7503       if (cc_reg)
7504         {
7505           target_bool = emit_store_flag_force (target_bool, EQ, cc_reg,
7506                                                const0_rtx, VOIDmode, 0, 1);
7507           goto success;
7508         }
7509       goto success_bool_from_val;
7510     }
7511
7512   /* Also check for library support for __sync_val_compare_and_swap.  */
7513   libfunc = optab_libfunc (sync_compare_and_swap_optab, mode);
7514   if (libfunc != NULL)
7515     {
7516       rtx addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
7517       target_oval = emit_library_call_value (libfunc, NULL_RTX, LCT_NORMAL,
7518                                              mode, 3, addr, ptr_mode,
7519                                              expected, mode, desired, mode);
7520
7521       /* Compute the boolean return value only if requested.  */
7522       if (ptarget_bool)
7523         goto success_bool_from_val;
7524       else
7525         goto success;
7526     }
7527
7528   /* Failure.  */
7529   return false;
7530
7531  success_bool_from_val:
7532    target_bool = emit_store_flag_force (target_bool, EQ, target_oval,
7533                                         expected, VOIDmode, 1, 1);
7534  success:
7535   /* Make sure that the oval output winds up where the caller asked.  */
7536   if (ptarget_oval)
7537     *ptarget_oval = target_oval;
7538   if (ptarget_bool)
7539     *ptarget_bool = target_bool;
7540   return true;
7541 }
7542
7543 /* Generate asm volatile("" : : : "memory") as the memory barrier.  */
7544
7545 static void
7546 expand_asm_memory_barrier (void)
7547 {
7548   rtx asm_op, clob;
7549
7550   asm_op = gen_rtx_ASM_OPERANDS (VOIDmode, empty_string, empty_string, 0,
7551                                  rtvec_alloc (0), rtvec_alloc (0),
7552                                  rtvec_alloc (0), UNKNOWN_LOCATION);
7553   MEM_VOLATILE_P (asm_op) = 1;
7554
7555   clob = gen_rtx_SCRATCH (VOIDmode);
7556   clob = gen_rtx_MEM (BLKmode, clob);
7557   clob = gen_rtx_CLOBBER (VOIDmode, clob);
7558
7559   emit_insn (gen_rtx_PARALLEL (VOIDmode, gen_rtvec (2, asm_op, clob)));
7560 }
7561
7562 /* This routine will either emit the mem_thread_fence pattern or issue a
7563    sync_synchronize to generate a fence for memory model MEMMODEL.  */
7564
7565 #ifndef HAVE_mem_thread_fence
7566 # define HAVE_mem_thread_fence 0
7567 # define gen_mem_thread_fence(x) (gcc_unreachable (), NULL_RTX)
7568 #endif
7569 #ifndef HAVE_memory_barrier
7570 # define HAVE_memory_barrier 0
7571 # define gen_memory_barrier()  (gcc_unreachable (), NULL_RTX)
7572 #endif
7573
7574 void
7575 expand_mem_thread_fence (enum memmodel model)
7576 {
7577   if (HAVE_mem_thread_fence)
7578     emit_insn (gen_mem_thread_fence (GEN_INT (model)));
7579   else if ((model & MEMMODEL_MASK) != MEMMODEL_RELAXED)
7580     {
7581       if (HAVE_memory_barrier)
7582         emit_insn (gen_memory_barrier ());
7583       else if (synchronize_libfunc != NULL_RTX)
7584         emit_library_call (synchronize_libfunc, LCT_NORMAL, VOIDmode, 0);
7585       else
7586         expand_asm_memory_barrier ();
7587     }
7588 }
7589
7590 /* This routine will either emit the mem_signal_fence pattern or issue a
7591    sync_synchronize to generate a fence for memory model MEMMODEL.  */
7592
7593 #ifndef HAVE_mem_signal_fence
7594 # define HAVE_mem_signal_fence 0
7595 # define gen_mem_signal_fence(x) (gcc_unreachable (), NULL_RTX)
7596 #endif
7597
7598 void
7599 expand_mem_signal_fence (enum memmodel model)
7600 {
7601   if (HAVE_mem_signal_fence)
7602     emit_insn (gen_mem_signal_fence (GEN_INT (model)));
7603   else if ((model & MEMMODEL_MASK) != MEMMODEL_RELAXED)
7604     {
7605       /* By default targets are coherent between a thread and the signal
7606          handler running on the same thread.  Thus this really becomes a
7607          compiler barrier, in that stores must not be sunk past
7608          (or raised above) a given point.  */
7609       expand_asm_memory_barrier ();
7610     }
7611 }
7612
7613 /* This function expands the atomic load operation:
7614    return the atomically loaded value in MEM.
7615
7616    MEMMODEL is the memory model variant to use.
7617    TARGET is an option place to stick the return value.  */
7618
7619 rtx
7620 expand_atomic_load (rtx target, rtx mem, enum memmodel model)
7621 {
7622   enum machine_mode mode = GET_MODE (mem);
7623   enum insn_code icode;
7624
7625   /* If the target supports the load directly, great.  */
7626   icode = direct_optab_handler (atomic_load_optab, mode);
7627   if (icode != CODE_FOR_nothing)
7628     {
7629       struct expand_operand ops[3];
7630
7631       create_output_operand (&ops[0], target, mode);
7632       create_fixed_operand (&ops[1], mem);
7633       create_integer_operand (&ops[2], model);
7634       if (maybe_expand_insn (icode, 3, ops))
7635         return ops[0].value;
7636     }
7637
7638   /* If the size of the object is greater than word size on this target,
7639      then we assume that a load will not be atomic.  */
7640   if (GET_MODE_PRECISION (mode) > BITS_PER_WORD)
7641     {
7642       /* Issue val = compare_and_swap (mem, 0, 0).
7643          This may cause the occasional harmless store of 0 when the value is
7644          already 0, but it seems to be OK according to the standards guys.  */
7645       if (expand_atomic_compare_and_swap (NULL, &target, mem, const0_rtx,
7646                                           const0_rtx, false, model, model))
7647         return target;
7648       else
7649       /* Otherwise there is no atomic load, leave the library call.  */
7650         return NULL_RTX;
7651     }
7652
7653   /* Otherwise assume loads are atomic, and emit the proper barriers.  */
7654   if (!target || target == const0_rtx)
7655     target = gen_reg_rtx (mode);
7656
7657   /* For SEQ_CST, emit a barrier before the load.  */
7658   if ((model & MEMMODEL_MASK) == MEMMODEL_SEQ_CST)
7659     expand_mem_thread_fence (model);
7660
7661   emit_move_insn (target, mem);
7662
7663   /* Emit the appropriate barrier after the load.  */
7664   expand_mem_thread_fence (model);
7665
7666   return target;
7667 }
7668
7669 /* This function expands the atomic store operation:
7670    Atomically store VAL in MEM.
7671    MEMMODEL is the memory model variant to use.
7672    USE_RELEASE is true if __sync_lock_release can be used as a fall back.
7673    function returns const0_rtx if a pattern was emitted.  */
7674
7675 rtx
7676 expand_atomic_store (rtx mem, rtx val, enum memmodel model, bool use_release)
7677 {
7678   enum machine_mode mode = GET_MODE (mem);
7679   enum insn_code icode;
7680   struct expand_operand ops[3];
7681
7682   /* If the target supports the store directly, great.  */
7683   icode = direct_optab_handler (atomic_store_optab, mode);
7684   if (icode != CODE_FOR_nothing)
7685     {
7686       create_fixed_operand (&ops[0], mem);
7687       create_input_operand (&ops[1], val, mode);
7688       create_integer_operand (&ops[2], model);
7689       if (maybe_expand_insn (icode, 3, ops))
7690         return const0_rtx;
7691     }
7692
7693   /* If using __sync_lock_release is a viable alternative, try it.  */
7694   if (use_release)
7695     {
7696       icode = direct_optab_handler (sync_lock_release_optab, mode);
7697       if (icode != CODE_FOR_nothing)
7698         {
7699           create_fixed_operand (&ops[0], mem);
7700           create_input_operand (&ops[1], const0_rtx, mode);
7701           if (maybe_expand_insn (icode, 2, ops))
7702             {
7703               /* lock_release is only a release barrier.  */
7704               if ((model & MEMMODEL_MASK) == MEMMODEL_SEQ_CST)
7705                 expand_mem_thread_fence (model);
7706               return const0_rtx;
7707             }
7708         }
7709     }
7710
7711   /* If the size of the object is greater than word size on this target,
7712      a default store will not be atomic, Try a mem_exchange and throw away
7713      the result.  If that doesn't work, don't do anything.  */
7714   if (GET_MODE_PRECISION (mode) > BITS_PER_WORD)
7715     {
7716       rtx target = maybe_emit_atomic_exchange (NULL_RTX, mem, val, model);
7717       if (!target)
7718         target = maybe_emit_compare_and_swap_exchange_loop (NULL_RTX, mem, val);
7719       if (target)
7720         return const0_rtx;
7721       else
7722         return NULL_RTX;
7723     }
7724
7725   /* Otherwise assume stores are atomic, and emit the proper barriers.  */
7726   expand_mem_thread_fence (model);
7727
7728   emit_move_insn (mem, val);
7729
7730   /* For SEQ_CST, also emit a barrier after the store.  */
7731   if ((model & MEMMODEL_MASK) == MEMMODEL_SEQ_CST)
7732     expand_mem_thread_fence (model);
7733
7734   return const0_rtx;
7735 }
7736
7737
/* Structure containing the pointers and values required to process the
   various forms of the atomic_fetch_op and atomic_op_fetch builtins.
   It is filled in by get_atomic_op_for_code and consumed by
   maybe_emit_op.  */

struct atomic_op_functions
{
  /* Memory-model (atomic_fetch_OP) pattern yielding the value before
     the operation.  */
  direct_optab mem_fetch_before;
  /* Memory-model (atomic_OP_fetch) pattern yielding the value after
     the operation.  */
  direct_optab mem_fetch_after;
  /* Memory-model (atomic_OP) pattern used when the result is unused.  */
  direct_optab mem_no_result;
  /* Older sync_old_OP optab yielding the value before the operation.  */
  optab fetch_before;
  /* Older sync_new_OP optab yielding the value after the operation.  */
  optab fetch_after;
  /* Older sync_OP pattern used when the result is unused.  */
  direct_optab no_result;
  /* Code that recovers the value before the operation from the value
     after it (fetch_before == fetch_after REVERSE_CODE val), or UNKNOWN
     when there is no such code.  */
  enum rtx_code reverse_code;
};
7751
7752
7753 /* Fill in structure pointed to by OP with the various optab entries for an
7754    operation of type CODE.  */
7755
7756 static void
7757 get_atomic_op_for_code (struct atomic_op_functions *op, enum rtx_code code)
7758 {
7759   gcc_assert (op!= NULL);
7760
7761   /* If SWITCHABLE_TARGET is defined, then subtargets can be switched
7762      in the source code during compilation, and the optab entries are not
7763      computable until runtime.  Fill in the values at runtime.  */
7764   switch (code)
7765     {
7766     case PLUS:
7767       op->mem_fetch_before = atomic_fetch_add_optab;
7768       op->mem_fetch_after = atomic_add_fetch_optab;
7769       op->mem_no_result = atomic_add_optab;
7770       op->fetch_before = sync_old_add_optab;
7771       op->fetch_after = sync_new_add_optab;
7772       op->no_result = sync_add_optab;
7773       op->reverse_code = MINUS;
7774       break;
7775     case MINUS:
7776       op->mem_fetch_before = atomic_fetch_sub_optab;
7777       op->mem_fetch_after = atomic_sub_fetch_optab;
7778       op->mem_no_result = atomic_sub_optab;
7779       op->fetch_before = sync_old_sub_optab;
7780       op->fetch_after = sync_new_sub_optab;
7781       op->no_result = sync_sub_optab;
7782       op->reverse_code = PLUS;
7783       break;
7784     case XOR:
7785       op->mem_fetch_before = atomic_fetch_xor_optab;
7786       op->mem_fetch_after = atomic_xor_fetch_optab;
7787       op->mem_no_result = atomic_xor_optab;
7788       op->fetch_before = sync_old_xor_optab;
7789       op->fetch_after = sync_new_xor_optab;
7790       op->no_result = sync_xor_optab;
7791       op->reverse_code = XOR;
7792       break;
7793     case AND:
7794       op->mem_fetch_before = atomic_fetch_and_optab;
7795       op->mem_fetch_after = atomic_and_fetch_optab;
7796       op->mem_no_result = atomic_and_optab;
7797       op->fetch_before = sync_old_and_optab;
7798       op->fetch_after = sync_new_and_optab;
7799       op->no_result = sync_and_optab;
7800       op->reverse_code = UNKNOWN;
7801       break;
7802     case IOR:
7803       op->mem_fetch_before = atomic_fetch_or_optab;
7804       op->mem_fetch_after = atomic_or_fetch_optab;
7805       op->mem_no_result = atomic_or_optab;
7806       op->fetch_before = sync_old_ior_optab;
7807       op->fetch_after = sync_new_ior_optab;
7808       op->no_result = sync_ior_optab;
7809       op->reverse_code = UNKNOWN;
7810       break;
7811     case NOT:
7812       op->mem_fetch_before = atomic_fetch_nand_optab;
7813       op->mem_fetch_after = atomic_nand_fetch_optab;
7814       op->mem_no_result = atomic_nand_optab;
7815       op->fetch_before = sync_old_nand_optab;
7816       op->fetch_after = sync_new_nand_optab;
7817       op->no_result = sync_nand_optab;
7818       op->reverse_code = UNKNOWN;
7819       break;
7820     default:
7821       gcc_unreachable ();
7822     }
7823 }
7824
7825 /* See if there is a more optimal way to implement the operation "*MEM CODE VAL"
7826    using memory order MODEL.  If AFTER is true the operation needs to return
7827    the value of *MEM after the operation, otherwise the previous value.
7828    TARGET is an optional place to place the result.  The result is unused if
7829    it is const0_rtx.
7830    Return the result if there is a better sequence, otherwise NULL_RTX.  */
7831
7832 static rtx
7833 maybe_optimize_fetch_op (rtx target, rtx mem, rtx val, enum rtx_code code,
7834                          enum memmodel model, bool after)
7835 {
7836   /* If the value is prefetched, or not used, it may be possible to replace
7837      the sequence with a native exchange operation.  */
7838   if (!after || target == const0_rtx)
7839     {
7840       /* fetch_and (&x, 0, m) can be replaced with exchange (&x, 0, m).  */
7841       if (code == AND && val == const0_rtx)
7842         {
7843           if (target == const0_rtx)
7844             target = gen_reg_rtx (GET_MODE (mem));
7845           return maybe_emit_atomic_exchange (target, mem, val, model);
7846         }
7847
7848       /* fetch_or (&x, -1, m) can be replaced with exchange (&x, -1, m).  */
7849       if (code == IOR && val == constm1_rtx)
7850         {
7851           if (target == const0_rtx)
7852             target = gen_reg_rtx (GET_MODE (mem));
7853           return maybe_emit_atomic_exchange (target, mem, val, model);
7854         }
7855     }
7856
7857   return NULL_RTX;
7858 }
7859
7860 /* Try to emit an instruction for a specific operation varaition.
7861    OPTAB contains the OP functions.
7862    TARGET is an optional place to return the result. const0_rtx means unused.
7863    MEM is the memory location to operate on.
7864    VAL is the value to use in the operation.
7865    USE_MEMMODEL is TRUE if the variation with a memory model should be tried.
7866    MODEL is the memory model, if used.
7867    AFTER is true if the returned result is the value after the operation.  */
7868
7869 static rtx
7870 maybe_emit_op (const struct atomic_op_functions *optab, rtx target, rtx mem,
7871                rtx val, bool use_memmodel, enum memmodel model, bool after)
7872 {
7873   enum machine_mode mode = GET_MODE (mem);
7874   struct expand_operand ops[4];
7875   enum insn_code icode;
7876   int op_counter = 0;
7877   int num_ops;
7878
7879   /* Check to see if there is a result returned.  */
7880   if (target == const0_rtx)
7881     {
7882       if (use_memmodel)
7883         {
7884           icode = direct_optab_handler (optab->mem_no_result, mode);
7885           create_integer_operand (&ops[2], model);
7886           num_ops = 3;
7887         }
7888       else
7889         {
7890           icode = direct_optab_handler (optab->no_result, mode);
7891           num_ops = 2;
7892         }
7893     }
7894   /* Otherwise, we need to generate a result.  */
7895   else
7896     {
7897       if (use_memmodel)
7898         {
7899           icode = direct_optab_handler (after ? optab->mem_fetch_after
7900                                         : optab->mem_fetch_before, mode);
7901           create_integer_operand (&ops[3], model);
7902           num_ops = 4;
7903         }
7904       else
7905         {
7906           icode = optab_handler (after ? optab->fetch_after
7907                                  : optab->fetch_before, mode);
7908           num_ops = 3;
7909         }
7910       create_output_operand (&ops[op_counter++], target, mode);
7911     }
7912   if (icode == CODE_FOR_nothing)
7913     return NULL_RTX;
7914
7915   create_fixed_operand (&ops[op_counter++], mem);
7916   /* VAL may have been promoted to a wider mode.  Shrink it if so.  */
7917   create_convert_operand_to (&ops[op_counter++], val, mode, true);
7918
7919   if (maybe_expand_insn (icode, num_ops, ops))
7920     return (target == const0_rtx ? const0_rtx : ops[0].value);
7921
7922   return NULL_RTX;
7923 }
7924
7925
7926 /* This function expands an atomic fetch_OP or OP_fetch operation:
7927    TARGET is an option place to stick the return value.  const0_rtx indicates
7928    the result is unused.
7929    atomically fetch MEM, perform the operation with VAL and return it to MEM.
7930    CODE is the operation being performed (OP)
7931    MEMMODEL is the memory model variant to use.
7932    AFTER is true to return the result of the operation (OP_fetch).
7933    AFTER is false to return the value before the operation (fetch_OP).
7934
7935    This function will *only* generate instructions if there is a direct
7936    optab. No compare and swap loops or libcalls will be generated. */
7937
7938 static rtx
7939 expand_atomic_fetch_op_no_fallback (rtx target, rtx mem, rtx val,
7940                                     enum rtx_code code, enum memmodel model,
7941                                     bool after)
7942 {
7943   enum machine_mode mode = GET_MODE (mem);
7944   struct atomic_op_functions optab;
7945   rtx result;
7946   bool unused_result = (target == const0_rtx);
7947
7948   get_atomic_op_for_code (&optab, code);
7949
7950   /* Check to see if there are any better instructions.  */
7951   result = maybe_optimize_fetch_op (target, mem, val, code, model, after);
7952   if (result)
7953     return result;
7954
7955   /* Check for the case where the result isn't used and try those patterns.  */
7956   if (unused_result)
7957     {
7958       /* Try the memory model variant first.  */
7959       result = maybe_emit_op (&optab, target, mem, val, true, model, true);
7960       if (result)
7961         return result;
7962
7963       /* Next try the old style withuot a memory model.  */
7964       result = maybe_emit_op (&optab, target, mem, val, false, model, true);
7965       if (result)
7966         return result;
7967
7968       /* There is no no-result pattern, so try patterns with a result.  */
7969       target = NULL_RTX;
7970     }
7971
7972   /* Try the __atomic version.  */
7973   result = maybe_emit_op (&optab, target, mem, val, true, model, after);
7974   if (result)
7975     return result;
7976
7977   /* Try the older __sync version.  */
7978   result = maybe_emit_op (&optab, target, mem, val, false, model, after);
7979   if (result)
7980     return result;
7981
7982   /* If the fetch value can be calculated from the other variation of fetch,
7983      try that operation.  */
7984   if (after || unused_result || optab.reverse_code != UNKNOWN)
7985     {
7986       /* Try the __atomic version, then the older __sync version.  */
7987       result = maybe_emit_op (&optab, target, mem, val, true, model, !after);
7988       if (!result)
7989         result = maybe_emit_op (&optab, target, mem, val, false, model, !after);
7990
7991       if (result)
7992         {
7993           /* If the result isn't used, no need to do compensation code.  */
7994           if (unused_result)
7995             return result;
7996
7997           /* Issue compensation code.  Fetch_after  == fetch_before OP val.
7998              Fetch_before == after REVERSE_OP val.  */
7999           if (!after)
8000             code = optab.reverse_code;
8001           if (code == NOT)
8002             {
8003               result = expand_simple_binop (mode, AND, result, val, NULL_RTX,
8004                                             true, OPTAB_LIB_WIDEN);
8005               result = expand_simple_unop (mode, NOT, result, target, true);
8006             }
8007           else
8008             result = expand_simple_binop (mode, code, result, val, target,
8009                                           true, OPTAB_LIB_WIDEN);
8010           return result;
8011         }
8012     }
8013
8014   /* No direct opcode can be generated.  */
8015   return NULL_RTX;
8016 }
8017
8018
8019
8020 /* This function expands an atomic fetch_OP or OP_fetch operation:
8021    TARGET is an option place to stick the return value.  const0_rtx indicates
8022    the result is unused.
8023    atomically fetch MEM, perform the operation with VAL and return it to MEM.
8024    CODE is the operation being performed (OP)
8025    MEMMODEL is the memory model variant to use.
8026    AFTER is true to return the result of the operation (OP_fetch).
8027    AFTER is false to return the value before the operation (fetch_OP).  */
8028 rtx
8029 expand_atomic_fetch_op (rtx target, rtx mem, rtx val, enum rtx_code code,
8030                         enum memmodel model, bool after)
8031 {
8032   enum machine_mode mode = GET_MODE (mem);
8033   rtx result;
8034   bool unused_result = (target == const0_rtx);
8035
8036   result = expand_atomic_fetch_op_no_fallback (target, mem, val, code, model,
8037                                                after);
8038
8039   if (result)
8040     return result;
8041
8042   /* Add/sub can be implemented by doing the reverse operation with -(val).  */
8043   if (code == PLUS || code == MINUS)
8044     {
8045       rtx tmp;
8046       enum rtx_code reverse = (code == PLUS ? MINUS : PLUS);
8047
8048       start_sequence ();
8049       tmp = expand_simple_unop (mode, NEG, val, NULL_RTX, true);
8050       result = expand_atomic_fetch_op_no_fallback (target, mem, tmp, reverse,
8051                                                    model, after);
8052       if (result)
8053         {
8054           /* PLUS worked so emit the insns and return.  */
8055           tmp = get_insns ();
8056           end_sequence ();
8057           emit_insn (tmp);
8058           return result;
8059         }
8060
8061       /* PLUS did not work, so throw away the negation code and continue.  */
8062       end_sequence ();
8063     }
8064
8065   /* Try the __sync libcalls only if we can't do compare-and-swap inline.  */
8066   if (!can_compare_and_swap_p (mode, false))
8067     {
8068       rtx libfunc;
8069       bool fixup = false;
8070       enum rtx_code orig_code = code;
8071       struct atomic_op_functions optab;
8072
8073       get_atomic_op_for_code (&optab, code);
8074       libfunc = optab_libfunc (after ? optab.fetch_after
8075                                : optab.fetch_before, mode);
8076       if (libfunc == NULL
8077           && (after || unused_result || optab.reverse_code != UNKNOWN))
8078         {
8079           fixup = true;
8080           if (!after)
8081             code = optab.reverse_code;
8082           libfunc = optab_libfunc (after ? optab.fetch_before
8083                                    : optab.fetch_after, mode);
8084         }
8085       if (libfunc != NULL)
8086         {
8087           rtx addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
8088           result = emit_library_call_value (libfunc, NULL, LCT_NORMAL, mode,
8089                                             2, addr, ptr_mode, val, mode);
8090
8091           if (!unused_result && fixup)
8092             result = expand_simple_binop (mode, code, result, val, target,
8093                                           true, OPTAB_LIB_WIDEN);
8094           return result;
8095         }
8096
8097       /* We need the original code for any further attempts.  */
8098       code = orig_code;
8099     }
8100
8101   /* If nothing else has succeeded, default to a compare and swap loop.  */
8102   if (can_compare_and_swap_p (mode, true))
8103     {
8104       rtx_insn *insn;
8105       rtx t0 = gen_reg_rtx (mode), t1;
8106
8107       start_sequence ();
8108
8109       /* If the result is used, get a register for it.  */
8110       if (!unused_result)
8111         {
8112           if (!target || !register_operand (target, mode))
8113             target = gen_reg_rtx (mode);
8114           /* If fetch_before, copy the value now.  */
8115           if (!after)
8116             emit_move_insn (target, t0);
8117         }
8118       else
8119         target = const0_rtx;
8120
8121       t1 = t0;
8122       if (code == NOT)
8123         {
8124           t1 = expand_simple_binop (mode, AND, t1, val, NULL_RTX,
8125                                     true, OPTAB_LIB_WIDEN);
8126           t1 = expand_simple_unop (mode, code, t1, NULL_RTX, true);
8127         }
8128       else
8129         t1 = expand_simple_binop (mode, code, t1, val, NULL_RTX, true,
8130                                   OPTAB_LIB_WIDEN);
8131
8132       /* For after, copy the value now.  */
8133       if (!unused_result && after)
8134         emit_move_insn (target, t1);
8135       insn = get_insns ();
8136       end_sequence ();
8137
8138       if (t1 != NULL && expand_compare_and_swap_loop (mem, t0, t1, insn))
8139         return target;
8140     }
8141
8142   return NULL_RTX;
8143 }
8144 \f
8145 /* Return true if OPERAND is suitable for operand number OPNO of
8146    instruction ICODE.  */
8147
8148 bool
8149 insn_operand_matches (enum insn_code icode, unsigned int opno, rtx operand)
8150 {
8151   return (!insn_data[(int) icode].operand[opno].predicate
8152           || (insn_data[(int) icode].operand[opno].predicate
8153               (operand, insn_data[(int) icode].operand[opno].mode)));
8154 }
8155 \f
8156 /* TARGET is a target of a multiword operation that we are going to
8157    implement as a series of word-mode operations.  Return true if
8158    TARGET is suitable for this purpose.  */
8159
8160 bool
8161 valid_multiword_target_p (rtx target)
8162 {
8163   enum machine_mode mode;
8164   int i;
8165
8166   mode = GET_MODE (target);
8167   for (i = 0; i < GET_MODE_SIZE (mode); i += UNITS_PER_WORD)
8168     if (!validate_subreg (word_mode, mode, target, i))
8169       return false;
8170   return true;
8171 }
8172
8173 /* Like maybe_legitimize_operand, but do not change the code of the
8174    current rtx value.  */
8175
8176 static bool
8177 maybe_legitimize_operand_same_code (enum insn_code icode, unsigned int opno,
8178                                     struct expand_operand *op)
8179 {
8180   /* See if the operand matches in its current form.  */
8181   if (insn_operand_matches (icode, opno, op->value))
8182     return true;
8183
8184   /* If the operand is a memory whose address has no side effects,
8185      try forcing the address into a non-virtual pseudo register.
8186      The check for side effects is important because copy_to_mode_reg
8187      cannot handle things like auto-modified addresses.  */
8188   if (insn_data[(int) icode].operand[opno].allows_mem && MEM_P (op->value))
8189     {
8190       rtx addr, mem;
8191
8192       mem = op->value;
8193       addr = XEXP (mem, 0);
8194       if (!(REG_P (addr) && REGNO (addr) > LAST_VIRTUAL_REGISTER)
8195           && !side_effects_p (addr))
8196         {
8197           rtx_insn *last;
8198           enum machine_mode mode;
8199
8200           last = get_last_insn ();
8201           mode = get_address_mode (mem);
8202           mem = replace_equiv_address (mem, copy_to_mode_reg (mode, addr));
8203           if (insn_operand_matches (icode, opno, mem))
8204             {
8205               op->value = mem;
8206               return true;
8207             }
8208           delete_insns_since (last);
8209         }
8210     }
8211
8212   return false;
8213 }
8214
/* Try to make OP match operand OPNO of instruction ICODE.  Return true
   on success, storing the new operand value back in OP.

   What is tried depends on OP->type.  Cases that replace OP->value and
   then "break" are re-checked by the insn_operand_matches call at the
   end of the function.  */

static bool
maybe_legitimize_operand (enum insn_code icode, unsigned int opno,
                          struct expand_operand *op)
{
  enum machine_mode mode, imode;
  bool old_volatile_ok, result;

  mode = op->mode;
  switch (op->type)
    {
    case EXPAND_FIXED:
      /* The value itself is never replaced.  volatile_ok is forced to
         true for the duration of the check and then restored.  */
      old_volatile_ok = volatile_ok;
      volatile_ok = true;
      result = maybe_legitimize_operand_same_code (icode, opno, op);
      volatile_ok = old_volatile_ok;
      return result;

    case EXPAND_OUTPUT:
      gcc_assert (mode != VOIDmode);
      /* Use the suggested destination if there is one, it is not
         const0_rtx, it already has the right mode and it can be made to
         match.  */
      if (op->value
          && op->value != const0_rtx
          && GET_MODE (op->value) == mode
          && maybe_legitimize_operand_same_code (icode, opno, op))
        return true;

      /* Otherwise fall back on a fresh register.  */
      op->value = gen_reg_rtx (mode);
      break;

    case EXPAND_INPUT:
    input:
      /* Also reached by goto from the cases below, once they have put
         the value into MODE.  */
      gcc_assert (mode != VOIDmode);
      gcc_assert (GET_MODE (op->value) == VOIDmode
                  || GET_MODE (op->value) == mode);
      if (maybe_legitimize_operand_same_code (icode, opno, op))
        return true;

      /* Otherwise copy the value into a register of mode MODE.  */
      op->value = copy_to_mode_reg (mode, op->value);
      break;

    case EXPAND_CONVERT_TO:
      /* Convert the value to OP->mode, then treat it as an input.  */
      gcc_assert (mode != VOIDmode);
      op->value = convert_to_mode (mode, op->value, op->unsigned_p);
      goto input;

    case EXPAND_CONVERT_FROM:
      /* The value's own mode, when it has one, takes precedence over
         OP->mode as the mode to convert from.  */
      if (GET_MODE (op->value) != VOIDmode)
        mode = GET_MODE (op->value);
      else
        /* The caller must tell us what mode this value has.  */
        gcc_assert (mode != VOIDmode);

      /* Convert to the mode the instruction asks for, if it names one
         that differs.  */
      imode = insn_data[(int) icode].operand[opno].mode;
      if (imode != VOIDmode && imode != mode)
        {
          op->value = convert_modes (imode, mode, op->value, op->unsigned_p);
          mode = imode;
        }
      goto input;

    case EXPAND_ADDRESS:
      /* Convert the address to OP->mode, then treat it as an input.  */
      gcc_assert (mode != VOIDmode);
      op->value = convert_memory_address (mode, op->value);
      goto input;

    case EXPAND_INTEGER:
      /* If the instruction names a mode and the value is a valid
         const_int operand in it, handle it as an input of that mode;
         otherwise only the final predicate check below applies.  */
      mode = insn_data[(int) icode].operand[opno].mode;
      if (mode != VOIDmode && const_int_operand (op->value, mode))
        goto input;
      break;
    }
  return insn_operand_matches (icode, opno, op->value);
}
8290
8291 /* Make OP describe an input operand that should have the same value
8292    as VALUE, after any mode conversion that the target might request.
8293    TYPE is the type of VALUE.  */
8294
8295 void
8296 create_convert_operand_from_type (struct expand_operand *op,
8297                                   rtx value, tree type)
8298 {
8299   create_convert_operand_from (op, value, TYPE_MODE (type),
8300                                TYPE_UNSIGNED (type));
8301 }
8302
8303 /* Try to make operands [OPS, OPS + NOPS) match operands [OPNO, OPNO + NOPS)
8304    of instruction ICODE.  Return true on success, leaving the new operand
8305    values in the OPS themselves.  Emit no code on failure.  */
8306
8307 bool
8308 maybe_legitimize_operands (enum insn_code icode, unsigned int opno,
8309                            unsigned int nops, struct expand_operand *ops)
8310 {
8311   rtx_insn *last;
8312   unsigned int i;
8313
8314   last = get_last_insn ();
8315   for (i = 0; i < nops; i++)
8316     if (!maybe_legitimize_operand (icode, opno + i, &ops[i]))
8317       {
8318         delete_insns_since (last);
8319         return false;
8320       }
8321   return true;
8322 }
8323
8324 /* Try to generate instruction ICODE, using operands [OPS, OPS + NOPS)
8325    as its operands.  Return the instruction pattern on success,
8326    and emit any necessary set-up code.  Return null and emit no
8327    code on failure.  */
8328
8329 rtx
8330 maybe_gen_insn (enum insn_code icode, unsigned int nops,
8331                 struct expand_operand *ops)
8332 {
8333   gcc_assert (nops == (unsigned int) insn_data[(int) icode].n_generator_args);
8334   if (!maybe_legitimize_operands (icode, 0, nops, ops))
8335     return NULL_RTX;
8336
8337   switch (nops)
8338     {
8339     case 1:
8340       return GEN_FCN (icode) (ops[0].value);
8341     case 2:
8342       return GEN_FCN (icode) (ops[0].value, ops[1].value);
8343     case 3:
8344       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value);
8345     case 4:
8346       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8347                               ops[3].value);
8348     case 5:
8349       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8350                               ops[3].value, ops[4].value);
8351     case 6:
8352       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8353                               ops[3].value, ops[4].value, ops[5].value);
8354     case 7:
8355       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8356                               ops[3].value, ops[4].value, ops[5].value,
8357                               ops[6].value);
8358     case 8:
8359       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8360                               ops[3].value, ops[4].value, ops[5].value,
8361                               ops[6].value, ops[7].value);
8362     case 9:
8363       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8364                               ops[3].value, ops[4].value, ops[5].value,
8365                               ops[6].value, ops[7].value, ops[8].value);
8366     }
8367   gcc_unreachable ();
8368 }
8369
8370 /* Try to emit instruction ICODE, using operands [OPS, OPS + NOPS)
8371    as its operands.  Return true on success and emit no code on failure.  */
8372
8373 bool
8374 maybe_expand_insn (enum insn_code icode, unsigned int nops,
8375                    struct expand_operand *ops)
8376 {
8377   rtx pat = maybe_gen_insn (icode, nops, ops);
8378   if (pat)
8379     {
8380       emit_insn (pat);
8381       return true;
8382     }
8383   return false;
8384 }
8385
8386 /* Like maybe_expand_insn, but for jumps.  */
8387
8388 bool
8389 maybe_expand_jump_insn (enum insn_code icode, unsigned int nops,
8390                         struct expand_operand *ops)
8391 {
8392   rtx pat = maybe_gen_insn (icode, nops, ops);
8393   if (pat)
8394     {
8395       emit_jump_insn (pat);
8396       return true;
8397     }
8398   return false;
8399 }
8400
8401 /* Emit instruction ICODE, using operands [OPS, OPS + NOPS)
8402    as its operands.  */
8403
8404 void
8405 expand_insn (enum insn_code icode, unsigned int nops,
8406              struct expand_operand *ops)
8407 {
8408   if (!maybe_expand_insn (icode, nops, ops))
8409     gcc_unreachable ();
8410 }
8411
8412 /* Like expand_insn, but for jumps.  */
8413
8414 void
8415 expand_jump_insn (enum insn_code icode, unsigned int nops,
8416                   struct expand_operand *ops)
8417 {
8418   if (!maybe_expand_jump_insn (icode, nops, ops))
8419     gcc_unreachable ();
8420 }
8421
/* Reduce conditional compilation elsewhere.  For each of insv, extv and
   extzv that is not already described by a HAVE_ macro, define that
   macro to 0 and the matching CODE_FOR_ name to CODE_FOR_nothing, so
   that later code can refer to both unconditionally.  */
#ifndef HAVE_insv
#define HAVE_insv       0
#define CODE_FOR_insv   CODE_FOR_nothing
#endif
#ifndef HAVE_extv
#define HAVE_extv       0
#define CODE_FOR_extv   CODE_FOR_nothing
#endif
#ifndef HAVE_extzv
#define HAVE_extzv      0
#define CODE_FOR_extzv  CODE_FOR_nothing
#endif

/* Enumerates the possible types of structure operand to an
   extraction_insn: ET_unaligned_mem for a misaligned memory structure,
   ET_reg for a register structure.  */
enum extraction_type { ET_unaligned_mem, ET_reg };
8439
8440 /* Check whether insv, extv or extzv pattern ICODE can be used for an
8441    insertion or extraction of type TYPE on a structure of mode MODE.
8442    Return true if so and fill in *INSN accordingly.  STRUCT_OP is the
8443    operand number of the structure (the first sign_extract or zero_extract
8444    operand) and FIELD_OP is the operand number of the field (the other
8445    side of the set from the sign_extract or zero_extract).  */
8446
8447 static bool
8448 get_traditional_extraction_insn (extraction_insn *insn,
8449                                  enum extraction_type type,
8450                                  enum machine_mode mode,
8451                                  enum insn_code icode,
8452                                  int struct_op, int field_op)
8453 {
8454   const struct insn_data_d *data = &insn_data[icode];
8455
8456   enum machine_mode struct_mode = data->operand[struct_op].mode;
8457   if (struct_mode == VOIDmode)
8458     struct_mode = word_mode;
8459   if (mode != struct_mode)
8460     return false;
8461
8462   enum machine_mode field_mode = data->operand[field_op].mode;
8463   if (field_mode == VOIDmode)
8464     field_mode = word_mode;
8465
8466   enum machine_mode pos_mode = data->operand[struct_op + 2].mode;
8467   if (pos_mode == VOIDmode)
8468     pos_mode = word_mode;
8469
8470   insn->icode = icode;
8471   insn->field_mode = field_mode;
8472   insn->struct_mode = (type == ET_unaligned_mem ? byte_mode : struct_mode);
8473   insn->pos_mode = pos_mode;
8474   return true;
8475 }
8476
8477 /* Return true if an optab exists to perform an insertion or extraction
8478    of type TYPE in mode MODE.  Describe the instruction in *INSN if so.
8479
8480    REG_OPTAB is the optab to use for register structures and
8481    MISALIGN_OPTAB is the optab to use for misaligned memory structures.
8482    POS_OP is the operand number of the bit position.  */
8483
8484 static bool
8485 get_optab_extraction_insn (struct extraction_insn *insn,
8486                            enum extraction_type type,
8487                            enum machine_mode mode, direct_optab reg_optab,
8488                            direct_optab misalign_optab, int pos_op)
8489 {
8490   direct_optab optab = (type == ET_unaligned_mem ? misalign_optab : reg_optab);
8491   enum insn_code icode = direct_optab_handler (optab, mode);
8492   if (icode == CODE_FOR_nothing)
8493     return false;
8494
8495   const struct insn_data_d *data = &insn_data[icode];
8496
8497   insn->icode = icode;
8498   insn->field_mode = mode;
8499   insn->struct_mode = (type == ET_unaligned_mem ? BLKmode : mode);
8500   insn->pos_mode = data->operand[pos_op].mode;
8501   if (insn->pos_mode == VOIDmode)
8502     insn->pos_mode = word_mode;
8503   return true;
8504 }
8505
8506 /* Return true if an instruction exists to perform an insertion or
8507    extraction (PATTERN says which) of type TYPE in mode MODE.
8508    Describe the instruction in *INSN if so.  */
8509
8510 static bool
8511 get_extraction_insn (extraction_insn *insn,
8512                      enum extraction_pattern pattern,
8513                      enum extraction_type type,
8514                      enum machine_mode mode)
8515 {
8516   switch (pattern)
8517     {
8518     case EP_insv:
8519       if (HAVE_insv
8520           && get_traditional_extraction_insn (insn, type, mode,
8521                                               CODE_FOR_insv, 0, 3))
8522         return true;
8523       return get_optab_extraction_insn (insn, type, mode, insv_optab,
8524                                         insvmisalign_optab, 2);
8525
8526     case EP_extv:
8527       if (HAVE_extv
8528           && get_traditional_extraction_insn (insn, type, mode,
8529                                               CODE_FOR_extv, 1, 0))
8530         return true;
8531       return get_optab_extraction_insn (insn, type, mode, extv_optab,
8532                                         extvmisalign_optab, 3);
8533
8534     case EP_extzv:
8535       if (HAVE_extzv
8536           && get_traditional_extraction_insn (insn, type, mode,
8537                                               CODE_FOR_extzv, 1, 0))
8538         return true;
8539       return get_optab_extraction_insn (insn, type, mode, extzv_optab,
8540                                         extzvmisalign_optab, 3);
8541
8542     default:
8543       gcc_unreachable ();
8544     }
8545 }
8546
8547 /* Return true if an instruction exists to access a field of mode
8548    FIELDMODE in a structure that has STRUCT_BITS significant bits.
8549    Describe the "best" such instruction in *INSN if so.  PATTERN and
8550    TYPE describe the type of insertion or extraction we want to perform.
8551
8552    For an insertion, the number of significant structure bits includes
8553    all bits of the target.  For an extraction, it need only include the
8554    most significant bit of the field.  Larger widths are acceptable
8555    in both cases.  */
8556
8557 static bool
8558 get_best_extraction_insn (extraction_insn *insn,
8559                           enum extraction_pattern pattern,
8560                           enum extraction_type type,
8561                           unsigned HOST_WIDE_INT struct_bits,
8562                           enum machine_mode field_mode)
8563 {
8564   enum machine_mode mode = smallest_mode_for_size (struct_bits, MODE_INT);
8565   while (mode != VOIDmode)
8566     {
8567       if (get_extraction_insn (insn, pattern, type, mode))
8568         {
8569           while (mode != VOIDmode
8570                  && GET_MODE_SIZE (mode) <= GET_MODE_SIZE (field_mode)
8571                  && !TRULY_NOOP_TRUNCATION_MODES_P (insn->field_mode,
8572                                                     field_mode))
8573             {
8574               get_extraction_insn (insn, pattern, type, mode);
8575               mode = GET_MODE_WIDER_MODE (mode);
8576             }
8577           return true;
8578         }
8579       mode = GET_MODE_WIDER_MODE (mode);
8580     }
8581   return false;
8582 }
8583
8584 /* Return true if an instruction exists to access a field of mode
8585    FIELDMODE in a register structure that has STRUCT_BITS significant bits.
8586    Describe the "best" such instruction in *INSN if so.  PATTERN describes
8587    the type of insertion or extraction we want to perform.
8588
8589    For an insertion, the number of significant structure bits includes
8590    all bits of the target.  For an extraction, it need only include the
8591    most significant bit of the field.  Larger widths are acceptable
8592    in both cases.  */
8593
8594 bool
8595 get_best_reg_extraction_insn (extraction_insn *insn,
8596                               enum extraction_pattern pattern,
8597                               unsigned HOST_WIDE_INT struct_bits,
8598                               enum machine_mode field_mode)
8599 {
8600   return get_best_extraction_insn (insn, pattern, ET_reg, struct_bits,
8601                                    field_mode);
8602 }
8603
8604 /* Return true if an instruction exists to access a field of BITSIZE
8605    bits starting BITNUM bits into a memory structure.  Describe the
8606    "best" such instruction in *INSN if so.  PATTERN describes the type
8607    of insertion or extraction we want to perform and FIELDMODE is the
8608    natural mode of the extracted field.
8609
8610    The instructions considered here only access bytes that overlap
8611    the bitfield; they do not touch any surrounding bytes.  */
8612
8613 bool
8614 get_best_mem_extraction_insn (extraction_insn *insn,
8615                               enum extraction_pattern pattern,
8616                               HOST_WIDE_INT bitsize, HOST_WIDE_INT bitnum,
8617                               enum machine_mode field_mode)
8618 {
8619   unsigned HOST_WIDE_INT struct_bits = (bitnum % BITS_PER_UNIT
8620                                         + bitsize
8621                                         + BITS_PER_UNIT - 1);
8622   struct_bits -= struct_bits % BITS_PER_UNIT;
8623   return get_best_extraction_insn (insn, pattern, ET_unaligned_mem,
8624                                    struct_bits, field_mode);
8625 }
8626
8627 #include "gt-optabs.h"