gcc/optabs.c

   1 /* Expand the basic unary and binary arithmetic operations, for GNU compiler.
   2    Copyright (C) 1987-2015 Free Software Foundation, Inc.
   3
   4 This file is part of GCC.
   5
   6 GCC is free software; you can redistribute it and/or modify it under
   7 the terms of the GNU General Public License as published by the Free
   8 Software Foundation; either version 3, or (at your option) any later
   9 version.
  10
  11 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  13 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  14 for more details.
  15
  16 You should have received a copy of the GNU General Public License
  17 along with GCC; see the file COPYING3.  If not see
  18 <http://www.gnu.org/licenses/>.  */
  19
  20
  21 #include "config.h"
  22 #include "system.h"
  23 #include "coretypes.h"
  24 #include "tm.h"
  25 #include "diagnostic-core.h"
  26
  27 /* Include insn-config.h before expr.h so that HAVE_conditional_move
  28    is properly defined.  */
  29 #include "insn-config.h"
  30 #include "rtl.h"
  31 #include "hash-set.h"
  32 #include "machmode.h"
  33 #include "vec.h"
  34 #include "double-int.h"
  35 #include "input.h"
  36 #include "alias.h"
  37 #include "symtab.h"
  38 #include "wide-int.h"
  39 #include "inchash.h"
  40 #include "tree.h"
  41 #include "tree-hasher.h"
  42 #include "stor-layout.h"
  43 #include "stringpool.h"
  44 #include "varasm.h"
  45 #include "tm_p.h"
  46 #include "flags.h"
  47 #include "hard-reg-set.h"
  48 #include "function.h"
  49 #include "except.h"
  50 #include "hashtab.h"
  51 #include "statistics.h"
  52 #include "real.h"
  53 #include "fixed-value.h"
  54 #include "expmed.h"
  55 #include "dojump.h"
  56 #include "explow.h"
  57 #include "calls.h"
  58 #include "emit-rtl.h"
  59 #include "stmt.h"
  60 #include "expr.h"
  61 #include "insn-codes.h"
  62 #include "optabs.h"
  63 #include "libfuncs.h"
  64 #include "recog.h"
  65 #include "reload.h"
  66 #include "ggc.h"
  67 #include "predict.h"
  68 #include "dominance.h"
  69 #include "cfg.h"
  70 #include "basic-block.h"
  71 #include "target.h"
  72
  73 struct target_optabs default_target_optabs;
  74 struct target_libfuncs default_target_libfuncs;
  75 struct target_optabs *this_fn_optabs = &default_target_optabs;
  76 #if SWITCHABLE_TARGET
  77 struct target_optabs *this_target_optabs = &default_target_optabs;
  78 struct target_libfuncs *this_target_libfuncs = &default_target_libfuncs;
  79 #endif
  80
  81 #define libfunc_hash \
  82   (this_target_libfuncs->x_libfunc_hash)
  83
  84 static void prepare_float_lib_cmp (rtx, rtx, enum rtx_code, rtx *,
  85                                    machine_mode *);
  86 static rtx expand_unop_direct (machine_mode, optab, rtx, rtx, int);
  87 static void emit_libcall_block_1 (rtx_insn *, rtx, rtx, rtx, bool);
  88
  89 /* Debug facility for use in GDB.  */
  90 void debug_optab_libfuncs (void);
  91
  92 /* Prefixes for the current version of decimal floating point (BID vs. DPD) */
  93 #if ENABLE_DECIMAL_BID_FORMAT
  94 #define DECIMAL_PREFIX "bid_"
  95 #else
  96 #define DECIMAL_PREFIX "dpd_"
  97 #endif
  98 \f
  99 /* Used for libfunc_hash.  */
 100
 101 hashval_t
 102 libfunc_hasher::hash (libfunc_entry *e)
 103 {
 104   return ((e->mode1 + e->mode2 * NUM_MACHINE_MODES) ^ e->op);
 105 }
 106
 107 /* Used for libfunc_hash.  */
 108
 109 bool
 110 libfunc_hasher::equal (libfunc_entry *e1, libfunc_entry *e2)
 111 {
 112   return e1->op == e2->op && e1->mode1 == e2->mode1 && e1->mode2 == e2->mode2;
 113 }
 114
 115 /* Return libfunc corresponding operation defined by OPTAB converting
 116    from MODE2 to MODE1.  Trigger lazy initialization if needed, return NULL
 117    if no libfunc is available.  */
 118 rtx
 119 convert_optab_libfunc (convert_optab optab, machine_mode mode1,
 120                        machine_mode mode2)
 121 {
 122   struct libfunc_entry e;
 123   struct libfunc_entry **slot;
 124
 125   /* ??? This ought to be an assert, but not all of the places
 126      that we expand optabs know about the optabs that got moved
 127      to being direct.  */
 128   if (!(optab >= FIRST_CONV_OPTAB && optab <= LAST_CONVLIB_OPTAB))
 129     return NULL_RTX;
 130
 131   e.op = optab;
 132   e.mode1 = mode1;
 133   e.mode2 = mode2;
 134   slot = libfunc_hash->find_slot (&e, NO_INSERT);
 135   if (!slot)
 136     {
 137       const struct convert_optab_libcall_d *d
 138         = &convlib_def[optab - FIRST_CONV_OPTAB];
 139
 140       if (d->libcall_gen == NULL)
 141         return NULL;
 142
 143       d->libcall_gen (optab, d->libcall_basename, mode1, mode2);
 144       slot = libfunc_hash->find_slot (&e, NO_INSERT);
 145       if (!slot)
 146         return NULL;
 147     }
 148   return (*slot)->libfunc;
 149 }
 150
 151 /* Return libfunc corresponding operation defined by OPTAB in MODE.
 152    Trigger lazy initialization if needed, return NULL if no libfunc is
 153    available.  */
 154 rtx
 155 optab_libfunc (optab optab, machine_mode mode)
 156 {
 157   struct libfunc_entry e;
 158   struct libfunc_entry **slot;
 159
 160   /* ??? This ought to be an assert, but not all of the places
 161      that we expand optabs know about the optabs that got moved
 162      to being direct.  */
 163   if (!(optab >= FIRST_NORM_OPTAB && optab <= LAST_NORMLIB_OPTAB))
 164     return NULL_RTX;
 165
 166   e.op = optab;
 167   e.mode1 = mode;
 168   e.mode2 = VOIDmode;
 169   slot = libfunc_hash->find_slot (&e, NO_INSERT);
 170   if (!slot)
 171     {
 172       const struct optab_libcall_d *d
 173         = &normlib_def[optab - FIRST_NORM_OPTAB];
 174
 175       if (d->libcall_gen == NULL)
 176         return NULL;
 177
 178       d->libcall_gen (optab, d->libcall_basename, d->libcall_suffix, mode);
 179       slot = libfunc_hash->find_slot (&e, NO_INSERT);
 180       if (!slot)
 181         return NULL;
 182     }
 183   return (*slot)->libfunc;
 184 }
 185
 186 \f
 187 /* Add a REG_EQUAL note to the last insn in INSNS.  TARGET is being set to
 188    the result of operation CODE applied to OP0 (and OP1 if it is a binary
 189    operation).
 190
 191    If the last insn does not set TARGET, don't do anything, but return 1.
 192
 193    If the last insn or a previous insn sets TARGET and TARGET is one of OP0
 194    or OP1, don't add the REG_EQUAL note but return 0.  Our caller can then
 195    try again, ensuring that TARGET is not one of the operands.  */
 196
 197 static int
 198 add_equal_note (rtx_insn *insns, rtx target, enum rtx_code code, rtx op0, rtx op1)
 199 {
 200   rtx_insn *last_insn;
 201   rtx set;
 202   rtx note;
 203
 204   gcc_assert (insns && INSN_P (insns) && NEXT_INSN (insns));
 205
 206   if (GET_RTX_CLASS (code) != RTX_COMM_ARITH
 207       && GET_RTX_CLASS (code) != RTX_BIN_ARITH
 208       && GET_RTX_CLASS (code) != RTX_COMM_COMPARE
 209       && GET_RTX_CLASS (code) != RTX_COMPARE
 210       && GET_RTX_CLASS (code) != RTX_UNARY)
 211     return 1;
 212
 213   if (GET_CODE (target) == ZERO_EXTRACT)
 214     return 1;
 215
 216   for (last_insn = insns;
 217        NEXT_INSN (last_insn) != NULL_RTX;
 218        last_insn = NEXT_INSN (last_insn))
 219     ;
 220
 221   /* If TARGET is in OP0 or OP1, punt.  We'd end up with a note referencing
 222      a value changing in the insn, so the note would be invalid for CSE.  */
 223   if (reg_overlap_mentioned_p (target, op0)
 224       || (op1 && reg_overlap_mentioned_p (target, op1)))
 225     {
 226       if (MEM_P (target)
 227           && (rtx_equal_p (target, op0)
 228               || (op1 && rtx_equal_p (target, op1))))
 229         {
 230           /* For MEM target, with MEM = MEM op X, prefer no REG_EQUAL note
 231              over expanding it as temp = MEM op X, MEM = temp.  If the target
 232              supports MEM = MEM op X instructions, it is sometimes too hard
 233              to reconstruct that form later, especially if X is also a memory,
 234              and due to multiple occurrences of addresses the address might
 235              be forced into register unnecessarily.
 236              Note that not emitting the REG_EQUIV note might inhibit
 237              CSE in some cases.  */
 238           set = single_set (last_insn);
 239           if (set
 240               && GET_CODE (SET_SRC (set)) == code
 241               && MEM_P (SET_DEST (set))
 242               && (rtx_equal_p (SET_DEST (set), XEXP (SET_SRC (set), 0))
 243                   || (op1 && rtx_equal_p (SET_DEST (set),
 244                                           XEXP (SET_SRC (set), 1)))))
 245             return 1;
 246         }
 247       return 0;
 248     }
 249
 250   set = set_for_reg_notes (last_insn);
 251   if (set == NULL_RTX)
 252     return 1;
 253
 254   if (! rtx_equal_p (SET_DEST (set), target)
 255       /* For a STRICT_LOW_PART, the REG_NOTE applies to what is inside it.  */
 256       && (GET_CODE (SET_DEST (set)) != STRICT_LOW_PART
 257           || ! rtx_equal_p (XEXP (SET_DEST (set), 0), target)))
 258     return 1;
 259
 260   if (GET_RTX_CLASS (code) == RTX_UNARY)
 261     switch (code)
 262       {
 263       case FFS:
 264       case CLZ:
 265       case CTZ:
 266       case CLRSB:
 267       case POPCOUNT:
 268       case PARITY:
 269       case BSWAP:
 270         if (GET_MODE (op0) != VOIDmode && GET_MODE (target) != GET_MODE (op0))
 271           {
 272             note = gen_rtx_fmt_e (code, GET_MODE (op0), copy_rtx (op0));
 273             if (GET_MODE_SIZE (GET_MODE (op0))
 274                 > GET_MODE_SIZE (GET_MODE (target)))
 275               note = simplify_gen_unary (TRUNCATE, GET_MODE (target),
 276                                          note, GET_MODE (op0));
 277             else
 278               note = simplify_gen_unary (ZERO_EXTEND, GET_MODE (target),
 279                                          note, GET_MODE (op0));
 280             break;
 281           }
 282         /* FALLTHRU */
 283       default:
 284         note = gen_rtx_fmt_e (code, GET_MODE (target), copy_rtx (op0));
 285         break;
 286       }
 287   else
 288     note = gen_rtx_fmt_ee (code, GET_MODE (target), copy_rtx (op0), copy_rtx (op1));
 289
 290   set_unique_reg_note (last_insn, REG_EQUAL, note);
 291
 292   return 1;
 293 }
 294 \f
 295 /* Given two input operands, OP0 and OP1, determine what the correct from_mode
 296    for a widening operation would be.  In most cases this would be OP0, but if
 297    that's a constant it'll be VOIDmode, which isn't useful.  */
 298
 299 static machine_mode
 300 widened_mode (machine_mode to_mode, rtx op0, rtx op1)
 301 {
 302   machine_mode m0 = GET_MODE (op0);
 303   machine_mode m1 = GET_MODE (op1);
 304   machine_mode result;
 305
 306   if (m0 == VOIDmode && m1 == VOIDmode)
 307     return to_mode;
 308   else if (m0 == VOIDmode || GET_MODE_SIZE (m0) < GET_MODE_SIZE (m1))
 309     result = m1;
 310   else
 311     result = m0;
 312
 313   if (GET_MODE_SIZE (result) > GET_MODE_SIZE (to_mode))
 314     return to_mode;
 315
 316   return result;
 317 }
 318 \f
 319 /* Like optab_handler, but for widening_operations that have a
 320    TO_MODE and a FROM_MODE.  */
 321
 322 enum insn_code
 323 widening_optab_handler (optab op, machine_mode to_mode,
 324                         machine_mode from_mode)
 325 {
 326   unsigned scode = (op << 16) | to_mode;
 327   if (to_mode != from_mode && from_mode != VOIDmode)
 328     {
 329       /* ??? Why does find_widening_optab_handler_and_mode attempt to
 330          widen things that can't be widened?  E.g. add_optab... */
 331       if (op > LAST_CONV_OPTAB)
 332         return CODE_FOR_nothing;
 333       scode |= from_mode << 8;
 334     }
 335   return raw_optab_handler (scode);
 336 }
 337
 338 /* Find a widening optab even if it doesn't widen as much as we want.
 339    E.g. if from_mode is HImode, and to_mode is DImode, and there is no
 340    direct HI->SI insn, then return SI->DI, if that exists.
 341    If PERMIT_NON_WIDENING is non-zero then this can be used with
 342    non-widening optabs also.  */
 343
 344 enum insn_code
 345 find_widening_optab_handler_and_mode (optab op, machine_mode to_mode,
 346                                       machine_mode from_mode,
 347                                       int permit_non_widening,
 348                                       machine_mode *found_mode)
 349 {
 350   for (; (permit_non_widening || from_mode != to_mode)
 351          && GET_MODE_SIZE (from_mode) <= GET_MODE_SIZE (to_mode)
 352          && from_mode != VOIDmode;
 353        from_mode = GET_MODE_WIDER_MODE (from_mode))
 354     {
 355       enum insn_code handler = widening_optab_handler (op, to_mode,
 356                                                        from_mode);
 357
 358       if (handler != CODE_FOR_nothing)
 359         {
 360           if (found_mode)
 361             *found_mode = from_mode;
 362           return handler;
 363         }
 364     }
 365
 366   return CODE_FOR_nothing;
 367 }
 368 \f
 369 /* Widen OP to MODE and return the rtx for the widened operand.  UNSIGNEDP
 370    says whether OP is signed or unsigned.  NO_EXTEND is nonzero if we need
 371    not actually do a sign-extend or zero-extend, but can leave the
 372    higher-order bits of the result rtx undefined, for example, in the case
 373    of logical operations, but not right shifts.  */
 374
 375 static rtx
 376 widen_operand (rtx op, machine_mode mode, machine_mode oldmode,
 377                int unsignedp, int no_extend)
 378 {
 379   rtx result;
 380
 381   /* If we don't have to extend and this is a constant, return it.  */
 382   if (no_extend && GET_MODE (op) == VOIDmode)
 383     return op;
 384
 385   /* If we must extend do so.  If OP is a SUBREG for a promoted object, also
 386      extend since it will be more efficient to do so unless the signedness of
 387      a promoted object differs from our extension.  */
 388   if (! no_extend
 389       || (GET_CODE (op) == SUBREG && SUBREG_PROMOTED_VAR_P (op)
 390           && SUBREG_CHECK_PROMOTED_SIGN (op, unsignedp)))
 391     return convert_modes (mode, oldmode, op, unsignedp);
 392
 393   /* If MODE is no wider than a single word, we return a lowpart or paradoxical
 394      SUBREG.  */
 395   if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
 396     return gen_lowpart (mode, force_reg (GET_MODE (op), op));
 397
 398   /* Otherwise, get an object of MODE, clobber it, and set the low-order
 399      part to OP.  */
 400
 401   result = gen_reg_rtx (mode);
 402   emit_clobber (result);
 403   emit_move_insn (gen_lowpart (GET_MODE (op), result), op);
 404   return result;
 405 }
 406 \f
 407 /* Return the optab used for computing the operation given by the tree code,
 408    CODE and the tree EXP.  This function is not always usable (for example, it
 409    cannot give complete results for multiplication or division) but probably
 410    ought to be relied on more widely throughout the expander.  */
 411 optab
 412 optab_for_tree_code (enum tree_code code, const_tree type,
 413                      enum optab_subtype subtype)
 414 {
 415   bool trapv;
 416   switch (code)
 417     {
 418     case BIT_AND_EXPR:
 419       return and_optab;
 420
 421     case BIT_IOR_EXPR:
 422       return ior_optab;
 423
 424     case BIT_NOT_EXPR:
 425       return one_cmpl_optab;
 426
 427     case BIT_XOR_EXPR:
 428       return xor_optab;
 429
 430     case MULT_HIGHPART_EXPR:
 431       return TYPE_UNSIGNED (type) ? umul_highpart_optab : smul_highpart_optab;
 432
 433     case TRUNC_MOD_EXPR:
 434     case CEIL_MOD_EXPR:
 435     case FLOOR_MOD_EXPR:
 436     case ROUND_MOD_EXPR:
 437       return TYPE_UNSIGNED (type) ? umod_optab : smod_optab;
 438
 439     case RDIV_EXPR:
 440     case TRUNC_DIV_EXPR:
 441     case CEIL_DIV_EXPR:
 442     case FLOOR_DIV_EXPR:
 443     case ROUND_DIV_EXPR:
 444     case EXACT_DIV_EXPR:
 445       if (TYPE_SATURATING (type))
 446         return TYPE_UNSIGNED (type) ? usdiv_optab : ssdiv_optab;
 447       return TYPE_UNSIGNED (type) ? udiv_optab : sdiv_optab;
 448
 449     case LSHIFT_EXPR:
 450       if (TREE_CODE (type) == VECTOR_TYPE)
 451         {
 452           if (subtype == optab_vector)
 453             return TYPE_SATURATING (type) ? unknown_optab : vashl_optab;
 454
 455           gcc_assert (subtype == optab_scalar);
 456         }
 457       if (TYPE_SATURATING (type))
 458         return TYPE_UNSIGNED (type) ? usashl_optab : ssashl_optab;
 459       return ashl_optab;
 460
 461     case RSHIFT_EXPR:
 462       if (TREE_CODE (type) == VECTOR_TYPE)
 463         {
 464           if (subtype == optab_vector)
 465             return TYPE_UNSIGNED (type) ? vlshr_optab : vashr_optab;
 466
 467           gcc_assert (subtype == optab_scalar);
 468         }
 469       return TYPE_UNSIGNED (type) ? lshr_optab : ashr_optab;
 470
 471     case LROTATE_EXPR:
 472       if (TREE_CODE (type) == VECTOR_TYPE)
 473         {
 474           if (subtype == optab_vector)
 475             return vrotl_optab;
 476
 477           gcc_assert (subtype == optab_scalar);
 478         }
 479       return rotl_optab;
 480
 481     case RROTATE_EXPR:
 482       if (TREE_CODE (type) == VECTOR_TYPE)
 483         {
 484           if (subtype == optab_vector)
 485             return vrotr_optab;
 486
 487           gcc_assert (subtype == optab_scalar);
 488         }
 489       return rotr_optab;
 490
 491     case MAX_EXPR:
 492       return TYPE_UNSIGNED (type) ? umax_optab : smax_optab;
 493
 494     case MIN_EXPR:
 495       return TYPE_UNSIGNED (type) ? umin_optab : smin_optab;
 496
 497     case REALIGN_LOAD_EXPR:
 498       return vec_realign_load_optab;
 499
 500     case WIDEN_SUM_EXPR:
 501       return TYPE_UNSIGNED (type) ? usum_widen_optab : ssum_widen_optab;
 502
 503     case DOT_PROD_EXPR:
 504       return TYPE_UNSIGNED (type) ? udot_prod_optab : sdot_prod_optab;
 505
 506     case SAD_EXPR:
 507       return TYPE_UNSIGNED (type) ? usad_optab : ssad_optab;
 508
 509     case WIDEN_MULT_PLUS_EXPR:
 510       return (TYPE_UNSIGNED (type)
 511               ? (TYPE_SATURATING (type)
 512                  ? usmadd_widen_optab : umadd_widen_optab)
 513               : (TYPE_SATURATING (type)
 514                  ? ssmadd_widen_optab : smadd_widen_optab));
 515
 516     case WIDEN_MULT_MINUS_EXPR:
 517       return (TYPE_UNSIGNED (type)
 518               ? (TYPE_SATURATING (type)
 519                  ? usmsub_widen_optab : umsub_widen_optab)
 520               : (TYPE_SATURATING (type)
 521                  ? ssmsub_widen_optab : smsub_widen_optab));
 522
 523     case FMA_EXPR:
 524       return fma_optab;
 525
 526     case REDUC_MAX_EXPR:
 527       return TYPE_UNSIGNED (type)
 528              ? reduc_umax_scal_optab : reduc_smax_scal_optab;
 529
 530     case REDUC_MIN_EXPR:
 531       return TYPE_UNSIGNED (type)
 532              ? reduc_umin_scal_optab : reduc_smin_scal_optab;
 533
 534     case REDUC_PLUS_EXPR:
 535       return reduc_plus_scal_optab;
 536
 537     case VEC_WIDEN_MULT_HI_EXPR:
 538       return TYPE_UNSIGNED (type) ?
 539         vec_widen_umult_hi_optab : vec_widen_smult_hi_optab;
 540
 541     case VEC_WIDEN_MULT_LO_EXPR:
 542       return TYPE_UNSIGNED (type) ?
 543         vec_widen_umult_lo_optab : vec_widen_smult_lo_optab;
 544
 545     case VEC_WIDEN_MULT_EVEN_EXPR:
 546       return TYPE_UNSIGNED (type) ?
 547         vec_widen_umult_even_optab : vec_widen_smult_even_optab;
 548
 549     case VEC_WIDEN_MULT_ODD_EXPR:
 550       return TYPE_UNSIGNED (type) ?
 551         vec_widen_umult_odd_optab : vec_widen_smult_odd_optab;
 552
 553     case VEC_WIDEN_LSHIFT_HI_EXPR:
 554       return TYPE_UNSIGNED (type) ?
 555         vec_widen_ushiftl_hi_optab : vec_widen_sshiftl_hi_optab;
 556
 557     case VEC_WIDEN_LSHIFT_LO_EXPR:
 558       return TYPE_UNSIGNED (type) ?
 559         vec_widen_ushiftl_lo_optab : vec_widen_sshiftl_lo_optab;
 560
 561     case VEC_UNPACK_HI_EXPR:
 562       return TYPE_UNSIGNED (type) ?
 563         vec_unpacku_hi_optab : vec_unpacks_hi_optab;
 564
 565     case VEC_UNPACK_LO_EXPR:
 566       return TYPE_UNSIGNED (type) ?
 567         vec_unpacku_lo_optab : vec_unpacks_lo_optab;
 568
 569     case VEC_UNPACK_FLOAT_HI_EXPR:
 570       /* The signedness is determined from input operand.  */
 571       return TYPE_UNSIGNED (type) ?
 572         vec_unpacku_float_hi_optab : vec_unpacks_float_hi_optab;
 573
 574     case VEC_UNPACK_FLOAT_LO_EXPR:
 575       /* The signedness is determined from input operand.  */
 576       return TYPE_UNSIGNED (type) ?
 577         vec_unpacku_float_lo_optab : vec_unpacks_float_lo_optab;
 578
 579     case VEC_PACK_TRUNC_EXPR:
 580       return vec_pack_trunc_optab;
 581
 582     case VEC_PACK_SAT_EXPR:
 583       return TYPE_UNSIGNED (type) ? vec_pack_usat_optab : vec_pack_ssat_optab;
 584
 585     case VEC_PACK_FIX_TRUNC_EXPR:
 586       /* The signedness is determined from output operand.  */
 587       return TYPE_UNSIGNED (type) ?
 588         vec_pack_ufix_trunc_optab : vec_pack_sfix_trunc_optab;
 589
 590     default:
 591       break;
 592     }
 593
 594   trapv = INTEGRAL_TYPE_P (type) && TYPE_OVERFLOW_TRAPS (type);
 595   switch (code)
 596     {
 597     case POINTER_PLUS_EXPR:
 598     case PLUS_EXPR:
 599       if (TYPE_SATURATING (type))
 600         return TYPE_UNSIGNED (type) ? usadd_optab : ssadd_optab;
 601       return trapv ? addv_optab : add_optab;
 602
 603     case MINUS_EXPR:
 604       if (TYPE_SATURATING (type))
 605         return TYPE_UNSIGNED (type) ? ussub_optab : sssub_optab;
 606       return trapv ? subv_optab : sub_optab;
 607
 608     case MULT_EXPR:
 609       if (TYPE_SATURATING (type))
 610         return TYPE_UNSIGNED (type) ? usmul_optab : ssmul_optab;
 611       return trapv ? smulv_optab : smul_optab;
 612
 613     case NEGATE_EXPR:
 614       if (TYPE_SATURATING (type))
 615         return TYPE_UNSIGNED (type) ? usneg_optab : ssneg_optab;
 616       return trapv ? negv_optab : neg_optab;
 617
 618     case ABS_EXPR:
 619       return trapv ? absv_optab : abs_optab;
 620
 621     default:
 622       return unknown_optab;
 623     }
 624 }
 625
 626 /* Given optab UNOPTAB that reduces a vector to a scalar, find instead the old
 627    optab that produces a vector with the reduction result in one element,
 628    for a tree with type TYPE.  */
 629
 630 optab
 631 scalar_reduc_to_vector (optab unoptab, const_tree type)
 632 {
 633   switch (unoptab)
 634     {
 635     case reduc_plus_scal_optab:
 636       return TYPE_UNSIGNED (type) ? reduc_uplus_optab : reduc_splus_optab;
 637
 638     case reduc_smin_scal_optab: return reduc_smin_optab;
 639     case reduc_umin_scal_optab: return reduc_umin_optab;
 640     case reduc_smax_scal_optab: return reduc_smax_optab;
 641     case reduc_umax_scal_optab: return reduc_umax_optab;
 642     default: return unknown_optab;
 643     }
 644 }
 645
 646 /* Expand vector widening operations.
 647
 648    There are two different classes of operations handled here:
 649    1) Operations whose result is wider than all the arguments to the operation.
 650       Examples: VEC_UNPACK_HI/LO_EXPR, VEC_WIDEN_MULT_HI/LO_EXPR
 651       In this case OP0 and optionally OP1 would be initialized,
 652       but WIDE_OP wouldn't (not relevant for this case).
 653    2) Operations whose result is of the same size as the last argument to the
 654       operation, but wider than all the other arguments to the operation.
 655       Examples: WIDEN_SUM_EXPR, VEC_DOT_PROD_EXPR.
 656       In the case WIDE_OP, OP0 and optionally OP1 would be initialized.
 657
 658    E.g, when called to expand the following operations, this is how
 659    the arguments will be initialized:
 660                                 nops    OP0     OP1     WIDE_OP
 661    widening-sum                 2       oprnd0  -       oprnd1
 662    widening-dot-product         3       oprnd0  oprnd1  oprnd2
 663    widening-mult                2       oprnd0  oprnd1  -
 664    type-promotion (vec-unpack)  1       oprnd0  -       -  */
 665
 666 rtx
 667 expand_widen_pattern_expr (sepops ops, rtx op0, rtx op1, rtx wide_op,
 668                            rtx target, int unsignedp)
 669 {
 670   struct expand_operand eops[4];
 671   tree oprnd0, oprnd1, oprnd2;
 672   machine_mode wmode = VOIDmode, tmode0, tmode1 = VOIDmode;
 673   optab widen_pattern_optab;
 674   enum insn_code icode;
 675   int nops = TREE_CODE_LENGTH (ops->code);
 676   int op;
 677
 678   oprnd0 = ops->op0;
 679   tmode0 = TYPE_MODE (TREE_TYPE (oprnd0));
 680   widen_pattern_optab =
 681     optab_for_tree_code (ops->code, TREE_TYPE (oprnd0), optab_default);
 682   if (ops->code == WIDEN_MULT_PLUS_EXPR
 683       || ops->code == WIDEN_MULT_MINUS_EXPR)
 684     icode = find_widening_optab_handler (widen_pattern_optab,
 685                                          TYPE_MODE (TREE_TYPE (ops->op2)),
 686                                          tmode0, 0);
 687   else
 688     icode = optab_handler (widen_pattern_optab, tmode0);
 689   gcc_assert (icode != CODE_FOR_nothing);
 690
 691   if (nops >= 2)
 692     {
 693       oprnd1 = ops->op1;
 694       tmode1 = TYPE_MODE (TREE_TYPE (oprnd1));
 695     }
 696
 697   /* The last operand is of a wider mode than the rest of the operands.  */
 698   if (nops == 2)
 699     wmode = tmode1;
 700   else if (nops == 3)
 701     {
 702       gcc_assert (tmode1 == tmode0);
 703       gcc_assert (op1);
 704       oprnd2 = ops->op2;
 705       wmode = TYPE_MODE (TREE_TYPE (oprnd2));
 706     }
 707
 708   op = 0;
 709   create_output_operand (&eops[op++], target, TYPE_MODE (ops->type));
 710   create_convert_operand_from (&eops[op++], op0, tmode0, unsignedp);
 711   if (op1)
 712     create_convert_operand_from (&eops[op++], op1, tmode1, unsignedp);
 713   if (wide_op)
 714     create_convert_operand_from (&eops[op++], wide_op, wmode, unsignedp);
 715   expand_insn (icode, op, eops);
 716   return eops[0].value;
 717 }
 718
 719 /* Generate code to perform an operation specified by TERNARY_OPTAB
 720    on operands OP0, OP1 and OP2, with result having machine-mode MODE.
 721
 722    UNSIGNEDP is for the case where we have to widen the operands
 723    to perform the operation.  It says to use zero-extension.
 724
 725    If TARGET is nonzero, the value
 726    is generated there, if it is convenient to do so.
 727    In all cases an rtx is returned for the locus of the value;
 728    this may or may not be TARGET.  */
 729
 730 rtx
 731 expand_ternary_op (machine_mode mode, optab ternary_optab, rtx op0,
 732                    rtx op1, rtx op2, rtx target, int unsignedp)
 733 {
 734   struct expand_operand ops[4];
 735   enum insn_code icode = optab_handler (ternary_optab, mode);
 736
 737   gcc_assert (optab_handler (ternary_optab, mode) != CODE_FOR_nothing);
 738
 739   create_output_operand (&ops[0], target, mode);
 740   create_convert_operand_from (&ops[1], op0, mode, unsignedp);
 741   create_convert_operand_from (&ops[2], op1, mode, unsignedp);
 742   create_convert_operand_from (&ops[3], op2, mode, unsignedp);
 743   expand_insn (icode, 4, ops);
 744   return ops[0].value;
 745 }
 746
 747
 748 /* Like expand_binop, but return a constant rtx if the result can be
 749    calculated at compile time.  The arguments and return value are
 750    otherwise the same as for expand_binop.  */
 751
 752 rtx
 753 simplify_expand_binop (machine_mode mode, optab binoptab,
 754                        rtx op0, rtx op1, rtx target, int unsignedp,
 755                        enum optab_methods methods)
 756 {
 757   if (CONSTANT_P (op0) && CONSTANT_P (op1))
 758     {
 759       rtx x = simplify_binary_operation (optab_to_code (binoptab),
 760                                          mode, op0, op1);
 761       if (x)
 762         return x;
 763     }
 764
 765   return expand_binop (mode, binoptab, op0, op1, target, unsignedp, methods);
 766 }
 767
 768 /* Like simplify_expand_binop, but always put the result in TARGET.
 769    Return true if the expansion succeeded.  */
 770
 771 bool
 772 force_expand_binop (machine_mode mode, optab binoptab,
 773                     rtx op0, rtx op1, rtx target, int unsignedp,
 774                     enum optab_methods methods)
 775 {
 776   rtx x = simplify_expand_binop (mode, binoptab, op0, op1,
 777                                  target, unsignedp, methods);
 778   if (x == 0)
 779     return false;
 780   if (x != target)
 781     emit_move_insn (target, x);
 782   return true;
 783 }
 784
 785 /* Create a new vector value in VMODE with all elements set to OP.  The
 786    mode of OP must be the element mode of VMODE.  If OP is a constant,
 787    then the return value will be a constant.  */
 788
 789 static rtx
 790 expand_vector_broadcast (machine_mode vmode, rtx op)
 791 {
 792   enum insn_code icode;
 793   rtvec vec;
 794   rtx ret;
 795   int i, n;
 796
 797   gcc_checking_assert (VECTOR_MODE_P (vmode));
 798
 799   n = GET_MODE_NUNITS (vmode);
 800   vec = rtvec_alloc (n);
 801   for (i = 0; i < n; ++i)
 802     RTVEC_ELT (vec, i) = op;
 803
 804   if (CONSTANT_P (op))
 805     return gen_rtx_CONST_VECTOR (vmode, vec);
 806
 807   /* ??? If the target doesn't have a vec_init, then we have no easy way
 808      of performing this operation.  Most of this sort of generic support
 809      is hidden away in the vector lowering support in gimple.  */
 810   icode = optab_handler (vec_init_optab, vmode);
 811   if (icode == CODE_FOR_nothing)
 812     return NULL;
 813
 814   ret = gen_reg_rtx (vmode);
 815   emit_insn (GEN_FCN (icode) (ret, gen_rtx_PARALLEL (vmode, vec)));
 816
 817   return ret;
 818 }
 819
 820 /* This subroutine of expand_doubleword_shift handles the cases in which
 821    the effective shift value is >= BITS_PER_WORD.  The arguments and return
 822    value are the same as for the parent routine, except that SUPERWORD_OP1
 823    is the shift count to use when shifting OUTOF_INPUT into INTO_TARGET.
 824    INTO_TARGET may be null if the caller has decided to calculate it.  */
 825
 826 static bool
 827 expand_superword_shift (optab binoptab, rtx outof_input, rtx superword_op1,
 828                         rtx outof_target, rtx into_target,
 829                         int unsignedp, enum optab_methods methods)
 830 {
 831   if (into_target != 0)
 832     if (!force_expand_binop (word_mode, binoptab, outof_input, superword_op1,
 833                              into_target, unsignedp, methods))
 834       return false;
 835
 836   if (outof_target != 0)
 837     {
 838       /* For a signed right shift, we must fill OUTOF_TARGET with copies
 839          of the sign bit, otherwise we must fill it with zeros.  */
 840       if (binoptab != ashr_optab)
 841         emit_move_insn (outof_target, CONST0_RTX (word_mode));
 842       else
 843         if (!force_expand_binop (word_mode, binoptab,
 844                                  outof_input, GEN_INT (BITS_PER_WORD - 1),
 845                                  outof_target, unsignedp, methods))
 846           return false;
 847     }
 848   return true;
 849 }
 850
 851 /* This subroutine of expand_doubleword_shift handles the cases in which
 852    the effective shift value is < BITS_PER_WORD.  The arguments and return
 853    value are the same as for the parent routine.  */
 854
 855 static bool
 856 expand_subword_shift (machine_mode op1_mode, optab binoptab,
 857                       rtx outof_input, rtx into_input, rtx op1,
 858                       rtx outof_target, rtx into_target,
 859                       int unsignedp, enum optab_methods methods,
 860                       unsigned HOST_WIDE_INT shift_mask)
 861 {
 862   optab reverse_unsigned_shift, unsigned_shift;
 863   rtx tmp, carries;
 864
 865   reverse_unsigned_shift = (binoptab == ashl_optab ? lshr_optab : ashl_optab);
 866   unsigned_shift = (binoptab == ashl_optab ? ashl_optab : lshr_optab);
 867
 868   /* The low OP1 bits of INTO_TARGET come from the high bits of OUTOF_INPUT.
 869      We therefore need to shift OUTOF_INPUT by (BITS_PER_WORD - OP1) bits in
 870      the opposite direction to BINOPTAB.  */
 871   if (CONSTANT_P (op1) || shift_mask >= BITS_PER_WORD)
 872     {
 873       carries = outof_input;
 874       tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD,
 875                                             op1_mode), op1_mode);
 876       tmp = simplify_expand_binop (op1_mode, sub_optab, tmp, op1,
 877                                    0, true, methods);
 878     }
 879   else
 880     {
 881       /* We must avoid shifting by BITS_PER_WORD bits since that is either
 882          the same as a zero shift (if shift_mask == BITS_PER_WORD - 1) or
 883          has unknown behavior.  Do a single shift first, then shift by the
 884          remainder.  It's OK to use ~OP1 as the remainder if shift counts
 885          are truncated to the mode size.  */
 886       carries = expand_binop (word_mode, reverse_unsigned_shift,
 887                               outof_input, const1_rtx, 0, unsignedp, methods);
 888       if (shift_mask == BITS_PER_WORD - 1)
 889         {
 890           tmp = immed_wide_int_const
 891             (wi::minus_one (GET_MODE_PRECISION (op1_mode)), op1_mode);
 892           tmp = simplify_expand_binop (op1_mode, xor_optab, op1, tmp,
 893                                        0, true, methods);
 894         }
 895       else
 896         {
 897           tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD - 1,
 898                                                 op1_mode), op1_mode);
 899           tmp = simplify_expand_binop (op1_mode, sub_optab, tmp, op1,
 900                                        0, true, methods);
 901         }
 902     }
 903   if (tmp == 0 || carries == 0)
 904     return false;
 905   carries = expand_binop (word_mode, reverse_unsigned_shift,
 906                           carries, tmp, 0, unsignedp, methods);
 907   if (carries == 0)
 908     return false;
 909
 910   /* Shift INTO_INPUT logically by OP1.  This is the last use of INTO_INPUT
 911      so the result can go directly into INTO_TARGET if convenient.  */
 912   tmp = expand_binop (word_mode, unsigned_shift, into_input, op1,
 913                       into_target, unsignedp, methods);
 914   if (tmp == 0)
 915     return false;
 916
 917   /* Now OR in the bits carried over from OUTOF_INPUT.  */
 918   if (!force_expand_binop (word_mode, ior_optab, tmp, carries,
 919                            into_target, unsignedp, methods))
 920     return false;
 921
 922   /* Use a standard word_mode shift for the out-of half.  */
 923   if (outof_target != 0)
 924     if (!force_expand_binop (word_mode, binoptab, outof_input, op1,
 925                              outof_target, unsignedp, methods))
 926       return false;
 927
 928   return true;
 929 }
 930
 931
 932 #ifdef HAVE_conditional_move
 933 /* Try implementing expand_doubleword_shift using conditional moves.
 934    The shift is by < BITS_PER_WORD if (CMP_CODE CMP1 CMP2) is true,
 935    otherwise it is by >= BITS_PER_WORD.  SUBWORD_OP1 and SUPERWORD_OP1
 936    are the shift counts to use in the former and latter case.  All other
 937    arguments are the same as the parent routine.  */
 938
 939 static bool
 940 expand_doubleword_shift_condmove (machine_mode op1_mode, optab binoptab,
 941                                   enum rtx_code cmp_code, rtx cmp1, rtx cmp2,
 942                                   rtx outof_input, rtx into_input,
 943                                   rtx subword_op1, rtx superword_op1,
 944                                   rtx outof_target, rtx into_target,
 945                                   int unsignedp, enum optab_methods methods,
 946                                   unsigned HOST_WIDE_INT shift_mask)
 947 {
 948   rtx outof_superword, into_superword;
 949
 950   /* Put the superword version of the output into OUTOF_SUPERWORD and
 951      INTO_SUPERWORD.  */
 952   outof_superword = outof_target != 0 ? gen_reg_rtx (word_mode) : 0;
 953   if (outof_target != 0 && subword_op1 == superword_op1)
 954     {
 955       /* The value INTO_TARGET >> SUBWORD_OP1, which we later store in
 956          OUTOF_TARGET, is the same as the value of INTO_SUPERWORD.  */
 957       into_superword = outof_target;
 958       if (!expand_superword_shift (binoptab, outof_input, superword_op1,
 959                                    outof_superword, 0, unsignedp, methods))
 960         return false;
 961     }
 962   else
 963     {
 964       into_superword = gen_reg_rtx (word_mode);
 965       if (!expand_superword_shift (binoptab, outof_input, superword_op1,
 966                                    outof_superword, into_superword,
 967                                    unsignedp, methods))
 968         return false;
 969     }
 970
 971   /* Put the subword version directly in OUTOF_TARGET and INTO_TARGET.  */
 972   if (!expand_subword_shift (op1_mode, binoptab,
 973                              outof_input, into_input, subword_op1,
 974                              outof_target, into_target,
 975                              unsignedp, methods, shift_mask))
 976     return false;
 977
 978   /* Select between them.  Do the INTO half first because INTO_SUPERWORD
 979      might be the current value of OUTOF_TARGET.  */
 980   if (!emit_conditional_move (into_target, cmp_code, cmp1, cmp2, op1_mode,
 981                               into_target, into_superword, word_mode, false))
 982     return false;
 983
 984   if (outof_target != 0)
 985     if (!emit_conditional_move (outof_target, cmp_code, cmp1, cmp2, op1_mode,
 986                                 outof_target, outof_superword,
 987                                 word_mode, false))
 988       return false;
 989
 990   return true;
 991 }
 992 #endif
 993
 994 /* Expand a doubleword shift (ashl, ashr or lshr) using word-mode shifts.
 995    OUTOF_INPUT and INTO_INPUT are the two word-sized halves of the first
 996    input operand; the shift moves bits in the direction OUTOF_INPUT->
 997    INTO_TARGET.  OUTOF_TARGET and INTO_TARGET are the equivalent words
 998    of the target.  OP1 is the shift count and OP1_MODE is its mode.
 999    If OP1 is constant, it will have been truncated as appropriate
1000    and is known to be nonzero.
1001
1002    If SHIFT_MASK is zero, the result of word shifts is undefined when the
1003    shift count is outside the range [0, BITS_PER_WORD).  This routine must
1004    avoid generating such shifts for OP1s in the range [0, BITS_PER_WORD * 2).
1005
1006    If SHIFT_MASK is nonzero, all word-mode shift counts are effectively
1007    masked by it and shifts in the range [BITS_PER_WORD, SHIFT_MASK) will
1008    fill with zeros or sign bits as appropriate.
1009
1010    If SHIFT_MASK is BITS_PER_WORD - 1, this routine will synthesize
1011    a doubleword shift whose equivalent mask is BITS_PER_WORD * 2 - 1.
1012    Doing this preserves semantics required by SHIFT_COUNT_TRUNCATED.
1013    In all other cases, shifts by values outside [0, BITS_PER_UNIT * 2)
1014    are undefined.
1015
1016    BINOPTAB, UNSIGNEDP and METHODS are as for expand_binop.  This function
1017    may not use INTO_INPUT after modifying INTO_TARGET, and similarly for
1018    OUTOF_INPUT and OUTOF_TARGET.  OUTOF_TARGET can be null if the parent
1019    function wants to calculate it itself.
1020
1021    Return true if the shift could be successfully synthesized.  */
1022
1023 static bool
1024 expand_doubleword_shift (machine_mode op1_mode, optab binoptab,
1025                          rtx outof_input, rtx into_input, rtx op1,
1026                          rtx outof_target, rtx into_target,
1027                          int unsignedp, enum optab_methods methods,
1028                          unsigned HOST_WIDE_INT shift_mask)
1029 {
1030   rtx superword_op1, tmp, cmp1, cmp2;
1031   enum rtx_code cmp_code;
1032
1033   /* See if word-mode shifts by BITS_PER_WORD...BITS_PER_WORD * 2 - 1 will
1034      fill the result with sign or zero bits as appropriate.  If so, the value
1035      of OUTOF_TARGET will always be (SHIFT OUTOF_INPUT OP1).   Recursively call
1036      this routine to calculate INTO_TARGET (which depends on both OUTOF_INPUT
1037      and INTO_INPUT), then emit code to set up OUTOF_TARGET.
1038
1039      This isn't worthwhile for constant shifts since the optimizers will
1040      cope better with in-range shift counts.  */
1041   if (shift_mask >= BITS_PER_WORD
1042       && outof_target != 0
1043       && !CONSTANT_P (op1))
1044     {
1045       if (!expand_doubleword_shift (op1_mode, binoptab,
1046                                     outof_input, into_input, op1,
1047                                     0, into_target,
1048                                     unsignedp, methods, shift_mask))
1049         return false;
1050       if (!force_expand_binop (word_mode, binoptab, outof_input, op1,
1051                                outof_target, unsignedp, methods))
1052         return false;
1053       return true;
1054     }
1055
1056   /* Set CMP_CODE, CMP1 and CMP2 so that the rtx (CMP_CODE CMP1 CMP2)
1057      is true when the effective shift value is less than BITS_PER_WORD.
1058      Set SUPERWORD_OP1 to the shift count that should be used to shift
1059      OUTOF_INPUT into INTO_TARGET when the condition is false.  */
1060   tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD, op1_mode), op1_mode);
1061   if (!CONSTANT_P (op1) && shift_mask == BITS_PER_WORD - 1)
1062     {
1063       /* Set CMP1 to OP1 & BITS_PER_WORD.  The result is zero iff OP1
1064          is a subword shift count.  */
1065       cmp1 = simplify_expand_binop (op1_mode, and_optab, op1, tmp,
1066                                     0, true, methods);
1067       cmp2 = CONST0_RTX (op1_mode);
1068       cmp_code = EQ;
1069       superword_op1 = op1;
1070     }
1071   else
1072     {
1073       /* Set CMP1 to OP1 - BITS_PER_WORD.  */
1074       cmp1 = simplify_expand_binop (op1_mode, sub_optab, op1, tmp,
1075                                     0, true, methods);
1076       cmp2 = CONST0_RTX (op1_mode);
1077       cmp_code = LT;
1078       superword_op1 = cmp1;
1079     }
1080   if (cmp1 == 0)
1081     return false;
1082
1083   /* If we can compute the condition at compile time, pick the
1084      appropriate subroutine.  */
1085   tmp = simplify_relational_operation (cmp_code, SImode, op1_mode, cmp1, cmp2);
1086   if (tmp != 0 && CONST_INT_P (tmp))
1087     {
1088       if (tmp == const0_rtx)
1089         return expand_superword_shift (binoptab, outof_input, superword_op1,
1090                                        outof_target, into_target,
1091                                        unsignedp, methods);
1092       else
1093         return expand_subword_shift (op1_mode, binoptab,
1094                                      outof_input, into_input, op1,
1095                                      outof_target, into_target,
1096                                      unsignedp, methods, shift_mask);
1097     }
1098
1099 #ifdef HAVE_conditional_move
1100   /* Try using conditional moves to generate straight-line code.  */
1101   {
1102     rtx_insn *start = get_last_insn ();
1103     if (expand_doubleword_shift_condmove (op1_mode, binoptab,
1104                                           cmp_code, cmp1, cmp2,
1105                                           outof_input, into_input,
1106                                           op1, superword_op1,
1107                                           outof_target, into_target,
1108                                           unsignedp, methods, shift_mask))
1109       return true;
1110     delete_insns_since (start);
1111   }
1112 #endif
1113
1114   /* As a last resort, use branches to select the correct alternative.  */
1115   rtx_code_label *subword_label = gen_label_rtx ();
1116   rtx_code_label *done_label = gen_label_rtx ();
1117
1118   NO_DEFER_POP;
1119   do_compare_rtx_and_jump (cmp1, cmp2, cmp_code, false, op1_mode,
1120                            0, 0, subword_label, -1);
1121   OK_DEFER_POP;
1122
1123   if (!expand_superword_shift (binoptab, outof_input, superword_op1,
1124                                outof_target, into_target,
1125                                unsignedp, methods))
1126     return false;
1127
1128   emit_jump_insn (gen_jump (done_label));
1129   emit_barrier ();
1130   emit_label (subword_label);
1131
1132   if (!expand_subword_shift (op1_mode, binoptab,
1133                              outof_input, into_input, op1,
1134                              outof_target, into_target,
1135                              unsignedp, methods, shift_mask))
1136     return false;
1137
1138   emit_label (done_label);
1139   return true;
1140 }
1141 \f
1142 /* Subroutine of expand_binop.  Perform a double word multiplication of
1143    operands OP0 and OP1 both of mode MODE, which is exactly twice as wide
1144    as the target's word_mode.  This function return NULL_RTX if anything
1145    goes wrong, in which case it may have already emitted instructions
1146    which need to be deleted.
1147
1148    If we want to multiply two two-word values and have normal and widening
1149    multiplies of single-word values, we can do this with three smaller
1150    multiplications.
1151
1152    The multiplication proceeds as follows:
1153                                  _______________________
1154                                 [__op0_high_|__op0_low__]
1155                                  _______________________
1156         *                       [__op1_high_|__op1_low__]
1157         _______________________________________________
1158                                  _______________________
1159     (1)                         [__op0_low__*__op1_low__]
1160                      _______________________
1161     (2a)            [__op0_low__*__op1_high_]
1162                      _______________________
1163     (2b)            [__op0_high_*__op1_low__]
1164          _______________________
1165     (3) [__op0_high_*__op1_high_]
1166
1167
1168   This gives a 4-word result.  Since we are only interested in the
1169   lower 2 words, partial result (3) and the upper words of (2a) and
1170   (2b) don't need to be calculated.  Hence (2a) and (2b) can be
1171   calculated using non-widening multiplication.
1172
1173   (1), however, needs to be calculated with an unsigned widening
1174   multiplication.  If this operation is not directly supported we
1175   try using a signed widening multiplication and adjust the result.
1176   This adjustment works as follows:
1177
1178       If both operands are positive then no adjustment is needed.
1179
1180       If the operands have different signs, for example op0_low < 0 and
1181       op1_low >= 0, the instruction treats the most significant bit of
1182       op0_low as a sign bit instead of a bit with significance
1183       2**(BITS_PER_WORD-1), i.e. the instruction multiplies op1_low
1184       with 2**BITS_PER_WORD - op0_low, and two's complements the
1185       result.  Conclusion: We need to add op1_low * 2**BITS_PER_WORD to
1186       the result.
1187
1188       Similarly, if both operands are negative, we need to add
1189       (op0_low + op1_low) * 2**BITS_PER_WORD.
1190
1191       We use a trick to adjust quickly.  We logically shift op0_low right
1192       (op1_low) BITS_PER_WORD-1 steps to get 0 or 1, and add this to
1193       op0_high (op1_high) before it is used to calculate 2b (2a).  If no
1194       logical shift exists, we do an arithmetic right shift and subtract
1195       the 0 or -1.  */
1196
1197 static rtx
1198 expand_doubleword_mult (machine_mode mode, rtx op0, rtx op1, rtx target,
1199                        bool umulp, enum optab_methods methods)
1200 {
1201   int low = (WORDS_BIG_ENDIAN ? 1 : 0);
1202   int high = (WORDS_BIG_ENDIAN ? 0 : 1);
1203   rtx wordm1 = umulp ? NULL_RTX : GEN_INT (BITS_PER_WORD - 1);
1204   rtx product, adjust, product_high, temp;
1205
1206   rtx op0_high = operand_subword_force (op0, high, mode);
1207   rtx op0_low = operand_subword_force (op0, low, mode);
1208   rtx op1_high = operand_subword_force (op1, high, mode);
1209   rtx op1_low = operand_subword_force (op1, low, mode);
1210
1211   /* If we're using an unsigned multiply to directly compute the product
1212      of the low-order words of the operands and perform any required
1213      adjustments of the operands, we begin by trying two more multiplications
1214      and then computing the appropriate sum.
1215
1216      We have checked above that the required addition is provided.
1217      Full-word addition will normally always succeed, especially if
1218      it is provided at all, so we don't worry about its failure.  The
1219      multiplication may well fail, however, so we do handle that.  */
1220
1221   if (!umulp)
1222     {
1223       /* ??? This could be done with emit_store_flag where available.  */
1224       temp = expand_binop (word_mode, lshr_optab, op0_low, wordm1,
1225                            NULL_RTX, 1, methods);
1226       if (temp)
1227         op0_high = expand_binop (word_mode, add_optab, op0_high, temp,
1228                                  NULL_RTX, 0, OPTAB_DIRECT);
1229       else
1230         {
1231           temp = expand_binop (word_mode, ashr_optab, op0_low, wordm1,
1232                                NULL_RTX, 0, methods);
1233           if (!temp)
1234             return NULL_RTX;
1235           op0_high = expand_binop (word_mode, sub_optab, op0_high, temp,
1236                                    NULL_RTX, 0, OPTAB_DIRECT);
1237         }
1238
1239       if (!op0_high)
1240         return NULL_RTX;
1241     }
1242
1243   adjust = expand_binop (word_mode, smul_optab, op0_high, op1_low,
1244                          NULL_RTX, 0, OPTAB_DIRECT);
1245   if (!adjust)
1246     return NULL_RTX;
1247
1248   /* OP0_HIGH should now be dead.  */
1249
1250   if (!umulp)
1251     {
1252       /* ??? This could be done with emit_store_flag where available.  */
1253       temp = expand_binop (word_mode, lshr_optab, op1_low, wordm1,
1254                            NULL_RTX, 1, methods);
1255       if (temp)
1256         op1_high = expand_binop (word_mode, add_optab, op1_high, temp,
1257                                  NULL_RTX, 0, OPTAB_DIRECT);
1258       else
1259         {
1260           temp = expand_binop (word_mode, ashr_optab, op1_low, wordm1,
1261                                NULL_RTX, 0, methods);
1262           if (!temp)
1263             return NULL_RTX;
1264           op1_high = expand_binop (word_mode, sub_optab, op1_high, temp,
1265                                    NULL_RTX, 0, OPTAB_DIRECT);
1266         }
1267
1268       if (!op1_high)
1269         return NULL_RTX;
1270     }
1271
1272   temp = expand_binop (word_mode, smul_optab, op1_high, op0_low,
1273                        NULL_RTX, 0, OPTAB_DIRECT);
1274   if (!temp)
1275     return NULL_RTX;
1276
1277   /* OP1_HIGH should now be dead.  */
1278
1279   adjust = expand_binop (word_mode, add_optab, adjust, temp,
1280                          NULL_RTX, 0, OPTAB_DIRECT);
1281
1282   if (target && !REG_P (target))
1283     target = NULL_RTX;
1284
1285   if (umulp)
1286     product = expand_binop (mode, umul_widen_optab, op0_low, op1_low,
1287                             target, 1, OPTAB_DIRECT);
1288   else
1289     product = expand_binop (mode, smul_widen_optab, op0_low, op1_low,
1290                             target, 1, OPTAB_DIRECT);
1291
1292   if (!product)
1293     return NULL_RTX;
1294
1295   product_high = operand_subword (product, high, 1, mode);
1296   adjust = expand_binop (word_mode, add_optab, product_high, adjust,
1297                          NULL_RTX, 0, OPTAB_DIRECT);
1298   emit_move_insn (product_high, adjust);
1299   return product;
1300 }
1301 \f
1302 /* Wrapper around expand_binop which takes an rtx code to specify
1303    the operation to perform, not an optab pointer.  All other
1304    arguments are the same.  */
1305 rtx
1306 expand_simple_binop (machine_mode mode, enum rtx_code code, rtx op0,
1307                      rtx op1, rtx target, int unsignedp,
1308                      enum optab_methods methods)
1309 {
1310   optab binop = code_to_optab (code);
1311   gcc_assert (binop);
1312
1313   return expand_binop (mode, binop, op0, op1, target, unsignedp, methods);
1314 }
1315
1316 /* Return whether OP0 and OP1 should be swapped when expanding a commutative
1317    binop.  Order them according to commutative_operand_precedence and, if
1318    possible, try to put TARGET or a pseudo first.  */
1319 static bool
1320 swap_commutative_operands_with_target (rtx target, rtx op0, rtx op1)
1321 {
1322   int op0_prec = commutative_operand_precedence (op0);
1323   int op1_prec = commutative_operand_precedence (op1);
1324
1325   if (op0_prec < op1_prec)
1326     return true;
1327
1328   if (op0_prec > op1_prec)
1329     return false;
1330
1331   /* With equal precedence, both orders are ok, but it is better if the
1332      first operand is TARGET, or if both TARGET and OP0 are pseudos.  */
1333   if (target == 0 || REG_P (target))
1334     return (REG_P (op1) && !REG_P (op0)) || target == op1;
1335   else
1336     return rtx_equal_p (op1, target);
1337 }
1338
1339 /* Return true if BINOPTAB implements a shift operation.  */
1340
1341 static bool
1342 shift_optab_p (optab binoptab)
1343 {
1344   switch (optab_to_code (binoptab))
1345     {
1346     case ASHIFT:
1347     case SS_ASHIFT:
1348     case US_ASHIFT:
1349     case ASHIFTRT:
1350     case LSHIFTRT:
1351     case ROTATE:
1352     case ROTATERT:
1353       return true;
1354
1355     default:
1356       return false;
1357     }
1358 }
1359
1360 /* Return true if BINOPTAB implements a commutative binary operation.  */
1361
1362 static bool
1363 commutative_optab_p (optab binoptab)
1364 {
1365   return (GET_RTX_CLASS (optab_to_code (binoptab)) == RTX_COMM_ARITH
1366           || binoptab == smul_widen_optab
1367           || binoptab == umul_widen_optab
1368           || binoptab == smul_highpart_optab
1369           || binoptab == umul_highpart_optab);
1370 }
1371
1372 /* X is to be used in mode MODE as operand OPN to BINOPTAB.  If we're
1373    optimizing, and if the operand is a constant that costs more than
1374    1 instruction, force the constant into a register and return that
1375    register.  Return X otherwise.  UNSIGNEDP says whether X is unsigned.  */
1376
1377 static rtx
1378 avoid_expensive_constant (machine_mode mode, optab binoptab,
1379                           int opn, rtx x, bool unsignedp)
1380 {
1381   bool speed = optimize_insn_for_speed_p ();
1382
1383   if (mode != VOIDmode
1384       && optimize
1385       && CONSTANT_P (x)
1386       && (rtx_cost (x, optab_to_code (binoptab), opn, speed)
1387           > set_src_cost (x, speed)))
1388     {
1389       if (CONST_INT_P (x))
1390         {
1391           HOST_WIDE_INT intval = trunc_int_for_mode (INTVAL (x), mode);
1392           if (intval != INTVAL (x))
1393             x = GEN_INT (intval);
1394         }
1395       else
1396         x = convert_modes (mode, VOIDmode, x, unsignedp);
1397       x = force_reg (mode, x);
1398     }
1399   return x;
1400 }
1401
1402 /* Helper function for expand_binop: handle the case where there
1403    is an insn that directly implements the indicated operation.
1404    Returns null if this is not possible.  */
1405 static rtx
1406 expand_binop_directly (machine_mode mode, optab binoptab,
1407                        rtx op0, rtx op1,
1408                        rtx target, int unsignedp, enum optab_methods methods,
1409                        rtx_insn *last)
1410 {
1411   machine_mode from_mode = widened_mode (mode, op0, op1);
1412   enum insn_code icode = find_widening_optab_handler (binoptab, mode,
1413                                                       from_mode, 1);
1414   machine_mode xmode0 = insn_data[(int) icode].operand[1].mode;
1415   machine_mode xmode1 = insn_data[(int) icode].operand[2].mode;
1416   machine_mode mode0, mode1, tmp_mode;
1417   struct expand_operand ops[3];
1418   bool commutative_p;
1419   rtx_insn *pat;
1420   rtx xop0 = op0, xop1 = op1;
1421
1422   /* If it is a commutative operator and the modes would match
1423      if we would swap the operands, we can save the conversions.  */
1424   commutative_p = commutative_optab_p (binoptab);
1425   if (commutative_p
1426       && GET_MODE (xop0) != xmode0 && GET_MODE (xop1) != xmode1
1427       && GET_MODE (xop0) == xmode1 && GET_MODE (xop1) == xmode1)
1428     std::swap (xop0, xop1);
1429
1430   /* If we are optimizing, force expensive constants into a register.  */
1431   xop0 = avoid_expensive_constant (xmode0, binoptab, 0, xop0, unsignedp);
1432   if (!shift_optab_p (binoptab))
1433     xop1 = avoid_expensive_constant (xmode1, binoptab, 1, xop1, unsignedp);
1434
1435   /* In case the insn wants input operands in modes different from
1436      those of the actual operands, convert the operands.  It would
1437      seem that we don't need to convert CONST_INTs, but we do, so
1438      that they're properly zero-extended, sign-extended or truncated
1439      for their mode.  */
1440
1441   mode0 = GET_MODE (xop0) != VOIDmode ? GET_MODE (xop0) : mode;
1442   if (xmode0 != VOIDmode && xmode0 != mode0)
1443     {
1444       xop0 = convert_modes (xmode0, mode0, xop0, unsignedp);
1445       mode0 = xmode0;
1446     }
1447
1448   mode1 = GET_MODE (xop1) != VOIDmode ? GET_MODE (xop1) : mode;
1449   if (xmode1 != VOIDmode && xmode1 != mode1)
1450     {
1451       xop1 = convert_modes (xmode1, mode1, xop1, unsignedp);
1452       mode1 = xmode1;
1453     }
1454
1455   /* If operation is commutative,
1456      try to make the first operand a register.
1457      Even better, try to make it the same as the target.
1458      Also try to make the last operand a constant.  */
1459   if (commutative_p
1460       && swap_commutative_operands_with_target (target, xop0, xop1))
1461     std::swap (xop0, xop1);
1462
1463   /* Now, if insn's predicates don't allow our operands, put them into
1464      pseudo regs.  */
1465
1466   if (binoptab == vec_pack_trunc_optab
1467       || binoptab == vec_pack_usat_optab
1468       || binoptab == vec_pack_ssat_optab
1469       || binoptab == vec_pack_ufix_trunc_optab
1470       || binoptab == vec_pack_sfix_trunc_optab)
1471     {
1472       /* The mode of the result is different then the mode of the
1473          arguments.  */
1474       tmp_mode = insn_data[(int) icode].operand[0].mode;
1475       if (GET_MODE_NUNITS (tmp_mode) != 2 * GET_MODE_NUNITS (mode))
1476         {
1477           delete_insns_since (last);
1478           return NULL_RTX;
1479         }
1480     }
1481   else
1482     tmp_mode = mode;
1483
1484   create_output_operand (&ops[0], target, tmp_mode);
1485   create_input_operand (&ops[1], xop0, mode0);
1486   create_input_operand (&ops[2], xop1, mode1);
1487   pat = maybe_gen_insn (icode, 3, ops);
1488   if (pat)
1489     {
1490       /* If PAT is composed of more than one insn, try to add an appropriate
1491          REG_EQUAL note to it.  If we can't because TEMP conflicts with an
1492          operand, call expand_binop again, this time without a target.  */
1493       if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
1494           && ! add_equal_note (pat, ops[0].value,
1495                                optab_to_code (binoptab),
1496                                ops[1].value, ops[2].value))
1497         {
1498           delete_insns_since (last);
1499           return expand_binop (mode, binoptab, op0, op1, NULL_RTX,
1500                                unsignedp, methods);
1501         }
1502
1503       emit_insn (pat);
1504       return ops[0].value;
1505     }
1506   delete_insns_since (last);
1507   return NULL_RTX;
1508 }
1509
1510 /* Generate code to perform an operation specified by BINOPTAB
1511    on operands OP0 and OP1, with result having machine-mode MODE.
1512
1513    UNSIGNEDP is for the case where we have to widen the operands
1514    to perform the operation.  It says to use zero-extension.
1515
1516    If TARGET is nonzero, the value
1517    is generated there, if it is convenient to do so.
1518    In all cases an rtx is returned for the locus of the value;
1519    this may or may not be TARGET.  */
1520
1521 rtx
1522 expand_binop (machine_mode mode, optab binoptab, rtx op0, rtx op1,
1523               rtx target, int unsignedp, enum optab_methods methods)
1524 {
1525   enum optab_methods next_methods
1526     = (methods == OPTAB_LIB || methods == OPTAB_LIB_WIDEN
1527        ? OPTAB_WIDEN : methods);
1528   enum mode_class mclass;
1529   machine_mode wider_mode;
1530   rtx libfunc;
1531   rtx temp;
1532   rtx_insn *entry_last = get_last_insn ();
1533   rtx_insn *last;
1534
1535   mclass = GET_MODE_CLASS (mode);
1536
1537   /* If subtracting an integer constant, convert this into an addition of
1538      the negated constant.  */
1539
1540   if (binoptab == sub_optab && CONST_INT_P (op1))
1541     {
1542       op1 = negate_rtx (mode, op1);
1543       binoptab = add_optab;
1544     }
1545
1546   /* Record where to delete back to if we backtrack.  */
1547   last = get_last_insn ();
1548
1549   /* If we can do it with a three-operand insn, do so.  */
1550
1551   if (methods != OPTAB_MUST_WIDEN
1552       && find_widening_optab_handler (binoptab, mode,
1553                                       widened_mode (mode, op0, op1), 1)
1554             != CODE_FOR_nothing)
1555     {
1556       temp = expand_binop_directly (mode, binoptab, op0, op1, target,
1557                                     unsignedp, methods, last);
1558       if (temp)
1559         return temp;
1560     }
1561
1562   /* If we were trying to rotate, and that didn't work, try rotating
1563      the other direction before falling back to shifts and bitwise-or.  */
1564   if (((binoptab == rotl_optab
1565         && optab_handler (rotr_optab, mode) != CODE_FOR_nothing)
1566        || (binoptab == rotr_optab
1567            && optab_handler (rotl_optab, mode) != CODE_FOR_nothing))
1568       && mclass == MODE_INT)
1569     {
1570       optab otheroptab = (binoptab == rotl_optab ? rotr_optab : rotl_optab);
1571       rtx newop1;
1572       unsigned int bits = GET_MODE_PRECISION (mode);
1573
1574       if (CONST_INT_P (op1))
1575         newop1 = GEN_INT (bits - INTVAL (op1));
1576       else if (targetm.shift_truncation_mask (mode) == bits - 1)
1577         newop1 = negate_rtx (GET_MODE (op1), op1);
1578       else
1579         newop1 = expand_binop (GET_MODE (op1), sub_optab,
1580                                gen_int_mode (bits, GET_MODE (op1)), op1,
1581                                NULL_RTX, unsignedp, OPTAB_DIRECT);
1582
1583       temp = expand_binop_directly (mode, otheroptab, op0, newop1,
1584                                     target, unsignedp, methods, last);
1585       if (temp)
1586         return temp;
1587     }
1588
1589   /* If this is a multiply, see if we can do a widening operation that
1590      takes operands of this mode and makes a wider mode.  */
1591
1592   if (binoptab == smul_optab
1593       && GET_MODE_2XWIDER_MODE (mode) != VOIDmode
1594       && (widening_optab_handler ((unsignedp ? umul_widen_optab
1595                                              : smul_widen_optab),
1596                                   GET_MODE_2XWIDER_MODE (mode), mode)
1597           != CODE_FOR_nothing))
1598     {
1599       temp = expand_binop (GET_MODE_2XWIDER_MODE (mode),
1600                            unsignedp ? umul_widen_optab : smul_widen_optab,
1601                            op0, op1, NULL_RTX, unsignedp, OPTAB_DIRECT);
1602
1603       if (temp != 0)
1604         {
1605           if (GET_MODE_CLASS (mode) == MODE_INT
1606               && TRULY_NOOP_TRUNCATION_MODES_P (mode, GET_MODE (temp)))
1607             return gen_lowpart (mode, temp);
1608           else
1609             return convert_to_mode (mode, temp, unsignedp);
1610         }
1611     }
1612
1613   /* If this is a vector shift by a scalar, see if we can do a vector
1614      shift by a vector.  If so, broadcast the scalar into a vector.  */
1615   if (mclass == MODE_VECTOR_INT)
1616     {
1617       optab otheroptab = unknown_optab;
1618
1619       if (binoptab == ashl_optab)
1620         otheroptab = vashl_optab;
1621       else if (binoptab == ashr_optab)
1622         otheroptab = vashr_optab;
1623       else if (binoptab == lshr_optab)
1624         otheroptab = vlshr_optab;
1625       else if (binoptab == rotl_optab)
1626         otheroptab = vrotl_optab;
1627       else if (binoptab == rotr_optab)
1628         otheroptab = vrotr_optab;
1629
1630       if (otheroptab && optab_handler (otheroptab, mode) != CODE_FOR_nothing)
1631         {
1632           rtx vop1 = expand_vector_broadcast (mode, op1);
1633           if (vop1)
1634             {
1635               temp = expand_binop_directly (mode, otheroptab, op0, vop1,
1636                                             target, unsignedp, methods, last);
1637               if (temp)
1638                 return temp;
1639             }
1640         }
1641     }
1642
1643   /* Look for a wider mode of the same class for which we think we
1644      can open-code the operation.  Check for a widening multiply at the
1645      wider mode as well.  */
1646
1647   if (CLASS_HAS_WIDER_MODES_P (mclass)
1648       && methods != OPTAB_DIRECT && methods != OPTAB_LIB)
1649     for (wider_mode = GET_MODE_WIDER_MODE (mode);
1650          wider_mode != VOIDmode;
1651          wider_mode = GET_MODE_WIDER_MODE (wider_mode))
1652       {
1653         if (optab_handler (binoptab, wider_mode) != CODE_FOR_nothing
1654             || (binoptab == smul_optab
1655                 && GET_MODE_WIDER_MODE (wider_mode) != VOIDmode
1656                 && (find_widening_optab_handler ((unsignedp
1657                                                   ? umul_widen_optab
1658                                                   : smul_widen_optab),
1659                                                  GET_MODE_WIDER_MODE (wider_mode),
1660                                                  mode, 0)
1661                     != CODE_FOR_nothing)))
1662           {
1663             rtx xop0 = op0, xop1 = op1;
1664             int no_extend = 0;
1665
1666             /* For certain integer operations, we need not actually extend
1667                the narrow operands, as long as we will truncate
1668                the results to the same narrowness.  */
1669
1670             if ((binoptab == ior_optab || binoptab == and_optab
1671                  || binoptab == xor_optab
1672                  || binoptab == add_optab || binoptab == sub_optab
1673                  || binoptab == smul_optab || binoptab == ashl_optab)
1674                 && mclass == MODE_INT)
1675               {
1676                 no_extend = 1;
1677                 xop0 = avoid_expensive_constant (mode, binoptab, 0,
1678                                                  xop0, unsignedp);
1679                 if (binoptab != ashl_optab)
1680                   xop1 = avoid_expensive_constant (mode, binoptab, 1,
1681                                                    xop1, unsignedp);
1682               }
1683
1684             xop0 = widen_operand (xop0, wider_mode, mode, unsignedp, no_extend);
1685
1686             /* The second operand of a shift must always be extended.  */
1687             xop1 = widen_operand (xop1, wider_mode, mode, unsignedp,
1688                                   no_extend && binoptab != ashl_optab);
1689
1690             temp = expand_binop (wider_mode, binoptab, xop0, xop1, NULL_RTX,
1691                                  unsignedp, OPTAB_DIRECT);
1692             if (temp)
1693               {
1694                 if (mclass != MODE_INT
1695                     || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
1696                   {
1697                     if (target == 0)
1698                       target = gen_reg_rtx (mode);
1699                     convert_move (target, temp, 0);
1700                     return target;
1701                   }
1702                 else
1703                   return gen_lowpart (mode, temp);
1704               }
1705             else
1706               delete_insns_since (last);
1707           }
1708       }
1709
1710   /* If operation is commutative,
1711      try to make the first operand a register.
1712      Even better, try to make it the same as the target.
1713      Also try to make the last operand a constant.  */
1714   if (commutative_optab_p (binoptab)
1715       && swap_commutative_operands_with_target (target, op0, op1))
1716     std::swap (op0, op1);
1717
1718   /* These can be done a word at a time.  */
1719   if ((binoptab == and_optab || binoptab == ior_optab || binoptab == xor_optab)
1720       && mclass == MODE_INT
1721       && GET_MODE_SIZE (mode) > UNITS_PER_WORD
1722       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing)
1723     {
1724       int i;
1725       rtx_insn *insns;
1726
1727       /* If TARGET is the same as one of the operands, the REG_EQUAL note
1728          won't be accurate, so use a new target.  */
1729       if (target == 0
1730           || target == op0
1731           || target == op1
1732           || !valid_multiword_target_p (target))
1733         target = gen_reg_rtx (mode);
1734
1735       start_sequence ();
1736
1737       /* Do the actual arithmetic.  */
1738       for (i = 0; i < GET_MODE_BITSIZE (mode) / BITS_PER_WORD; i++)
1739         {
1740           rtx target_piece = operand_subword (target, i, 1, mode);
1741           rtx x = expand_binop (word_mode, binoptab,
1742                                 operand_subword_force (op0, i, mode),
1743                                 operand_subword_force (op1, i, mode),
1744                                 target_piece, unsignedp, next_methods);
1745
1746           if (x == 0)
1747             break;
1748
1749           if (target_piece != x)
1750             emit_move_insn (target_piece, x);
1751         }
1752
1753       insns = get_insns ();
1754       end_sequence ();
1755
1756       if (i == GET_MODE_BITSIZE (mode) / BITS_PER_WORD)
1757         {
1758           emit_insn (insns);
1759           return target;
1760         }
1761     }
1762
1763   /* Synthesize double word shifts from single word shifts.  */
1764   if ((binoptab == lshr_optab || binoptab == ashl_optab
1765        || binoptab == ashr_optab)
1766       && mclass == MODE_INT
1767       && (CONST_INT_P (op1) || optimize_insn_for_speed_p ())
1768       && GET_MODE_SIZE (mode) == 2 * UNITS_PER_WORD
1769       && GET_MODE_PRECISION (mode) == GET_MODE_BITSIZE (mode)
1770       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing
1771       && optab_handler (ashl_optab, word_mode) != CODE_FOR_nothing
1772       && optab_handler (lshr_optab, word_mode) != CODE_FOR_nothing)
1773     {
1774       unsigned HOST_WIDE_INT shift_mask, double_shift_mask;
1775       machine_mode op1_mode;
1776
1777       double_shift_mask = targetm.shift_truncation_mask (mode);
1778       shift_mask = targetm.shift_truncation_mask (word_mode);
1779       op1_mode = GET_MODE (op1) != VOIDmode ? GET_MODE (op1) : word_mode;
1780
1781       /* Apply the truncation to constant shifts.  */
1782       if (double_shift_mask > 0 && CONST_INT_P (op1))
1783         op1 = GEN_INT (INTVAL (op1) & double_shift_mask);
1784
1785       if (op1 == CONST0_RTX (op1_mode))
1786         return op0;
1787
1788       /* Make sure that this is a combination that expand_doubleword_shift
1789          can handle.  See the comments there for details.  */
1790       if (double_shift_mask == 0
1791           || (shift_mask == BITS_PER_WORD - 1
1792               && double_shift_mask == BITS_PER_WORD * 2 - 1))
1793         {
1794           rtx_insn *insns;
1795           rtx into_target, outof_target;
1796           rtx into_input, outof_input;
1797           int left_shift, outof_word;
1798
1799           /* If TARGET is the same as one of the operands, the REG_EQUAL note
1800              won't be accurate, so use a new target.  */
1801           if (target == 0
1802               || target == op0
1803               || target == op1
1804               || !valid_multiword_target_p (target))
1805             target = gen_reg_rtx (mode);
1806
1807           start_sequence ();
1808
1809           /* OUTOF_* is the word we are shifting bits away from, and
1810              INTO_* is the word that we are shifting bits towards, thus
1811              they differ depending on the direction of the shift and
1812              WORDS_BIG_ENDIAN.  */
1813
1814           left_shift = binoptab == ashl_optab;
1815           outof_word = left_shift ^ ! WORDS_BIG_ENDIAN;
1816
1817           outof_target = operand_subword (target, outof_word, 1, mode);
1818           into_target = operand_subword (target, 1 - outof_word, 1, mode);
1819
1820           outof_input = operand_subword_force (op0, outof_word, mode);
1821           into_input = operand_subword_force (op0, 1 - outof_word, mode);
1822
1823           if (expand_doubleword_shift (op1_mode, binoptab,
1824                                        outof_input, into_input, op1,
1825                                        outof_target, into_target,
1826                                        unsignedp, next_methods, shift_mask))
1827             {
1828               insns = get_insns ();
1829               end_sequence ();
1830
1831               emit_insn (insns);
1832               return target;
1833             }
1834           end_sequence ();
1835         }
1836     }
1837
1838   /* Synthesize double word rotates from single word shifts.  */
1839   if ((binoptab == rotl_optab || binoptab == rotr_optab)
1840       && mclass == MODE_INT
1841       && CONST_INT_P (op1)
1842       && GET_MODE_PRECISION (mode) == 2 * BITS_PER_WORD
1843       && optab_handler (ashl_optab, word_mode) != CODE_FOR_nothing
1844       && optab_handler (lshr_optab, word_mode) != CODE_FOR_nothing)
1845     {
1846       rtx_insn *insns;
1847       rtx into_target, outof_target;
1848       rtx into_input, outof_input;
1849       rtx inter;
1850       int shift_count, left_shift, outof_word;
1851
1852       /* If TARGET is the same as one of the operands, the REG_EQUAL note
1853          won't be accurate, so use a new target. Do this also if target is not
1854          a REG, first because having a register instead may open optimization
1855          opportunities, and second because if target and op0 happen to be MEMs
1856          designating the same location, we would risk clobbering it too early
1857          in the code sequence we generate below.  */
1858       if (target == 0
1859           || target == op0
1860           || target == op1
1861           || !REG_P (target)
1862           || !valid_multiword_target_p (target))
1863         target = gen_reg_rtx (mode);
1864
1865       start_sequence ();
1866
1867       shift_count = INTVAL (op1);
1868
1869       /* OUTOF_* is the word we are shifting bits away from, and
1870          INTO_* is the word that we are shifting bits towards, thus
1871          they differ depending on the direction of the shift and
1872          WORDS_BIG_ENDIAN.  */
1873
1874       left_shift = (binoptab == rotl_optab);
1875       outof_word = left_shift ^ ! WORDS_BIG_ENDIAN;
1876
1877       outof_target = operand_subword (target, outof_word, 1, mode);
1878       into_target = operand_subword (target, 1 - outof_word, 1, mode);
1879
1880       outof_input = operand_subword_force (op0, outof_word, mode);
1881       into_input = operand_subword_force (op0, 1 - outof_word, mode);
1882
1883       if (shift_count == BITS_PER_WORD)
1884         {
1885           /* This is just a word swap.  */
1886           emit_move_insn (outof_target, into_input);
1887           emit_move_insn (into_target, outof_input);
1888           inter = const0_rtx;
1889         }
1890       else
1891         {
1892           rtx into_temp1, into_temp2, outof_temp1, outof_temp2;
1893           rtx first_shift_count, second_shift_count;
1894           optab reverse_unsigned_shift, unsigned_shift;
1895
1896           reverse_unsigned_shift = (left_shift ^ (shift_count < BITS_PER_WORD)
1897                                     ? lshr_optab : ashl_optab);
1898
1899           unsigned_shift = (left_shift ^ (shift_count < BITS_PER_WORD)
1900                             ? ashl_optab : lshr_optab);
1901
1902           if (shift_count > BITS_PER_WORD)
1903             {
1904               first_shift_count = GEN_INT (shift_count - BITS_PER_WORD);
1905               second_shift_count = GEN_INT (2 * BITS_PER_WORD - shift_count);
1906             }
1907           else
1908             {
1909               first_shift_count = GEN_INT (BITS_PER_WORD - shift_count);
1910               second_shift_count = GEN_INT (shift_count);
1911             }
1912
1913           into_temp1 = expand_binop (word_mode, unsigned_shift,
1914                                      outof_input, first_shift_count,
1915                                      NULL_RTX, unsignedp, next_methods);
1916           into_temp2 = expand_binop (word_mode, reverse_unsigned_shift,
1917                                      into_input, second_shift_count,
1918                                      NULL_RTX, unsignedp, next_methods);
1919
1920           if (into_temp1 != 0 && into_temp2 != 0)
1921             inter = expand_binop (word_mode, ior_optab, into_temp1, into_temp2,
1922                                   into_target, unsignedp, next_methods);
1923           else
1924             inter = 0;
1925
1926           if (inter != 0 && inter != into_target)
1927             emit_move_insn (into_target, inter);
1928
1929           outof_temp1 = expand_binop (word_mode, unsigned_shift,
1930                                       into_input, first_shift_count,
1931                                       NULL_RTX, unsignedp, next_methods);
1932           outof_temp2 = expand_binop (word_mode, reverse_unsigned_shift,
1933                                       outof_input, second_shift_count,
1934                                       NULL_RTX, unsignedp, next_methods);
1935
1936           if (inter != 0 && outof_temp1 != 0 && outof_temp2 != 0)
1937             inter = expand_binop (word_mode, ior_optab,
1938                                   outof_temp1, outof_temp2,
1939                                   outof_target, unsignedp, next_methods);
1940
1941           if (inter != 0 && inter != outof_target)
1942             emit_move_insn (outof_target, inter);
1943         }
1944
1945       insns = get_insns ();
1946       end_sequence ();
1947
1948       if (inter != 0)
1949         {
1950           emit_insn (insns);
1951           return target;
1952         }
1953     }
1954
1955   /* These can be done a word at a time by propagating carries.  */
1956   if ((binoptab == add_optab || binoptab == sub_optab)
1957       && mclass == MODE_INT
1958       && GET_MODE_SIZE (mode) >= 2 * UNITS_PER_WORD
1959       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing)
1960     {
1961       unsigned int i;
1962       optab otheroptab = binoptab == add_optab ? sub_optab : add_optab;
1963       const unsigned int nwords = GET_MODE_BITSIZE (mode) / BITS_PER_WORD;
1964       rtx carry_in = NULL_RTX, carry_out = NULL_RTX;
1965       rtx xop0, xop1, xtarget;
1966
1967       /* We can handle either a 1 or -1 value for the carry.  If STORE_FLAG
1968          value is one of those, use it.  Otherwise, use 1 since it is the
1969          one easiest to get.  */
1970 #if STORE_FLAG_VALUE == 1 || STORE_FLAG_VALUE == -1
1971       int normalizep = STORE_FLAG_VALUE;
1972 #else
1973       int normalizep = 1;
1974 #endif
1975
1976       /* Prepare the operands.  */
1977       xop0 = force_reg (mode, op0);
1978       xop1 = force_reg (mode, op1);
1979
1980       xtarget = gen_reg_rtx (mode);
1981
1982       if (target == 0 || !REG_P (target) || !valid_multiword_target_p (target))
1983         target = xtarget;
1984
1985       /* Indicate for flow that the entire target reg is being set.  */
1986       if (REG_P (target))
1987         emit_clobber (xtarget);
1988
1989       /* Do the actual arithmetic.  */
1990       for (i = 0; i < nwords; i++)
1991         {
1992           int index = (WORDS_BIG_ENDIAN ? nwords - i - 1 : i);
1993           rtx target_piece = operand_subword (xtarget, index, 1, mode);
1994           rtx op0_piece = operand_subword_force (xop0, index, mode);
1995           rtx op1_piece = operand_subword_force (xop1, index, mode);
1996           rtx x;
1997
1998           /* Main add/subtract of the input operands.  */
1999           x = expand_binop (word_mode, binoptab,
2000                             op0_piece, op1_piece,
2001                             target_piece, unsignedp, next_methods);
2002           if (x == 0)
2003             break;
2004
2005           if (i + 1 < nwords)
2006             {
2007               /* Store carry from main add/subtract.  */
2008               carry_out = gen_reg_rtx (word_mode);
2009               carry_out = emit_store_flag_force (carry_out,
2010                                                  (binoptab == add_optab
2011                                                   ? LT : GT),
2012                                                  x, op0_piece,
2013                                                  word_mode, 1, normalizep);
2014             }
2015
2016           if (i > 0)
2017             {
2018               rtx newx;
2019
2020               /* Add/subtract previous carry to main result.  */
2021               newx = expand_binop (word_mode,
2022                                    normalizep == 1 ? binoptab : otheroptab,
2023                                    x, carry_in,
2024                                    NULL_RTX, 1, next_methods);
2025
2026               if (i + 1 < nwords)
2027                 {
2028                   /* Get out carry from adding/subtracting carry in.  */
2029                   rtx carry_tmp = gen_reg_rtx (word_mode);
2030                   carry_tmp = emit_store_flag_force (carry_tmp,
2031                                                      (binoptab == add_optab
2032                                                       ? LT : GT),
2033                                                      newx, x,
2034                                                      word_mode, 1, normalizep);
2035
2036                   /* Logical-ior the two poss. carry together.  */
2037                   carry_out = expand_binop (word_mode, ior_optab,
2038                                             carry_out, carry_tmp,
2039                                             carry_out, 0, next_methods);
2040                   if (carry_out == 0)
2041                     break;
2042                 }
2043               emit_move_insn (target_piece, newx);
2044             }
2045           else
2046             {
2047               if (x != target_piece)
2048                 emit_move_insn (target_piece, x);
2049             }
2050
2051           carry_in = carry_out;
2052         }
2053
2054       if (i == GET_MODE_BITSIZE (mode) / (unsigned) BITS_PER_WORD)
2055         {
2056           if (optab_handler (mov_optab, mode) != CODE_FOR_nothing
2057               || ! rtx_equal_p (target, xtarget))
2058             {
2059               rtx temp = emit_move_insn (target, xtarget);
2060
2061               set_dst_reg_note (temp, REG_EQUAL,
2062                                 gen_rtx_fmt_ee (optab_to_code (binoptab),
2063                                                 mode, copy_rtx (xop0),
2064                                                 copy_rtx (xop1)),
2065                                 target);
2066             }
2067           else
2068             target = xtarget;
2069
2070           return target;
2071         }
2072
2073       else
2074         delete_insns_since (last);
2075     }
2076
2077   /* Attempt to synthesize double word multiplies using a sequence of word
2078      mode multiplications.  We first attempt to generate a sequence using a
2079      more efficient unsigned widening multiply, and if that fails we then
2080      try using a signed widening multiply.  */
2081
2082   if (binoptab == smul_optab
2083       && mclass == MODE_INT
2084       && GET_MODE_SIZE (mode) == 2 * UNITS_PER_WORD
2085       && optab_handler (smul_optab, word_mode) != CODE_FOR_nothing
2086       && optab_handler (add_optab, word_mode) != CODE_FOR_nothing)
2087     {
2088       rtx product = NULL_RTX;
2089       if (widening_optab_handler (umul_widen_optab, mode, word_mode)
2090             != CODE_FOR_nothing)
2091         {
2092           product = expand_doubleword_mult (mode, op0, op1, target,
2093                                             true, methods);
2094           if (!product)
2095             delete_insns_since (last);
2096         }
2097
2098       if (product == NULL_RTX
2099           && widening_optab_handler (smul_widen_optab, mode, word_mode)
2100                 != CODE_FOR_nothing)
2101         {
2102           product = expand_doubleword_mult (mode, op0, op1, target,
2103                                             false, methods);
2104           if (!product)
2105             delete_insns_since (last);
2106         }
2107
2108       if (product != NULL_RTX)
2109         {
2110           if (optab_handler (mov_optab, mode) != CODE_FOR_nothing)
2111             {
2112               temp = emit_move_insn (target ? target : product, product);
2113               set_dst_reg_note (temp,
2114                                 REG_EQUAL,
2115                                 gen_rtx_fmt_ee (MULT, mode,
2116                                                 copy_rtx (op0),
2117                                                 copy_rtx (op1)),
2118                                 target ? target : product);
2119             }
2120           return product;
2121         }
2122     }
2123
2124   /* It can't be open-coded in this mode.
2125      Use a library call if one is available and caller says that's ok.  */
2126
2127   libfunc = optab_libfunc (binoptab, mode);
2128   if (libfunc
2129       && (methods == OPTAB_LIB || methods == OPTAB_LIB_WIDEN))
2130     {
2131       rtx_insn *insns;
2132       rtx op1x = op1;
2133       machine_mode op1_mode = mode;
2134       rtx value;
2135
2136       start_sequence ();
2137
2138       if (shift_optab_p (binoptab))
2139         {
2140           op1_mode = targetm.libgcc_shift_count_mode ();
2141           /* Specify unsigned here,
2142              since negative shift counts are meaningless.  */
2143           op1x = convert_to_mode (op1_mode, op1, 1);
2144         }
2145
2146       if (GET_MODE (op0) != VOIDmode
2147           && GET_MODE (op0) != mode)
2148         op0 = convert_to_mode (mode, op0, unsignedp);
2149
2150       /* Pass 1 for NO_QUEUE so we don't lose any increments
2151          if the libcall is cse'd or moved.  */
2152       value = emit_library_call_value (libfunc,
2153                                        NULL_RTX, LCT_CONST, mode, 2,
2154                                        op0, mode, op1x, op1_mode);
2155
2156       insns = get_insns ();
2157       end_sequence ();
2158
2159       target = gen_reg_rtx (mode);
2160       emit_libcall_block_1 (insns, target, value,
2161                             gen_rtx_fmt_ee (optab_to_code (binoptab),
2162                                             mode, op0, op1),
2163                             trapv_binoptab_p (binoptab));
2164
2165       return target;
2166     }
2167
2168   delete_insns_since (last);
2169
2170   /* It can't be done in this mode.  Can we do it in a wider mode?  */
2171
2172   if (! (methods == OPTAB_WIDEN || methods == OPTAB_LIB_WIDEN
2173          || methods == OPTAB_MUST_WIDEN))
2174     {
2175       /* Caller says, don't even try.  */
2176       delete_insns_since (entry_last);
2177       return 0;
2178     }
2179
2180   /* Compute the value of METHODS to pass to recursive calls.
2181      Don't allow widening to be tried recursively.  */
2182
2183   methods = (methods == OPTAB_LIB_WIDEN ? OPTAB_LIB : OPTAB_DIRECT);
2184
2185   /* Look for a wider mode of the same class for which it appears we can do
2186      the operation.  */
2187
2188   if (CLASS_HAS_WIDER_MODES_P (mclass))
2189     {
2190       for (wider_mode = GET_MODE_WIDER_MODE (mode);
2191            wider_mode != VOIDmode;
2192            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2193         {
2194           if (find_widening_optab_handler (binoptab, wider_mode, mode, 1)
2195                   != CODE_FOR_nothing
2196               || (methods == OPTAB_LIB
2197                   && optab_libfunc (binoptab, wider_mode)))
2198             {
2199               rtx xop0 = op0, xop1 = op1;
2200               int no_extend = 0;
2201
2202               /* For certain integer operations, we need not actually extend
2203                  the narrow operands, as long as we will truncate
2204                  the results to the same narrowness.  */
2205
2206               if ((binoptab == ior_optab || binoptab == and_optab
2207                    || binoptab == xor_optab
2208                    || binoptab == add_optab || binoptab == sub_optab
2209                    || binoptab == smul_optab || binoptab == ashl_optab)
2210                   && mclass == MODE_INT)
2211                 no_extend = 1;
2212
2213               xop0 = widen_operand (xop0, wider_mode, mode,
2214                                     unsignedp, no_extend);
2215
2216               /* The second operand of a shift must always be extended.  */
2217               xop1 = widen_operand (xop1, wider_mode, mode, unsignedp,
2218                                     no_extend && binoptab != ashl_optab);
2219
2220               temp = expand_binop (wider_mode, binoptab, xop0, xop1, NULL_RTX,
2221                                    unsignedp, methods);
2222               if (temp)
2223                 {
2224                   if (mclass != MODE_INT
2225                       || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
2226                     {
2227                       if (target == 0)
2228                         target = gen_reg_rtx (mode);
2229                       convert_move (target, temp, 0);
2230                       return target;
2231                     }
2232                   else
2233                     return gen_lowpart (mode, temp);
2234                 }
2235               else
2236                 delete_insns_since (last);
2237             }
2238         }
2239     }
2240
2241   delete_insns_since (entry_last);
2242   return 0;
2243 }
2244 \f
2245 /* Expand a binary operator which has both signed and unsigned forms.
2246    UOPTAB is the optab for unsigned operations, and SOPTAB is for
2247    signed operations.
2248
2249    If we widen unsigned operands, we may use a signed wider operation instead
2250    of an unsigned wider operation, since the result would be the same.  */
2251
2252 rtx
2253 sign_expand_binop (machine_mode mode, optab uoptab, optab soptab,
2254                    rtx op0, rtx op1, rtx target, int unsignedp,
2255                    enum optab_methods methods)
2256 {
2257   rtx temp;
2258   optab direct_optab = unsignedp ? uoptab : soptab;
2259   bool save_enable;
2260
2261   /* Do it without widening, if possible.  */
2262   temp = expand_binop (mode, direct_optab, op0, op1, target,
2263                        unsignedp, OPTAB_DIRECT);
2264   if (temp || methods == OPTAB_DIRECT)
2265     return temp;
2266
2267   /* Try widening to a signed int.  Disable any direct use of any
2268      signed insn in the current mode.  */
2269   save_enable = swap_optab_enable (soptab, mode, false);
2270
2271   temp = expand_binop (mode, soptab, op0, op1, target,
2272                        unsignedp, OPTAB_WIDEN);
2273
2274   /* For unsigned operands, try widening to an unsigned int.  */
2275   if (!temp && unsignedp)
2276     temp = expand_binop (mode, uoptab, op0, op1, target,
2277                          unsignedp, OPTAB_WIDEN);
2278   if (temp || methods == OPTAB_WIDEN)
2279     goto egress;
2280
2281   /* Use the right width libcall if that exists.  */
2282   temp = expand_binop (mode, direct_optab, op0, op1, target,
2283                        unsignedp, OPTAB_LIB);
2284   if (temp || methods == OPTAB_LIB)
2285     goto egress;
2286
2287   /* Must widen and use a libcall, use either signed or unsigned.  */
2288   temp = expand_binop (mode, soptab, op0, op1, target,
2289                        unsignedp, methods);
2290   if (!temp && unsignedp)
2291     temp = expand_binop (mode, uoptab, op0, op1, target,
2292                          unsignedp, methods);
2293
2294  egress:
2295   /* Undo the fiddling above.  */
2296   if (save_enable)
2297     swap_optab_enable (soptab, mode, true);
2298   return temp;
2299 }
2300 \f
2301 /* Generate code to perform an operation specified by UNOPPTAB
2302    on operand OP0, with two results to TARG0 and TARG1.
2303    We assume that the order of the operands for the instruction
2304    is TARG0, TARG1, OP0.
2305
2306    Either TARG0 or TARG1 may be zero, but what that means is that
2307    the result is not actually wanted.  We will generate it into
2308    a dummy pseudo-reg and discard it.  They may not both be zero.
2309
2310    Returns 1 if this operation can be performed; 0 if not.  */
2311
2312 int
2313 expand_twoval_unop (optab unoptab, rtx op0, rtx targ0, rtx targ1,
2314                     int unsignedp)
2315 {
2316   machine_mode mode = GET_MODE (targ0 ? targ0 : targ1);
2317   enum mode_class mclass;
2318   machine_mode wider_mode;
2319   rtx_insn *entry_last = get_last_insn ();
2320   rtx_insn *last;
2321
2322   mclass = GET_MODE_CLASS (mode);
2323
2324   if (!targ0)
2325     targ0 = gen_reg_rtx (mode);
2326   if (!targ1)
2327     targ1 = gen_reg_rtx (mode);
2328
2329   /* Record where to go back to if we fail.  */
2330   last = get_last_insn ();
2331
2332   if (optab_handler (unoptab, mode) != CODE_FOR_nothing)
2333     {
2334       struct expand_operand ops[3];
2335       enum insn_code icode = optab_handler (unoptab, mode);
2336
2337       create_fixed_operand (&ops[0], targ0);
2338       create_fixed_operand (&ops[1], targ1);
2339       create_convert_operand_from (&ops[2], op0, mode, unsignedp);
2340       if (maybe_expand_insn (icode, 3, ops))
2341         return 1;
2342     }
2343
2344   /* It can't be done in this mode.  Can we do it in a wider mode?  */
2345
2346   if (CLASS_HAS_WIDER_MODES_P (mclass))
2347     {
2348       for (wider_mode = GET_MODE_WIDER_MODE (mode);
2349            wider_mode != VOIDmode;
2350            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2351         {
2352           if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
2353             {
2354               rtx t0 = gen_reg_rtx (wider_mode);
2355               rtx t1 = gen_reg_rtx (wider_mode);
2356               rtx cop0 = convert_modes (wider_mode, mode, op0, unsignedp);
2357
2358               if (expand_twoval_unop (unoptab, cop0, t0, t1, unsignedp))
2359                 {
2360                   convert_move (targ0, t0, unsignedp);
2361                   convert_move (targ1, t1, unsignedp);
2362                   return 1;
2363                 }
2364               else
2365                 delete_insns_since (last);
2366             }
2367         }
2368     }
2369
2370   delete_insns_since (entry_last);
2371   return 0;
2372 }
2373 \f
2374 /* Generate code to perform an operation specified by BINOPTAB
2375    on operands OP0 and OP1, with two results to TARG1 and TARG2.
2376    We assume that the order of the operands for the instruction
2377    is TARG0, OP0, OP1, TARG1, which would fit a pattern like
2378    [(set TARG0 (operate OP0 OP1)) (set TARG1 (operate ...))].
2379
2380    Either TARG0 or TARG1 may be zero, but what that means is that
2381    the result is not actually wanted.  We will generate it into
2382    a dummy pseudo-reg and discard it.  They may not both be zero.
2383
2384    Returns 1 if this operation can be performed; 0 if not.  */
2385
2386 int
2387 expand_twoval_binop (optab binoptab, rtx op0, rtx op1, rtx targ0, rtx targ1,
2388                      int unsignedp)
2389 {
2390   machine_mode mode = GET_MODE (targ0 ? targ0 : targ1);
2391   enum mode_class mclass;
2392   machine_mode wider_mode;
2393   rtx_insn *entry_last = get_last_insn ();
2394   rtx_insn *last;
2395
2396   mclass = GET_MODE_CLASS (mode);
2397
2398   if (!targ0)
2399     targ0 = gen_reg_rtx (mode);
2400   if (!targ1)
2401     targ1 = gen_reg_rtx (mode);
2402
2403   /* Record where to go back to if we fail.  */
2404   last = get_last_insn ();
2405
2406   if (optab_handler (binoptab, mode) != CODE_FOR_nothing)
2407     {
2408       struct expand_operand ops[4];
2409       enum insn_code icode = optab_handler (binoptab, mode);
2410       machine_mode mode0 = insn_data[icode].operand[1].mode;
2411       machine_mode mode1 = insn_data[icode].operand[2].mode;
2412       rtx xop0 = op0, xop1 = op1;
2413
2414       /* If we are optimizing, force expensive constants into a register.  */
2415       xop0 = avoid_expensive_constant (mode0, binoptab, 0, xop0, unsignedp);
2416       xop1 = avoid_expensive_constant (mode1, binoptab, 1, xop1, unsignedp);
2417
2418       create_fixed_operand (&ops[0], targ0);
2419       create_convert_operand_from (&ops[1], op0, mode, unsignedp);
2420       create_convert_operand_from (&ops[2], op1, mode, unsignedp);
2421       create_fixed_operand (&ops[3], targ1);
2422       if (maybe_expand_insn (icode, 4, ops))
2423         return 1;
2424       delete_insns_since (last);
2425     }
2426
2427   /* It can't be done in this mode.  Can we do it in a wider mode?  */
2428
2429   if (CLASS_HAS_WIDER_MODES_P (mclass))
2430     {
2431       for (wider_mode = GET_MODE_WIDER_MODE (mode);
2432            wider_mode != VOIDmode;
2433            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2434         {
2435           if (optab_handler (binoptab, wider_mode) != CODE_FOR_nothing)
2436             {
2437               rtx t0 = gen_reg_rtx (wider_mode);
2438               rtx t1 = gen_reg_rtx (wider_mode);
2439               rtx cop0 = convert_modes (wider_mode, mode, op0, unsignedp);
2440               rtx cop1 = convert_modes (wider_mode, mode, op1, unsignedp);
2441
2442               if (expand_twoval_binop (binoptab, cop0, cop1,
2443                                        t0, t1, unsignedp))
2444                 {
2445                   convert_move (targ0, t0, unsignedp);
2446                   convert_move (targ1, t1, unsignedp);
2447                   return 1;
2448                 }
2449               else
2450                 delete_insns_since (last);
2451             }
2452         }
2453     }
2454
2455   delete_insns_since (entry_last);
2456   return 0;
2457 }
2458
2459 /* Expand the two-valued library call indicated by BINOPTAB, but
2460    preserve only one of the values.  If TARG0 is non-NULL, the first
2461    value is placed into TARG0; otherwise the second value is placed
2462    into TARG1.  Exactly one of TARG0 and TARG1 must be non-NULL.  The
2463    value stored into TARG0 or TARG1 is equivalent to (CODE OP0 OP1).
2464    This routine assumes that the value returned by the library call is
2465    as if the return value was of an integral mode twice as wide as the
2466    mode of OP0.  Returns 1 if the call was successful.  */
2467
2468 bool
2469 expand_twoval_binop_libfunc (optab binoptab, rtx op0, rtx op1,
2470                              rtx targ0, rtx targ1, enum rtx_code code)
2471 {
2472   machine_mode mode;
2473   machine_mode libval_mode;
2474   rtx libval;
2475   rtx_insn *insns;
2476   rtx libfunc;
2477
2478   /* Exactly one of TARG0 or TARG1 should be non-NULL.  */
2479   gcc_assert (!targ0 != !targ1);
2480
2481   mode = GET_MODE (op0);
2482   libfunc = optab_libfunc (binoptab, mode);
2483   if (!libfunc)
2484     return false;
2485
2486   /* The value returned by the library function will have twice as
2487      many bits as the nominal MODE.  */
2488   libval_mode = smallest_mode_for_size (2 * GET_MODE_BITSIZE (mode),
2489                                         MODE_INT);
2490   start_sequence ();
2491   libval = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
2492                                     libval_mode, 2,
2493                                     op0, mode,
2494                                     op1, mode);
2495   /* Get the part of VAL containing the value that we want.  */
2496   libval = simplify_gen_subreg (mode, libval, libval_mode,
2497                                 targ0 ? 0 : GET_MODE_SIZE (mode));
2498   insns = get_insns ();
2499   end_sequence ();
2500   /* Move the into the desired location.  */
2501   emit_libcall_block (insns, targ0 ? targ0 : targ1, libval,
2502                       gen_rtx_fmt_ee (code, mode, op0, op1));
2503
2504   return true;
2505 }
2506
2507 \f
2508 /* Wrapper around expand_unop which takes an rtx code to specify
2509    the operation to perform, not an optab pointer.  All other
2510    arguments are the same.  */
2511 rtx
2512 expand_simple_unop (machine_mode mode, enum rtx_code code, rtx op0,
2513                     rtx target, int unsignedp)
2514 {
2515   optab unop = code_to_optab (code);
2516   gcc_assert (unop);
2517
2518   return expand_unop (mode, unop, op0, target, unsignedp);
2519 }
2520
2521 /* Try calculating
2522         (clz:narrow x)
2523    as
2524         (clz:wide (zero_extend:wide x)) - ((width wide) - (width narrow)).
2525
2526    A similar operation can be used for clrsb.  UNOPTAB says which operation
2527    we are trying to expand.  */
2528 static rtx
2529 widen_leading (machine_mode mode, rtx op0, rtx target, optab unoptab)
2530 {
2531   enum mode_class mclass = GET_MODE_CLASS (mode);
2532   if (CLASS_HAS_WIDER_MODES_P (mclass))
2533     {
2534       machine_mode wider_mode;
2535       for (wider_mode = GET_MODE_WIDER_MODE (mode);
2536            wider_mode != VOIDmode;
2537            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2538         {
2539           if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
2540             {
2541               rtx xop0, temp;
2542               rtx_insn *last;
2543
2544               last = get_last_insn ();
2545
2546               if (target == 0)
2547                 target = gen_reg_rtx (mode);
2548               xop0 = widen_operand (op0, wider_mode, mode,
2549                                     unoptab != clrsb_optab, false);
2550               temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
2551                                   unoptab != clrsb_optab);
2552               if (temp != 0)
2553                 temp = expand_binop
2554                   (wider_mode, sub_optab, temp,
2555                    gen_int_mode (GET_MODE_PRECISION (wider_mode)
2556                                  - GET_MODE_PRECISION (mode),
2557                                  wider_mode),
2558                    target, true, OPTAB_DIRECT);
2559               if (temp == 0)
2560                 delete_insns_since (last);
2561
2562               return temp;
2563             }
2564         }
2565     }
2566   return 0;
2567 }
2568
2569 /* Try calculating clz of a double-word quantity as two clz's of word-sized
2570    quantities, choosing which based on whether the high word is nonzero.  */
2571 static rtx
2572 expand_doubleword_clz (machine_mode mode, rtx op0, rtx target)
2573 {
2574   rtx xop0 = force_reg (mode, op0);
2575   rtx subhi = gen_highpart (word_mode, xop0);
2576   rtx sublo = gen_lowpart (word_mode, xop0);
2577   rtx_code_label *hi0_label = gen_label_rtx ();
2578   rtx_code_label *after_label = gen_label_rtx ();
2579   rtx_insn *seq;
2580   rtx temp, result;
2581
2582   /* If we were not given a target, use a word_mode register, not a
2583      'mode' register.  The result will fit, and nobody is expecting
2584      anything bigger (the return type of __builtin_clz* is int).  */
2585   if (!target)
2586     target = gen_reg_rtx (word_mode);
2587
2588   /* In any case, write to a word_mode scratch in both branches of the
2589      conditional, so we can ensure there is a single move insn setting
2590      'target' to tag a REG_EQUAL note on.  */
2591   result = gen_reg_rtx (word_mode);
2592
2593   start_sequence ();
2594
2595   /* If the high word is not equal to zero,
2596      then clz of the full value is clz of the high word.  */
2597   emit_cmp_and_jump_insns (subhi, CONST0_RTX (word_mode), EQ, 0,
2598                            word_mode, true, hi0_label);
2599
2600   temp = expand_unop_direct (word_mode, clz_optab, subhi, result, true);
2601   if (!temp)
2602     goto fail;
2603
2604   if (temp != result)
2605     convert_move (result, temp, true);
2606
2607   emit_jump_insn (gen_jump (after_label));
2608   emit_barrier ();
2609
2610   /* Else clz of the full value is clz of the low word plus the number
2611      of bits in the high word.  */
2612   emit_label (hi0_label);
2613
2614   temp = expand_unop_direct (word_mode, clz_optab, sublo, 0, true);
2615   if (!temp)
2616     goto fail;
2617   temp = expand_binop (word_mode, add_optab, temp,
2618                        gen_int_mode (GET_MODE_BITSIZE (word_mode), word_mode),
2619                        result, true, OPTAB_DIRECT);
2620   if (!temp)
2621     goto fail;
2622   if (temp != result)
2623     convert_move (result, temp, true);
2624
2625   emit_label (after_label);
2626   convert_move (target, result, true);
2627
2628   seq = get_insns ();
2629   end_sequence ();
2630
2631   add_equal_note (seq, target, CLZ, xop0, 0);
2632   emit_insn (seq);
2633   return target;
2634
2635  fail:
2636   end_sequence ();
2637   return 0;
2638 }
2639
2640 /* Try calculating
2641         (bswap:narrow x)
2642    as
2643         (lshiftrt:wide (bswap:wide x) ((width wide) - (width narrow))).  */
2644 static rtx
2645 widen_bswap (machine_mode mode, rtx op0, rtx target)
2646 {
2647   enum mode_class mclass = GET_MODE_CLASS (mode);
2648   machine_mode wider_mode;
2649   rtx x;
2650   rtx_insn *last;
2651
2652   if (!CLASS_HAS_WIDER_MODES_P (mclass))
2653     return NULL_RTX;
2654
2655   for (wider_mode = GET_MODE_WIDER_MODE (mode);
2656        wider_mode != VOIDmode;
2657        wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2658     if (optab_handler (bswap_optab, wider_mode) != CODE_FOR_nothing)
2659       goto found;
2660   return NULL_RTX;
2661
2662  found:
2663   last = get_last_insn ();
2664
2665   x = widen_operand (op0, wider_mode, mode, true, true);
2666   x = expand_unop (wider_mode, bswap_optab, x, NULL_RTX, true);
2667
2668   gcc_assert (GET_MODE_PRECISION (wider_mode) == GET_MODE_BITSIZE (wider_mode)
2669               && GET_MODE_PRECISION (mode) == GET_MODE_BITSIZE (mode));
2670   if (x != 0)
2671     x = expand_shift (RSHIFT_EXPR, wider_mode, x,
2672                       GET_MODE_BITSIZE (wider_mode)
2673                       - GET_MODE_BITSIZE (mode),
2674                       NULL_RTX, true);
2675
2676   if (x != 0)
2677     {
2678       if (target == 0)
2679         target = gen_reg_rtx (mode);
2680       emit_move_insn (target, gen_lowpart (mode, x));
2681     }
2682   else
2683     delete_insns_since (last);
2684
2685   return target;
2686 }
2687
2688 /* Try calculating bswap as two bswaps of two word-sized operands.  */
2689
2690 static rtx
2691 expand_doubleword_bswap (machine_mode mode, rtx op, rtx target)
2692 {
2693   rtx t0, t1;
2694
2695   t1 = expand_unop (word_mode, bswap_optab,
2696                     operand_subword_force (op, 0, mode), NULL_RTX, true);
2697   t0 = expand_unop (word_mode, bswap_optab,
2698                     operand_subword_force (op, 1, mode), NULL_RTX, true);
2699
2700   if (target == 0 || !valid_multiword_target_p (target))
2701     target = gen_reg_rtx (mode);
2702   if (REG_P (target))
2703     emit_clobber (target);
2704   emit_move_insn (operand_subword (target, 0, 1, mode), t0);
2705   emit_move_insn (operand_subword (target, 1, 1, mode), t1);
2706
2707   return target;
2708 }
2709
2710 /* Try calculating (parity x) as (and (popcount x) 1), where
2711    popcount can also be done in a wider mode.  */
2712 static rtx
2713 expand_parity (machine_mode mode, rtx op0, rtx target)
2714 {
2715   enum mode_class mclass = GET_MODE_CLASS (mode);
2716   if (CLASS_HAS_WIDER_MODES_P (mclass))
2717     {
2718       machine_mode wider_mode;
2719       for (wider_mode = mode; wider_mode != VOIDmode;
2720            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2721         {
2722           if (optab_handler (popcount_optab, wider_mode) != CODE_FOR_nothing)
2723             {
2724               rtx xop0, temp;
2725               rtx_insn *last;
2726
2727               last = get_last_insn ();
2728
2729               if (target == 0)
2730                 target = gen_reg_rtx (mode);
2731               xop0 = widen_operand (op0, wider_mode, mode, true, false);
2732               temp = expand_unop (wider_mode, popcount_optab, xop0, NULL_RTX,
2733                                   true);
2734               if (temp != 0)
2735                 temp = expand_binop (wider_mode, and_optab, temp, const1_rtx,
2736                                      target, true, OPTAB_DIRECT);
2737               if (temp == 0)
2738                 delete_insns_since (last);
2739
2740               return temp;
2741             }
2742         }
2743     }
2744   return 0;
2745 }
2746
2747 /* Try calculating ctz(x) as K - clz(x & -x) ,
2748    where K is GET_MODE_PRECISION(mode) - 1.
2749
2750    Both __builtin_ctz and __builtin_clz are undefined at zero, so we
2751    don't have to worry about what the hardware does in that case.  (If
2752    the clz instruction produces the usual value at 0, which is K, the
2753    result of this code sequence will be -1; expand_ffs, below, relies
2754    on this.  It might be nice to have it be K instead, for consistency
2755    with the (very few) processors that provide a ctz with a defined
2756    value, but that would take one more instruction, and it would be
2757    less convenient for expand_ffs anyway.  */
2758
2759 static rtx
2760 expand_ctz (machine_mode mode, rtx op0, rtx target)
2761 {
2762   rtx_insn *seq;
2763   rtx temp;
2764
2765   if (optab_handler (clz_optab, mode) == CODE_FOR_nothing)
2766     return 0;
2767
2768   start_sequence ();
2769
2770   temp = expand_unop_direct (mode, neg_optab, op0, NULL_RTX, true);
2771   if (temp)
2772     temp = expand_binop (mode, and_optab, op0, temp, NULL_RTX,
2773                          true, OPTAB_DIRECT);
2774   if (temp)
2775     temp = expand_unop_direct (mode, clz_optab, temp, NULL_RTX, true);
2776   if (temp)
2777     temp = expand_binop (mode, sub_optab,
2778                          gen_int_mode (GET_MODE_PRECISION (mode) - 1, mode),
2779                          temp, target,
2780                          true, OPTAB_DIRECT);
2781   if (temp == 0)
2782     {
2783       end_sequence ();
2784       return 0;
2785     }
2786
2787   seq = get_insns ();
2788   end_sequence ();
2789
2790   add_equal_note (seq, temp, CTZ, op0, 0);
2791   emit_insn (seq);
2792   return temp;
2793 }
2794
2795
2796 /* Try calculating ffs(x) using ctz(x) if we have that instruction, or
2797    else with the sequence used by expand_clz.
2798
2799    The ffs builtin promises to return zero for a zero value and ctz/clz
2800    may have an undefined value in that case.  If they do not give us a
2801    convenient value, we have to generate a test and branch.  */
2802 static rtx
2803 expand_ffs (machine_mode mode, rtx op0, rtx target)
2804 {
2805   HOST_WIDE_INT val = 0;
2806   bool defined_at_zero = false;
2807   rtx temp;
2808   rtx_insn *seq;
2809
2810   if (optab_handler (ctz_optab, mode) != CODE_FOR_nothing)
2811     {
2812       start_sequence ();
2813
2814       temp = expand_unop_direct (mode, ctz_optab, op0, 0, true);
2815       if (!temp)
2816         goto fail;
2817
2818       defined_at_zero = (CTZ_DEFINED_VALUE_AT_ZERO (mode, val) == 2);
2819     }
2820   else if (optab_handler (clz_optab, mode) != CODE_FOR_nothing)
2821     {
2822       start_sequence ();
2823       temp = expand_ctz (mode, op0, 0);
2824       if (!temp)
2825         goto fail;
2826
2827       if (CLZ_DEFINED_VALUE_AT_ZERO (mode, val) == 2)
2828         {
2829           defined_at_zero = true;
2830           val = (GET_MODE_PRECISION (mode) - 1) - val;
2831         }
2832     }
2833   else
2834     return 0;
2835
2836   if (defined_at_zero && val == -1)
2837     /* No correction needed at zero.  */;
2838   else
2839     {
2840       /* We don't try to do anything clever with the situation found
2841          on some processors (eg Alpha) where ctz(0:mode) ==
2842          bitsize(mode).  If someone can think of a way to send N to -1
2843          and leave alone all values in the range 0..N-1 (where N is a
2844          power of two), cheaper than this test-and-branch, please add it.
2845
2846          The test-and-branch is done after the operation itself, in case
2847          the operation sets condition codes that can be recycled for this.
2848          (This is true on i386, for instance.)  */
2849
2850       rtx_code_label *nonzero_label = gen_label_rtx ();
2851       emit_cmp_and_jump_insns (op0, CONST0_RTX (mode), NE, 0,
2852                                mode, true, nonzero_label);
2853
2854       convert_move (temp, GEN_INT (-1), false);
2855       emit_label (nonzero_label);
2856     }
2857
2858   /* temp now has a value in the range -1..bitsize-1.  ffs is supposed
2859      to produce a value in the range 0..bitsize.  */
2860   temp = expand_binop (mode, add_optab, temp, gen_int_mode (1, mode),
2861                        target, false, OPTAB_DIRECT);
2862   if (!temp)
2863     goto fail;
2864
2865   seq = get_insns ();
2866   end_sequence ();
2867
2868   add_equal_note (seq, temp, FFS, op0, 0);
2869   emit_insn (seq);
2870   return temp;
2871
2872  fail:
2873   end_sequence ();
2874   return 0;
2875 }
2876
2877 /* Extract the OMODE lowpart from VAL, which has IMODE.  Under certain
2878    conditions, VAL may already be a SUBREG against which we cannot generate
2879    a further SUBREG.  In this case, we expect forcing the value into a
2880    register will work around the situation.  */
2881
2882 static rtx
2883 lowpart_subreg_maybe_copy (machine_mode omode, rtx val,
2884                            machine_mode imode)
2885 {
2886   rtx ret;
2887   ret = lowpart_subreg (omode, val, imode);
2888   if (ret == NULL)
2889     {
2890       val = force_reg (imode, val);
2891       ret = lowpart_subreg (omode, val, imode);
2892       gcc_assert (ret != NULL);
2893     }
2894   return ret;
2895 }
2896
2897 /* Expand a floating point absolute value or negation operation via a
2898    logical operation on the sign bit.  */
2899
2900 static rtx
2901 expand_absneg_bit (enum rtx_code code, machine_mode mode,
2902                    rtx op0, rtx target)
2903 {
2904   const struct real_format *fmt;
2905   int bitpos, word, nwords, i;
2906   machine_mode imode;
2907   rtx temp;
2908   rtx_insn *insns;
2909
2910   /* The format has to have a simple sign bit.  */
2911   fmt = REAL_MODE_FORMAT (mode);
2912   if (fmt == NULL)
2913     return NULL_RTX;
2914
2915   bitpos = fmt->signbit_rw;
2916   if (bitpos < 0)
2917     return NULL_RTX;
2918
2919   /* Don't create negative zeros if the format doesn't support them.  */
2920   if (code == NEG && !fmt->has_signed_zero)
2921     return NULL_RTX;
2922
2923   if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
2924     {
2925       imode = int_mode_for_mode (mode);
2926       if (imode == BLKmode)
2927         return NULL_RTX;
2928       word = 0;
2929       nwords = 1;
2930     }
2931   else
2932     {
2933       imode = word_mode;
2934
2935       if (FLOAT_WORDS_BIG_ENDIAN)
2936         word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
2937       else
2938         word = bitpos / BITS_PER_WORD;
2939       bitpos = bitpos % BITS_PER_WORD;
2940       nwords = (GET_MODE_BITSIZE (mode) + BITS_PER_WORD - 1) / BITS_PER_WORD;
2941     }
2942
2943   wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
2944   if (code == ABS)
2945     mask = ~mask;
2946
2947   if (target == 0
2948       || target == op0
2949       || (nwords > 1 && !valid_multiword_target_p (target)))
2950     target = gen_reg_rtx (mode);
2951
2952   if (nwords > 1)
2953     {
2954       start_sequence ();
2955
2956       for (i = 0; i < nwords; ++i)
2957         {
2958           rtx targ_piece = operand_subword (target, i, 1, mode);
2959           rtx op0_piece = operand_subword_force (op0, i, mode);
2960
2961           if (i == word)
2962             {
2963               temp = expand_binop (imode, code == ABS ? and_optab : xor_optab,
2964                                    op0_piece,
2965                                    immed_wide_int_const (mask, imode),
2966                                    targ_piece, 1, OPTAB_LIB_WIDEN);
2967               if (temp != targ_piece)
2968                 emit_move_insn (targ_piece, temp);
2969             }
2970           else
2971             emit_move_insn (targ_piece, op0_piece);
2972         }
2973
2974       insns = get_insns ();
2975       end_sequence ();
2976
2977       emit_insn (insns);
2978     }
2979   else
2980     {
2981       temp = expand_binop (imode, code == ABS ? and_optab : xor_optab,
2982                            gen_lowpart (imode, op0),
2983                            immed_wide_int_const (mask, imode),
2984                            gen_lowpart (imode, target), 1, OPTAB_LIB_WIDEN);
2985       target = lowpart_subreg_maybe_copy (mode, temp, imode);
2986
2987       set_dst_reg_note (get_last_insn (), REG_EQUAL,
2988                         gen_rtx_fmt_e (code, mode, copy_rtx (op0)),
2989                         target);
2990     }
2991
2992   return target;
2993 }
2994
2995 /* As expand_unop, but will fail rather than attempt the operation in a
2996    different mode or with a libcall.  */
2997 static rtx
2998 expand_unop_direct (machine_mode mode, optab unoptab, rtx op0, rtx target,
2999              int unsignedp)
3000 {
3001   if (optab_handler (unoptab, mode) != CODE_FOR_nothing)
3002     {
3003       struct expand_operand ops[2];
3004       enum insn_code icode = optab_handler (unoptab, mode);
3005       rtx_insn *last = get_last_insn ();
3006       rtx_insn *pat;
3007
3008       create_output_operand (&ops[0], target, mode);
3009       create_convert_operand_from (&ops[1], op0, mode, unsignedp);
3010       pat = maybe_gen_insn (icode, 2, ops);
3011       if (pat)
3012         {
3013           if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
3014               && ! add_equal_note (pat, ops[0].value,
3015                                    optab_to_code (unoptab),
3016                                    ops[1].value, NULL_RTX))
3017             {
3018               delete_insns_since (last);
3019               return expand_unop (mode, unoptab, op0, NULL_RTX, unsignedp);
3020             }
3021
3022           emit_insn (pat);
3023
3024           return ops[0].value;
3025         }
3026     }
3027   return 0;
3028 }
3029
3030 /* Generate code to perform an operation specified by UNOPTAB
3031    on operand OP0, with result having machine-mode MODE.
3032
3033    UNSIGNEDP is for the case where we have to widen the operands
3034    to perform the operation.  It says to use zero-extension.
3035
3036    If TARGET is nonzero, the value
3037    is generated there, if it is convenient to do so.
3038    In all cases an rtx is returned for the locus of the value;
3039    this may or may not be TARGET.  */
3040
3041 rtx
3042 expand_unop (machine_mode mode, optab unoptab, rtx op0, rtx target,
3043              int unsignedp)
3044 {
3045   enum mode_class mclass = GET_MODE_CLASS (mode);
3046   machine_mode wider_mode;
3047   rtx temp;
3048   rtx libfunc;
3049
3050   temp = expand_unop_direct (mode, unoptab, op0, target, unsignedp);
3051   if (temp)
3052     return temp;
3053
3054   /* It can't be done in this mode.  Can we open-code it in a wider mode?  */
3055
3056   /* Widening (or narrowing) clz needs special treatment.  */
3057   if (unoptab == clz_optab)
3058     {
3059       temp = widen_leading (mode, op0, target, unoptab);
3060       if (temp)
3061         return temp;
3062
3063       if (GET_MODE_SIZE (mode) == 2 * UNITS_PER_WORD
3064           && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
3065         {
3066           temp = expand_doubleword_clz (mode, op0, target);
3067           if (temp)
3068             return temp;
3069         }
3070
3071       goto try_libcall;
3072     }
3073
3074   if (unoptab == clrsb_optab)
3075     {
3076       temp = widen_leading (mode, op0, target, unoptab);
3077       if (temp)
3078         return temp;
3079       goto try_libcall;
3080     }
3081
3082   /* Widening (or narrowing) bswap needs special treatment.  */
3083   if (unoptab == bswap_optab)
3084     {
3085       /* HImode is special because in this mode BSWAP is equivalent to ROTATE
3086          or ROTATERT.  First try these directly; if this fails, then try the
3087          obvious pair of shifts with allowed widening, as this will probably
3088          be always more efficient than the other fallback methods.  */
3089       if (mode == HImode)
3090         {
3091           rtx_insn *last;
3092           rtx temp1, temp2;
3093
3094           if (optab_handler (rotl_optab, mode) != CODE_FOR_nothing)
3095             {
3096               temp = expand_binop (mode, rotl_optab, op0, GEN_INT (8), target,
3097                                    unsignedp, OPTAB_DIRECT);
3098               if (temp)
3099                 return temp;
3100              }
3101
3102           if (optab_handler (rotr_optab, mode) != CODE_FOR_nothing)
3103             {
3104               temp = expand_binop (mode, rotr_optab, op0, GEN_INT (8), target,
3105                                    unsignedp, OPTAB_DIRECT);
3106               if (temp)
3107                 return temp;
3108             }
3109
3110           last = get_last_insn ();
3111
3112           temp1 = expand_binop (mode, ashl_optab, op0, GEN_INT (8), NULL_RTX,
3113                                 unsignedp, OPTAB_WIDEN);
3114           temp2 = expand_binop (mode, lshr_optab, op0, GEN_INT (8), NULL_RTX,
3115                                 unsignedp, OPTAB_WIDEN);
3116           if (temp1 && temp2)
3117             {
3118               temp = expand_binop (mode, ior_optab, temp1, temp2, target,
3119                                    unsignedp, OPTAB_WIDEN);
3120               if (temp)
3121                 return temp;
3122             }
3123
3124           delete_insns_since (last);
3125         }
3126
3127       temp = widen_bswap (mode, op0, target);
3128       if (temp)
3129         return temp;
3130
3131       if (GET_MODE_SIZE (mode) == 2 * UNITS_PER_WORD
3132           && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
3133         {
3134           temp = expand_doubleword_bswap (mode, op0, target);
3135           if (temp)
3136             return temp;
3137         }
3138
3139       goto try_libcall;
3140     }
3141
3142   if (CLASS_HAS_WIDER_MODES_P (mclass))
3143     for (wider_mode = GET_MODE_WIDER_MODE (mode);
3144          wider_mode != VOIDmode;
3145          wider_mode = GET_MODE_WIDER_MODE (wider_mode))
3146       {
3147         if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
3148           {
3149             rtx xop0 = op0;
3150             rtx_insn *last = get_last_insn ();
3151
3152             /* For certain operations, we need not actually extend
3153                the narrow operand, as long as we will truncate the
3154                results to the same narrowness.  */
3155
3156             xop0 = widen_operand (xop0, wider_mode, mode, unsignedp,
3157                                   (unoptab == neg_optab
3158                                    || unoptab == one_cmpl_optab)
3159                                   && mclass == MODE_INT);
3160
3161             temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
3162                                 unsignedp);
3163
3164             if (temp)
3165               {
3166                 if (mclass != MODE_INT
3167                     || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
3168                   {
3169                     if (target == 0)
3170                       target = gen_reg_rtx (mode);
3171                     convert_move (target, temp, 0);
3172                     return target;
3173                   }
3174                 else
3175                   return gen_lowpart (mode, temp);
3176               }
3177             else
3178               delete_insns_since (last);
3179           }
3180       }
3181
3182   /* These can be done a word at a time.  */
3183   if (unoptab == one_cmpl_optab
3184       && mclass == MODE_INT
3185       && GET_MODE_SIZE (mode) > UNITS_PER_WORD
3186       && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
3187     {
3188       int i;
3189       rtx_insn *insns;
3190
3191       if (target == 0 || target == op0 || !valid_multiword_target_p (target))
3192         target = gen_reg_rtx (mode);
3193
3194       start_sequence ();
3195
3196       /* Do the actual arithmetic.  */
3197       for (i = 0; i < GET_MODE_BITSIZE (mode) / BITS_PER_WORD; i++)
3198         {
3199           rtx target_piece = operand_subword (target, i, 1, mode);
3200           rtx x = expand_unop (word_mode, unoptab,
3201                                operand_subword_force (op0, i, mode),
3202                                target_piece, unsignedp);
3203
3204           if (target_piece != x)
3205             emit_move_insn (target_piece, x);
3206         }
3207
3208       insns = get_insns ();
3209       end_sequence ();
3210
3211       emit_insn (insns);
3212       return target;
3213     }
3214
3215   if (optab_to_code (unoptab) == NEG)
3216     {
3217       /* Try negating floating point values by flipping the sign bit.  */
3218       if (SCALAR_FLOAT_MODE_P (mode))
3219         {
3220           temp = expand_absneg_bit (NEG, mode, op0, target);
3221           if (temp)
3222             return temp;
3223         }
3224
3225       /* If there is no negation pattern, and we have no negative zero,
3226          try subtracting from zero.  */
3227       if (!HONOR_SIGNED_ZEROS (mode))
3228         {
3229           temp = expand_binop (mode, (unoptab == negv_optab
3230                                       ? subv_optab : sub_optab),
3231                                CONST0_RTX (mode), op0, target,
3232                                unsignedp, OPTAB_DIRECT);
3233           if (temp)
3234             return temp;
3235         }
3236     }
3237
3238   /* Try calculating parity (x) as popcount (x) % 2.  */
3239   if (unoptab == parity_optab)
3240     {
3241       temp = expand_parity (mode, op0, target);
3242       if (temp)
3243         return temp;
3244     }
3245
3246   /* Try implementing ffs (x) in terms of clz (x).  */
3247   if (unoptab == ffs_optab)
3248     {
3249       temp = expand_ffs (mode, op0, target);
3250       if (temp)
3251         return temp;
3252     }
3253
3254   /* Try implementing ctz (x) in terms of clz (x).  */
3255   if (unoptab == ctz_optab)
3256     {
3257       temp = expand_ctz (mode, op0, target);
3258       if (temp)
3259         return temp;
3260     }
3261
3262  try_libcall:
3263   /* Now try a library call in this mode.  */
3264   libfunc = optab_libfunc (unoptab, mode);
3265   if (libfunc)
3266     {
3267       rtx_insn *insns;
3268       rtx value;
3269       rtx eq_value;
3270       machine_mode outmode = mode;
3271
3272       /* All of these functions return small values.  Thus we choose to
3273          have them return something that isn't a double-word.  */
3274       if (unoptab == ffs_optab || unoptab == clz_optab || unoptab == ctz_optab
3275           || unoptab == clrsb_optab || unoptab == popcount_optab
3276           || unoptab == parity_optab)
3277         outmode
3278           = GET_MODE (hard_libcall_value (TYPE_MODE (integer_type_node),
3279                                           optab_libfunc (unoptab, mode)));
3280
3281       start_sequence ();
3282
3283       /* Pass 1 for NO_QUEUE so we don't lose any increments
3284          if the libcall is cse'd or moved.  */
3285       value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST, outmode,
3286                                        1, op0, mode);
3287       insns = get_insns ();
3288       end_sequence ();
3289
3290       target = gen_reg_rtx (outmode);
3291       eq_value = gen_rtx_fmt_e (optab_to_code (unoptab), mode, op0);
3292       if (GET_MODE_SIZE (outmode) < GET_MODE_SIZE (mode))
3293         eq_value = simplify_gen_unary (TRUNCATE, outmode, eq_value, mode);
3294       else if (GET_MODE_SIZE (outmode) > GET_MODE_SIZE (mode))
3295         eq_value = simplify_gen_unary (ZERO_EXTEND, outmode, eq_value, mode);
3296       emit_libcall_block_1 (insns, target, value, eq_value,
3297                             trapv_unoptab_p (unoptab));
3298
3299       return target;
3300     }
3301
3302   /* It can't be done in this mode.  Can we do it in a wider mode?  */
3303
3304   if (CLASS_HAS_WIDER_MODES_P (mclass))
3305     {
3306       for (wider_mode = GET_MODE_WIDER_MODE (mode);
3307            wider_mode != VOIDmode;
3308            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
3309         {
3310           if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing
3311               || optab_libfunc (unoptab, wider_mode))
3312             {
3313               rtx xop0 = op0;
3314               rtx_insn *last = get_last_insn ();
3315
3316               /* For certain operations, we need not actually extend
3317                  the narrow operand, as long as we will truncate the
3318                  results to the same narrowness.  */
3319               xop0 = widen_operand (xop0, wider_mode, mode, unsignedp,
3320                                     (unoptab == neg_optab
3321                                      || unoptab == one_cmpl_optab
3322                                      || unoptab == bswap_optab)
3323                                     && mclass == MODE_INT);
3324
3325               temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
3326                                   unsignedp);
3327
3328               /* If we are generating clz using wider mode, adjust the
3329                  result.  Similarly for clrsb.  */
3330               if ((unoptab == clz_optab || unoptab == clrsb_optab)
3331                   && temp != 0)
3332                 temp = expand_binop
3333                   (wider_mode, sub_optab, temp,
3334                    gen_int_mode (GET_MODE_PRECISION (wider_mode)
3335                                  - GET_MODE_PRECISION (mode),
3336                                  wider_mode),
3337                    target, true, OPTAB_DIRECT);
3338
3339               /* Likewise for bswap.  */
3340               if (unoptab == bswap_optab && temp != 0)
3341                 {
3342                   gcc_assert (GET_MODE_PRECISION (wider_mode)
3343                               == GET_MODE_BITSIZE (wider_mode)
3344                               && GET_MODE_PRECISION (mode)
3345                                  == GET_MODE_BITSIZE (mode));
3346
3347                   temp = expand_shift (RSHIFT_EXPR, wider_mode, temp,
3348                                        GET_MODE_BITSIZE (wider_mode)
3349                                        - GET_MODE_BITSIZE (mode),
3350                                        NULL_RTX, true);
3351                 }
3352
3353               if (temp)
3354                 {
3355                   if (mclass != MODE_INT)
3356                     {
3357                       if (target == 0)
3358                         target = gen_reg_rtx (mode);
3359                       convert_move (target, temp, 0);
3360                       return target;
3361                     }
3362                   else
3363                     return gen_lowpart (mode, temp);
3364                 }
3365               else
3366                 delete_insns_since (last);
3367             }
3368         }
3369     }
3370
3371   /* One final attempt at implementing negation via subtraction,
3372      this time allowing widening of the operand.  */
3373   if (optab_to_code (unoptab) == NEG && !HONOR_SIGNED_ZEROS (mode))
3374     {
3375       rtx temp;
3376       temp = expand_binop (mode,
3377                            unoptab == negv_optab ? subv_optab : sub_optab,
3378                            CONST0_RTX (mode), op0,
3379                            target, unsignedp, OPTAB_LIB_WIDEN);
3380       if (temp)
3381         return temp;
3382     }
3383
3384   return 0;
3385 }
3386 \f
3387 /* Emit code to compute the absolute value of OP0, with result to
3388    TARGET if convenient.  (TARGET may be 0.)  The return value says
3389    where the result actually is to be found.
3390
3391    MODE is the mode of the operand; the mode of the result is
3392    different but can be deduced from MODE.
3393
3394  */
3395
3396 rtx
3397 expand_abs_nojump (machine_mode mode, rtx op0, rtx target,
3398                    int result_unsignedp)
3399 {
3400   rtx temp;
3401
3402   if (GET_MODE_CLASS (mode) != MODE_INT
3403       || ! flag_trapv)
3404     result_unsignedp = 1;
3405
3406   /* First try to do it with a special abs instruction.  */
3407   temp = expand_unop (mode, result_unsignedp ? abs_optab : absv_optab,
3408                       op0, target, 0);
3409   if (temp != 0)
3410     return temp;
3411
3412   /* For floating point modes, try clearing the sign bit.  */
3413   if (SCALAR_FLOAT_MODE_P (mode))
3414     {
3415       temp = expand_absneg_bit (ABS, mode, op0, target);
3416       if (temp)
3417         return temp;
3418     }
3419
3420   /* If we have a MAX insn, we can do this as MAX (x, -x).  */
3421   if (optab_handler (smax_optab, mode) != CODE_FOR_nothing
3422       && !HONOR_SIGNED_ZEROS (mode))
3423     {
3424       rtx_insn *last = get_last_insn ();
3425
3426       temp = expand_unop (mode, result_unsignedp ? neg_optab : negv_optab,
3427                           op0, NULL_RTX, 0);
3428       if (temp != 0)
3429         temp = expand_binop (mode, smax_optab, op0, temp, target, 0,
3430                              OPTAB_WIDEN);
3431
3432       if (temp != 0)
3433         return temp;
3434
3435       delete_insns_since (last);
3436     }
3437
3438   /* If this machine has expensive jumps, we can do integer absolute
3439      value of X as (((signed) x >> (W-1)) ^ x) - ((signed) x >> (W-1)),
3440      where W is the width of MODE.  */
3441
3442   if (GET_MODE_CLASS (mode) == MODE_INT
3443       && BRANCH_COST (optimize_insn_for_speed_p (),
3444                       false) >= 2)
3445     {
3446       rtx extended = expand_shift (RSHIFT_EXPR, mode, op0,
3447                                    GET_MODE_PRECISION (mode) - 1,
3448                                    NULL_RTX, 0);
3449
3450       temp = expand_binop (mode, xor_optab, extended, op0, target, 0,
3451                            OPTAB_LIB_WIDEN);
3452       if (temp != 0)
3453         temp = expand_binop (mode, result_unsignedp ? sub_optab : subv_optab,
3454                              temp, extended, target, 0, OPTAB_LIB_WIDEN);
3455
3456       if (temp != 0)
3457         return temp;
3458     }
3459
3460   return NULL_RTX;
3461 }
3462
3463 rtx
3464 expand_abs (machine_mode mode, rtx op0, rtx target,
3465             int result_unsignedp, int safe)
3466 {
3467   rtx temp;
3468   rtx_code_label *op1;
3469
3470   if (GET_MODE_CLASS (mode) != MODE_INT
3471       || ! flag_trapv)
3472     result_unsignedp = 1;
3473
3474   temp = expand_abs_nojump (mode, op0, target, result_unsignedp);
3475   if (temp != 0)
3476     return temp;
3477
3478   /* If that does not win, use conditional jump and negate.  */
3479
3480   /* It is safe to use the target if it is the same
3481      as the source if this is also a pseudo register */
3482   if (op0 == target && REG_P (op0)
3483       && REGNO (op0) >= FIRST_PSEUDO_REGISTER)
3484     safe = 1;
3485
3486   op1 = gen_label_rtx ();
3487   if (target == 0 || ! safe
3488       || GET_MODE (target) != mode
3489       || (MEM_P (target) && MEM_VOLATILE_P (target))
3490       || (REG_P (target)
3491           && REGNO (target) < FIRST_PSEUDO_REGISTER))
3492     target = gen_reg_rtx (mode);
3493
3494   emit_move_insn (target, op0);
3495   NO_DEFER_POP;
3496
3497   do_compare_rtx_and_jump (target, CONST0_RTX (mode), GE, 0, mode,
3498                            NULL_RTX, NULL, op1, -1);
3499
3500   op0 = expand_unop (mode, result_unsignedp ? neg_optab : negv_optab,
3501                      target, target, 0);
3502   if (op0 != target)
3503     emit_move_insn (target, op0);
3504   emit_label (op1);
3505   OK_DEFER_POP;
3506   return target;
3507 }
3508
3509 /* Emit code to compute the one's complement absolute value of OP0
3510    (if (OP0 < 0) OP0 = ~OP0), with result to TARGET if convenient.
3511    (TARGET may be NULL_RTX.)  The return value says where the result
3512    actually is to be found.
3513
3514    MODE is the mode of the operand; the mode of the result is
3515    different but can be deduced from MODE.  */
3516
3517 rtx
3518 expand_one_cmpl_abs_nojump (machine_mode mode, rtx op0, rtx target)
3519 {
3520   rtx temp;
3521
3522   /* Not applicable for floating point modes.  */
3523   if (FLOAT_MODE_P (mode))
3524     return NULL_RTX;
3525
3526   /* If we have a MAX insn, we can do this as MAX (x, ~x).  */
3527   if (optab_handler (smax_optab, mode) != CODE_FOR_nothing)
3528     {
3529       rtx_insn *last = get_last_insn ();
3530
3531       temp = expand_unop (mode, one_cmpl_optab, op0, NULL_RTX, 0);
3532       if (temp != 0)
3533         temp = expand_binop (mode, smax_optab, op0, temp, target, 0,
3534                              OPTAB_WIDEN);
3535
3536       if (temp != 0)
3537         return temp;
3538
3539       delete_insns_since (last);
3540     }
3541
3542   /* If this machine has expensive jumps, we can do one's complement
3543      absolute value of X as (((signed) x >> (W-1)) ^ x).  */
3544
3545   if (GET_MODE_CLASS (mode) == MODE_INT
3546       && BRANCH_COST (optimize_insn_for_speed_p (),
3547                      false) >= 2)
3548     {
3549       rtx extended = expand_shift (RSHIFT_EXPR, mode, op0,
3550                                    GET_MODE_PRECISION (mode) - 1,
3551                                    NULL_RTX, 0);
3552
3553       temp = expand_binop (mode, xor_optab, extended, op0, target, 0,
3554                            OPTAB_LIB_WIDEN);
3555
3556       if (temp != 0)
3557         return temp;
3558     }
3559
3560   return NULL_RTX;
3561 }
3562
3563 /* A subroutine of expand_copysign, perform the copysign operation using the
3564    abs and neg primitives advertised to exist on the target.  The assumption
3565    is that we have a split register file, and leaving op0 in fp registers,
3566    and not playing with subregs so much, will help the register allocator.  */
3567
3568 static rtx
3569 expand_copysign_absneg (machine_mode mode, rtx op0, rtx op1, rtx target,
3570                         int bitpos, bool op0_is_abs)
3571 {
3572   machine_mode imode;
3573   enum insn_code icode;
3574   rtx sign;
3575   rtx_code_label *label;
3576
3577   if (target == op1)
3578     target = NULL_RTX;
3579
3580   /* Check if the back end provides an insn that handles signbit for the
3581      argument's mode. */
3582   icode = optab_handler (signbit_optab, mode);
3583   if (icode != CODE_FOR_nothing)
3584     {
3585       imode = insn_data[(int) icode].operand[0].mode;
3586       sign = gen_reg_rtx (imode);
3587       emit_unop_insn (icode, sign, op1, UNKNOWN);
3588     }
3589   else
3590     {
3591       if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
3592         {
3593           imode = int_mode_for_mode (mode);
3594           if (imode == BLKmode)
3595             return NULL_RTX;
3596           op1 = gen_lowpart (imode, op1);
3597         }
3598       else
3599         {
3600           int word;
3601
3602           imode = word_mode;
3603           if (FLOAT_WORDS_BIG_ENDIAN)
3604             word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
3605           else
3606             word = bitpos / BITS_PER_WORD;
3607           bitpos = bitpos % BITS_PER_WORD;
3608           op1 = operand_subword_force (op1, word, mode);
3609         }
3610
3611       wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
3612       sign = expand_binop (imode, and_optab, op1,
3613                            immed_wide_int_const (mask, imode),
3614                            NULL_RTX, 1, OPTAB_LIB_WIDEN);
3615     }
3616
3617   if (!op0_is_abs)
3618     {
3619       op0 = expand_unop (mode, abs_optab, op0, target, 0);
3620       if (op0 == NULL)
3621         return NULL_RTX;
3622       target = op0;
3623     }
3624   else
3625     {
3626       if (target == NULL_RTX)
3627         target = copy_to_reg (op0);
3628       else
3629         emit_move_insn (target, op0);
3630     }
3631
3632   label = gen_label_rtx ();
3633   emit_cmp_and_jump_insns (sign, const0_rtx, EQ, NULL_RTX, imode, 1, label);
3634
3635   if (CONST_DOUBLE_AS_FLOAT_P (op0))
3636     op0 = simplify_unary_operation (NEG, mode, op0, mode);
3637   else
3638     op0 = expand_unop (mode, neg_optab, op0, target, 0);
3639   if (op0 != target)
3640     emit_move_insn (target, op0);
3641
3642   emit_label (label);
3643
3644   return target;
3645 }
3646
3647
3648 /* A subroutine of expand_copysign, perform the entire copysign operation
3649    with integer bitmasks.  BITPOS is the position of the sign bit; OP0_IS_ABS
3650    is true if op0 is known to have its sign bit clear.  */
3651
3652 static rtx
3653 expand_copysign_bit (machine_mode mode, rtx op0, rtx op1, rtx target,
3654                      int bitpos, bool op0_is_abs)
3655 {
3656   machine_mode imode;
3657   int word, nwords, i;
3658   rtx temp;
3659   rtx_insn *insns;
3660
3661   if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
3662     {
3663       imode = int_mode_for_mode (mode);
3664       if (imode == BLKmode)
3665         return NULL_RTX;
3666       word = 0;
3667       nwords = 1;
3668     }
3669   else
3670     {
3671       imode = word_mode;
3672
3673       if (FLOAT_WORDS_BIG_ENDIAN)
3674         word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
3675       else
3676         word = bitpos / BITS_PER_WORD;
3677       bitpos = bitpos % BITS_PER_WORD;
3678       nwords = (GET_MODE_BITSIZE (mode) + BITS_PER_WORD - 1) / BITS_PER_WORD;
3679     }
3680
3681   wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
3682
3683   if (target == 0
3684       || target == op0
3685       || target == op1
3686       || (nwords > 1 && !valid_multiword_target_p (target)))
3687     target = gen_reg_rtx (mode);
3688
3689   if (nwords > 1)
3690     {
3691       start_sequence ();
3692
3693       for (i = 0; i < nwords; ++i)
3694         {
3695           rtx targ_piece = operand_subword (target, i, 1, mode);
3696           rtx op0_piece = operand_subword_force (op0, i, mode);
3697
3698           if (i == word)
3699             {
3700               if (!op0_is_abs)
3701                 op0_piece
3702                   = expand_binop (imode, and_optab, op0_piece,
3703                                   immed_wide_int_const (~mask, imode),
3704                                   NULL_RTX, 1, OPTAB_LIB_WIDEN);
3705               op1 = expand_binop (imode, and_optab,
3706                                   operand_subword_force (op1, i, mode),
3707                                   immed_wide_int_const (mask, imode),
3708                                   NULL_RTX, 1, OPTAB_LIB_WIDEN);
3709
3710               temp = expand_binop (imode, ior_optab, op0_piece, op1,
3711                                    targ_piece, 1, OPTAB_LIB_WIDEN);
3712               if (temp != targ_piece)
3713                 emit_move_insn (targ_piece, temp);
3714             }
3715           else
3716             emit_move_insn (targ_piece, op0_piece);
3717         }
3718
3719       insns = get_insns ();
3720       end_sequence ();
3721
3722       emit_insn (insns);
3723     }
3724   else
3725     {
3726       op1 = expand_binop (imode, and_optab, gen_lowpart (imode, op1),
3727                           immed_wide_int_const (mask, imode),
3728                           NULL_RTX, 1, OPTAB_LIB_WIDEN);
3729
3730       op0 = gen_lowpart (imode, op0);
3731       if (!op0_is_abs)
3732         op0 = expand_binop (imode, and_optab, op0,
3733                             immed_wide_int_const (~mask, imode),
3734                             NULL_RTX, 1, OPTAB_LIB_WIDEN);
3735
3736       temp = expand_binop (imode, ior_optab, op0, op1,
3737                            gen_lowpart (imode, target), 1, OPTAB_LIB_WIDEN);
3738       target = lowpart_subreg_maybe_copy (mode, temp, imode);
3739     }
3740
3741   return target;
3742 }
3743
3744 /* Expand the C99 copysign operation.  OP0 and OP1 must be the same
3745    scalar floating point mode.  Return NULL if we do not know how to
3746    expand the operation inline.  */
3747
3748 rtx
3749 expand_copysign (rtx op0, rtx op1, rtx target)
3750 {
3751   machine_mode mode = GET_MODE (op0);
3752   const struct real_format *fmt;
3753   bool op0_is_abs;
3754   rtx temp;
3755
3756   gcc_assert (SCALAR_FLOAT_MODE_P (mode));
3757   gcc_assert (GET_MODE (op1) == mode);
3758
3759   /* First try to do it with a special instruction.  */
3760   temp = expand_binop (mode, copysign_optab, op0, op1,
3761                        target, 0, OPTAB_DIRECT);
3762   if (temp)
3763     return temp;
3764
3765   fmt = REAL_MODE_FORMAT (mode);
3766   if (fmt == NULL || !fmt->has_signed_zero)
3767     return NULL_RTX;
3768
3769   op0_is_abs = false;
3770   if (CONST_DOUBLE_AS_FLOAT_P (op0))
3771     {
3772       if (real_isneg (CONST_DOUBLE_REAL_VALUE (op0)))
3773         op0 = simplify_unary_operation (ABS, mode, op0, mode);
3774       op0_is_abs = true;
3775     }
3776
3777   if (fmt->signbit_ro >= 0
3778       && (CONST_DOUBLE_AS_FLOAT_P (op0)
3779           || (optab_handler (neg_optab, mode) != CODE_FOR_nothing
3780               && optab_handler (abs_optab, mode) != CODE_FOR_nothing)))
3781     {
3782       temp = expand_copysign_absneg (mode, op0, op1, target,
3783                                      fmt->signbit_ro, op0_is_abs);
3784       if (temp)
3785         return temp;
3786     }
3787
3788   if (fmt->signbit_rw < 0)
3789     return NULL_RTX;
3790   return expand_copysign_bit (mode, op0, op1, target,
3791                               fmt->signbit_rw, op0_is_abs);
3792 }
3793 \f
3794 /* Generate an instruction whose insn-code is INSN_CODE,
3795    with two operands: an output TARGET and an input OP0.
3796    TARGET *must* be nonzero, and the output is always stored there.
3797    CODE is an rtx code such that (CODE OP0) is an rtx that describes
3798    the value that is stored into TARGET.
3799
3800    Return false if expansion failed.  */
3801
3802 bool
3803 maybe_emit_unop_insn (enum insn_code icode, rtx target, rtx op0,
3804                       enum rtx_code code)
3805 {
3806   struct expand_operand ops[2];
3807   rtx_insn *pat;
3808
3809   create_output_operand (&ops[0], target, GET_MODE (target));
3810   create_input_operand (&ops[1], op0, GET_MODE (op0));
3811   pat = maybe_gen_insn (icode, 2, ops);
3812   if (!pat)
3813     return false;
3814
3815   if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
3816       && code != UNKNOWN)
3817     add_equal_note (pat, ops[0].value, code, ops[1].value, NULL_RTX);
3818
3819   emit_insn (pat);
3820
3821   if (ops[0].value != target)
3822     emit_move_insn (target, ops[0].value);
3823   return true;
3824 }
3825 /* Generate an instruction whose insn-code is INSN_CODE,
3826    with two operands: an output TARGET and an input OP0.
3827    TARGET *must* be nonzero, and the output is always stored there.
3828    CODE is an rtx code such that (CODE OP0) is an rtx that describes
3829    the value that is stored into TARGET.  */
3830
3831 void
3832 emit_unop_insn (enum insn_code icode, rtx target, rtx op0, enum rtx_code code)
3833 {
3834   bool ok = maybe_emit_unop_insn (icode, target, op0, code);
3835   gcc_assert (ok);
3836 }
3837 \f
3838 struct no_conflict_data
3839 {
3840   rtx target;
3841   rtx_insn *first, *insn;
3842   bool must_stay;
3843 };
3844
3845 /* Called via note_stores by emit_libcall_block.  Set P->must_stay if
3846    the currently examined clobber / store has to stay in the list of
3847    insns that constitute the actual libcall block.  */
3848 static void
3849 no_conflict_move_test (rtx dest, const_rtx set, void *p0)
3850 {
3851   struct no_conflict_data *p= (struct no_conflict_data *) p0;
3852
3853   /* If this inns directly contributes to setting the target, it must stay.  */
3854   if (reg_overlap_mentioned_p (p->target, dest))
3855     p->must_stay = true;
3856   /* If we haven't committed to keeping any other insns in the list yet,
3857      there is nothing more to check.  */
3858   else if (p->insn == p->first)
3859     return;
3860   /* If this insn sets / clobbers a register that feeds one of the insns
3861      already in the list, this insn has to stay too.  */
3862   else if (reg_overlap_mentioned_p (dest, PATTERN (p->first))
3863            || (CALL_P (p->first) && (find_reg_fusage (p->first, USE, dest)))
3864            || reg_used_between_p (dest, p->first, p->insn)
3865            /* Likewise if this insn depends on a register set by a previous
3866               insn in the list, or if it sets a result (presumably a hard
3867               register) that is set or clobbered by a previous insn.
3868               N.B. the modified_*_p (SET_DEST...) tests applied to a MEM
3869               SET_DEST perform the former check on the address, and the latter
3870               check on the MEM.  */
3871            || (GET_CODE (set) == SET
3872                && (modified_in_p (SET_SRC (set), p->first)
3873                    || modified_in_p (SET_DEST (set), p->first)
3874                    || modified_between_p (SET_SRC (set), p->first, p->insn)
3875                    || modified_between_p (SET_DEST (set), p->first, p->insn))))
3876     p->must_stay = true;
3877 }
3878
3879 \f
3880 /* Emit code to make a call to a constant function or a library call.
3881
3882    INSNS is a list containing all insns emitted in the call.
3883    These insns leave the result in RESULT.  Our block is to copy RESULT
3884    to TARGET, which is logically equivalent to EQUIV.
3885
3886    We first emit any insns that set a pseudo on the assumption that these are
3887    loading constants into registers; doing so allows them to be safely cse'ed
3888    between blocks.  Then we emit all the other insns in the block, followed by
3889    an insn to move RESULT to TARGET.  This last insn will have a REQ_EQUAL
3890    note with an operand of EQUIV.  */
3891
3892 static void
3893 emit_libcall_block_1 (rtx_insn *insns, rtx target, rtx result, rtx equiv,
3894                       bool equiv_may_trap)
3895 {
3896   rtx final_dest = target;
3897   rtx_insn *next, *last, *insn;
3898
3899   /* If this is a reg with REG_USERVAR_P set, then it could possibly turn
3900      into a MEM later.  Protect the libcall block from this change.  */
3901   if (! REG_P (target) || REG_USERVAR_P (target))
3902     target = gen_reg_rtx (GET_MODE (target));
3903
3904   /* If we're using non-call exceptions, a libcall corresponding to an
3905      operation that may trap may also trap.  */
3906   /* ??? See the comment in front of make_reg_eh_region_note.  */
3907   if (cfun->can_throw_non_call_exceptions
3908       && (equiv_may_trap || may_trap_p (equiv)))
3909     {
3910       for (insn = insns; insn; insn = NEXT_INSN (insn))
3911         if (CALL_P (insn))
3912           {
3913             rtx note = find_reg_note (insn, REG_EH_REGION, NULL_RTX);
3914             if (note)
3915               {
3916                 int lp_nr = INTVAL (XEXP (note, 0));
3917                 if (lp_nr == 0 || lp_nr == INT_MIN)
3918                   remove_note (insn, note);
3919               }
3920           }
3921     }
3922   else
3923     {
3924       /* Look for any CALL_INSNs in this sequence, and attach a REG_EH_REGION
3925          reg note to indicate that this call cannot throw or execute a nonlocal
3926          goto (unless there is already a REG_EH_REGION note, in which case
3927          we update it).  */
3928       for (insn = insns; insn; insn = NEXT_INSN (insn))
3929         if (CALL_P (insn))
3930           make_reg_eh_region_note_nothrow_nononlocal (insn);
3931     }
3932
3933   /* First emit all insns that set pseudos.  Remove them from the list as
3934      we go.  Avoid insns that set pseudos which were referenced in previous
3935      insns.  These can be generated by move_by_pieces, for example,
3936      to update an address.  Similarly, avoid insns that reference things
3937      set in previous insns.  */
3938
3939   for (insn = insns; insn; insn = next)
3940     {
3941       rtx set = single_set (insn);
3942
3943       next = NEXT_INSN (insn);
3944
3945       if (set != 0 && REG_P (SET_DEST (set))
3946           && REGNO (SET_DEST (set)) >= FIRST_PSEUDO_REGISTER)
3947         {
3948           struct no_conflict_data data;
3949
3950           data.target = const0_rtx;
3951           data.first = insns;
3952           data.insn = insn;
3953           data.must_stay = 0;
3954           note_stores (PATTERN (insn), no_conflict_move_test, &data);
3955           if (! data.must_stay)
3956             {
3957               if (PREV_INSN (insn))
3958                 SET_NEXT_INSN (PREV_INSN (insn)) = next;
3959               else
3960                 insns = next;
3961
3962               if (next)
3963                 SET_PREV_INSN (next) = PREV_INSN (insn);
3964
3965               add_insn (insn);
3966             }
3967         }
3968
3969       /* Some ports use a loop to copy large arguments onto the stack.
3970          Don't move anything outside such a loop.  */
3971       if (LABEL_P (insn))
3972         break;
3973     }
3974
3975   /* Write the remaining insns followed by the final copy.  */
3976   for (insn = insns; insn; insn = next)
3977     {
3978       next = NEXT_INSN (insn);
3979
3980       add_insn (insn);
3981     }
3982
3983   last = emit_move_insn (target, result);
3984   set_dst_reg_note (last, REG_EQUAL, copy_rtx (equiv), target);
3985
3986   if (final_dest != target)
3987     emit_move_insn (final_dest, target);
3988 }
3989
3990 void
3991 emit_libcall_block (rtx insns, rtx target, rtx result, rtx equiv)
3992 {
3993   emit_libcall_block_1 (safe_as_a <rtx_insn *> (insns),
3994                         target, result, equiv, false);
3995 }
3996 \f
3997 /* Nonzero if we can perform a comparison of mode MODE straightforwardly.
3998    PURPOSE describes how this comparison will be used.  CODE is the rtx
3999    comparison code we will be using.
4000
4001    ??? Actually, CODE is slightly weaker than that.  A target is still
4002    required to implement all of the normal bcc operations, but not
4003    required to implement all (or any) of the unordered bcc operations.  */
4004
4005 int
4006 can_compare_p (enum rtx_code code, machine_mode mode,
4007                enum can_compare_purpose purpose)
4008 {
4009   rtx test;
4010   test = gen_rtx_fmt_ee (code, mode, const0_rtx, const0_rtx);
4011   do
4012     {
4013       enum insn_code icode;
4014
4015       if (purpose == ccp_jump
4016           && (icode = optab_handler (cbranch_optab, mode)) != CODE_FOR_nothing
4017           && insn_operand_matches (icode, 0, test))
4018         return 1;
4019       if (purpose == ccp_store_flag
4020           && (icode = optab_handler (cstore_optab, mode)) != CODE_FOR_nothing
4021           && insn_operand_matches (icode, 1, test))
4022         return 1;
4023       if (purpose == ccp_cmov
4024           && optab_handler (cmov_optab, mode) != CODE_FOR_nothing)
4025         return 1;
4026
4027       mode = GET_MODE_WIDER_MODE (mode);
4028       PUT_MODE (test, mode);
4029     }
4030   while (mode != VOIDmode);
4031
4032   return 0;
4033 }
4034
4035 /* This function is called when we are going to emit a compare instruction that
4036    compares the values found in *PX and *PY, using the rtl operator COMPARISON.
4037
4038    *PMODE is the mode of the inputs (in case they are const_int).
4039    *PUNSIGNEDP nonzero says that the operands are unsigned;
4040    this matters if they need to be widened (as given by METHODS).
4041
4042    If they have mode BLKmode, then SIZE specifies the size of both operands.
4043
4044    This function performs all the setup necessary so that the caller only has
4045    to emit a single comparison insn.  This setup can involve doing a BLKmode
4046    comparison or emitting a library call to perform the comparison if no insn
4047    is available to handle it.
4048    The values which are passed in through pointers can be modified; the caller
4049    should perform the comparison on the modified values.  Constant
4050    comparisons must have already been folded.  */
4051
4052 static void
4053 prepare_cmp_insn (rtx x, rtx y, enum rtx_code comparison, rtx size,
4054                   int unsignedp, enum optab_methods methods,
4055                   rtx *ptest, machine_mode *pmode)
4056 {
4057   machine_mode mode = *pmode;
4058   rtx libfunc, test;
4059   machine_mode cmp_mode;
4060   enum mode_class mclass;
4061
4062   /* The other methods are not needed.  */
4063   gcc_assert (methods == OPTAB_DIRECT || methods == OPTAB_WIDEN
4064               || methods == OPTAB_LIB_WIDEN);
4065
4066   /* If we are optimizing, force expensive constants into a register.  */
4067   if (CONSTANT_P (x) && optimize
4068       && (rtx_cost (x, COMPARE, 0, optimize_insn_for_speed_p ())
4069           > COSTS_N_INSNS (1)))
4070     x = force_reg (mode, x);
4071
4072   if (CONSTANT_P (y) && optimize
4073       && (rtx_cost (y, COMPARE, 1, optimize_insn_for_speed_p ())
4074           > COSTS_N_INSNS (1)))
4075     y = force_reg (mode, y);
4076
4077 #if HAVE_cc0
4078   /* Make sure if we have a canonical comparison.  The RTL
4079      documentation states that canonical comparisons are required only
4080      for targets which have cc0.  */
4081   gcc_assert (!CONSTANT_P (x) || CONSTANT_P (y));
4082 #endif
4083
4084   /* Don't let both operands fail to indicate the mode.  */
4085   if (GET_MODE (x) == VOIDmode && GET_MODE (y) == VOIDmode)
4086     x = force_reg (mode, x);
4087   if (mode == VOIDmode)
4088     mode = GET_MODE (x) != VOIDmode ? GET_MODE (x) : GET_MODE (y);
4089
4090   /* Handle all BLKmode compares.  */
4091
4092   if (mode == BLKmode)
4093     {
4094       machine_mode result_mode;
4095       enum insn_code cmp_code;
4096       tree length_type;
4097       rtx libfunc;
4098       rtx result;
4099       rtx opalign
4100         = GEN_INT (MIN (MEM_ALIGN (x), MEM_ALIGN (y)) / BITS_PER_UNIT);
4101
4102       gcc_assert (size);
4103
4104       /* Try to use a memory block compare insn - either cmpstr
4105          or cmpmem will do.  */
4106       for (cmp_mode = GET_CLASS_NARROWEST_MODE (MODE_INT);
4107            cmp_mode != VOIDmode;
4108            cmp_mode = GET_MODE_WIDER_MODE (cmp_mode))
4109         {
4110           cmp_code = direct_optab_handler (cmpmem_optab, cmp_mode);
4111           if (cmp_code == CODE_FOR_nothing)
4112             cmp_code = direct_optab_handler (cmpstr_optab, cmp_mode);
4113           if (cmp_code == CODE_FOR_nothing)
4114             cmp_code = direct_optab_handler (cmpstrn_optab, cmp_mode);
4115           if (cmp_code == CODE_FOR_nothing)
4116             continue;
4117
4118           /* Must make sure the size fits the insn's mode.  */
4119           if ((CONST_INT_P (size)
4120                && INTVAL (size) >= (1 << GET_MODE_BITSIZE (cmp_mode)))
4121               || (GET_MODE_BITSIZE (GET_MODE (size))
4122                   > GET_MODE_BITSIZE (cmp_mode)))
4123             continue;
4124
4125           result_mode = insn_data[cmp_code].operand[0].mode;
4126           result = gen_reg_rtx (result_mode);
4127           size = convert_to_mode (cmp_mode, size, 1);
4128           emit_insn (GEN_FCN (cmp_code) (result, x, y, size, opalign));
4129
4130           *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, result, const0_rtx);
4131           *pmode = result_mode;
4132           return;
4133         }
4134
4135       if (methods != OPTAB_LIB && methods != OPTAB_LIB_WIDEN)
4136         goto fail;
4137
4138       /* Otherwise call a library function, memcmp.  */
4139       libfunc = memcmp_libfunc;
4140       length_type = sizetype;
4141       result_mode = TYPE_MODE (integer_type_node);
4142       cmp_mode = TYPE_MODE (length_type);
4143       size = convert_to_mode (TYPE_MODE (length_type), size,
4144                               TYPE_UNSIGNED (length_type));
4145
4146       result = emit_library_call_value (libfunc, 0, LCT_PURE,
4147                                         result_mode, 3,
4148                                         XEXP (x, 0), Pmode,
4149                                         XEXP (y, 0), Pmode,
4150                                         size, cmp_mode);
4151       x = result;
4152       y = const0_rtx;
4153       mode = result_mode;
4154       methods = OPTAB_LIB_WIDEN;
4155       unsignedp = false;
4156     }
4157
4158   /* Don't allow operands to the compare to trap, as that can put the
4159      compare and branch in different basic blocks.  */
4160   if (cfun->can_throw_non_call_exceptions)
4161     {
4162       if (may_trap_p (x))
4163         x = force_reg (mode, x);
4164       if (may_trap_p (y))
4165         y = force_reg (mode, y);
4166     }
4167
4168   if (GET_MODE_CLASS (mode) == MODE_CC)
4169     {
4170       enum insn_code icode = optab_handler (cbranch_optab, CCmode);
4171       test = gen_rtx_fmt_ee (comparison, VOIDmode, x, y);
4172       gcc_assert (icode != CODE_FOR_nothing
4173                   && insn_operand_matches (icode, 0, test));
4174       *ptest = test;
4175       return;
4176     }
4177
4178   mclass = GET_MODE_CLASS (mode);
4179   test = gen_rtx_fmt_ee (comparison, VOIDmode, x, y);
4180   cmp_mode = mode;
4181   do
4182    {
4183       enum insn_code icode;
4184       icode = optab_handler (cbranch_optab, cmp_mode);
4185       if (icode != CODE_FOR_nothing
4186           && insn_operand_matches (icode, 0, test))
4187         {
4188           rtx_insn *last = get_last_insn ();
4189           rtx op0 = prepare_operand (icode, x, 1, mode, cmp_mode, unsignedp);
4190           rtx op1 = prepare_operand (icode, y, 2, mode, cmp_mode, unsignedp);
4191           if (op0 && op1
4192               && insn_operand_matches (icode, 1, op0)
4193               && insn_operand_matches (icode, 2, op1))
4194             {
4195               XEXP (test, 0) = op0;
4196               XEXP (test, 1) = op1;
4197               *ptest = test;
4198               *pmode = cmp_mode;
4199               return;
4200             }
4201           delete_insns_since (last);
4202         }
4203
4204       if (methods == OPTAB_DIRECT || !CLASS_HAS_WIDER_MODES_P (mclass))
4205         break;
4206       cmp_mode = GET_MODE_WIDER_MODE (cmp_mode);
4207     }
4208   while (cmp_mode != VOIDmode);
4209
4210   if (methods != OPTAB_LIB_WIDEN)
4211     goto fail;
4212
4213   if (!SCALAR_FLOAT_MODE_P (mode))
4214     {
4215       rtx result;
4216       machine_mode ret_mode;
4217
4218       /* Handle a libcall just for the mode we are using.  */
4219       libfunc = optab_libfunc (cmp_optab, mode);
4220       gcc_assert (libfunc);
4221
4222       /* If we want unsigned, and this mode has a distinct unsigned
4223          comparison routine, use that.  */
4224       if (unsignedp)
4225         {
4226           rtx ulibfunc = optab_libfunc (ucmp_optab, mode);
4227           if (ulibfunc)
4228             libfunc = ulibfunc;
4229         }
4230
4231       ret_mode = targetm.libgcc_cmp_return_mode ();
4232       result = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
4233                                         ret_mode, 2, x, mode, y, mode);
4234
4235       /* There are two kinds of comparison routines. Biased routines
4236          return 0/1/2, and unbiased routines return -1/0/1. Other parts
4237          of gcc expect that the comparison operation is equivalent
4238          to the modified comparison. For signed comparisons compare the
4239          result against 1 in the biased case, and zero in the unbiased
4240          case. For unsigned comparisons always compare against 1 after
4241          biasing the unbiased result by adding 1. This gives us a way to
4242          represent LTU.
4243          The comparisons in the fixed-point helper library are always
4244          biased.  */
4245       x = result;
4246       y = const1_rtx;
4247
4248       if (!TARGET_LIB_INT_CMP_BIASED && !ALL_FIXED_POINT_MODE_P (mode))
4249         {
4250           if (unsignedp)
4251             x = plus_constant (ret_mode, result, 1);
4252           else
4253             y = const0_rtx;
4254         }
4255
4256       *pmode = ret_mode;
4257       prepare_cmp_insn (x, y, comparison, NULL_RTX, unsignedp, methods,
4258                         ptest, pmode);
4259     }
4260   else
4261     prepare_float_lib_cmp (x, y, comparison, ptest, pmode);
4262
4263   return;
4264
4265  fail:
4266   *ptest = NULL_RTX;
4267 }
4268
4269 /* Before emitting an insn with code ICODE, make sure that X, which is going
4270    to be used for operand OPNUM of the insn, is converted from mode MODE to
4271    WIDER_MODE (UNSIGNEDP determines whether it is an unsigned conversion), and
4272    that it is accepted by the operand predicate.  Return the new value.  */
4273
4274 rtx
4275 prepare_operand (enum insn_code icode, rtx x, int opnum, machine_mode mode,
4276                  machine_mode wider_mode, int unsignedp)
4277 {
4278   if (mode != wider_mode)
4279     x = convert_modes (wider_mode, mode, x, unsignedp);
4280
4281   if (!insn_operand_matches (icode, opnum, x))
4282     {
4283       machine_mode op_mode = insn_data[(int) icode].operand[opnum].mode;
4284       if (reload_completed)
4285         return NULL_RTX;
4286       if (GET_MODE (x) != op_mode && GET_MODE (x) != VOIDmode)
4287         return NULL_RTX;
4288       x = copy_to_mode_reg (op_mode, x);
4289     }
4290
4291   return x;
4292 }
4293
4294 /* Subroutine of emit_cmp_and_jump_insns; this function is called when we know
4295    we can do the branch.  */
4296
4297 static void
4298 emit_cmp_and_jump_insn_1 (rtx test, machine_mode mode, rtx label, int prob)
4299 {
4300   machine_mode optab_mode;
4301   enum mode_class mclass;
4302   enum insn_code icode;
4303   rtx_insn *insn;
4304
4305   mclass = GET_MODE_CLASS (mode);
4306   optab_mode = (mclass == MODE_CC) ? CCmode : mode;
4307   icode = optab_handler (cbranch_optab, optab_mode);
4308
4309   gcc_assert (icode != CODE_FOR_nothing);
4310   gcc_assert (insn_operand_matches (icode, 0, test));
4311   insn = emit_jump_insn (GEN_FCN (icode) (test, XEXP (test, 0),
4312                                           XEXP (test, 1), label));
4313   if (prob != -1
4314       && profile_status_for_fn (cfun) != PROFILE_ABSENT
4315       && insn
4316       && JUMP_P (insn)
4317       && any_condjump_p (insn)
4318       && !find_reg_note (insn, REG_BR_PROB, 0))
4319     add_int_reg_note (insn, REG_BR_PROB, prob);
4320 }
4321
4322 /* Generate code to compare X with Y so that the condition codes are
4323    set and to jump to LABEL if the condition is true.  If X is a
4324    constant and Y is not a constant, then the comparison is swapped to
4325    ensure that the comparison RTL has the canonical form.
4326
4327    UNSIGNEDP nonzero says that X and Y are unsigned; this matters if they
4328    need to be widened.  UNSIGNEDP is also used to select the proper
4329    branch condition code.
4330
4331    If X and Y have mode BLKmode, then SIZE specifies the size of both X and Y.
4332
4333    MODE is the mode of the inputs (in case they are const_int).
4334
4335    COMPARISON is the rtl operator to compare with (EQ, NE, GT, etc.).
4336    It will be potentially converted into an unsigned variant based on
4337    UNSIGNEDP to select a proper jump instruction.
4338
4339    PROB is the probability of jumping to LABEL.  */
4340
4341 void
4342 emit_cmp_and_jump_insns (rtx x, rtx y, enum rtx_code comparison, rtx size,
4343                          machine_mode mode, int unsignedp, rtx label,
4344                          int prob)
4345 {
4346   rtx op0 = x, op1 = y;
4347   rtx test;
4348
4349   /* Swap operands and condition to ensure canonical RTL.  */
4350   if (swap_commutative_operands_p (x, y)
4351       && can_compare_p (swap_condition (comparison), mode, ccp_jump))
4352     {
4353       op0 = y, op1 = x;
4354       comparison = swap_condition (comparison);
4355     }
4356
4357   /* If OP0 is still a constant, then both X and Y must be constants
4358      or the opposite comparison is not supported.  Force X into a register
4359      to create canonical RTL.  */
4360   if (CONSTANT_P (op0))
4361     op0 = force_reg (mode, op0);
4362
4363   if (unsignedp)
4364     comparison = unsigned_condition (comparison);
4365
4366   prepare_cmp_insn (op0, op1, comparison, size, unsignedp, OPTAB_LIB_WIDEN,
4367                     &test, &mode);
4368   emit_cmp_and_jump_insn_1 (test, mode, label, prob);
4369 }
4370
4371 \f
4372 /* Emit a library call comparison between floating point X and Y.
4373    COMPARISON is the rtl operator to compare with (EQ, NE, GT, etc.).  */
4374
4375 static void
4376 prepare_float_lib_cmp (rtx x, rtx y, enum rtx_code comparison,
4377                        rtx *ptest, machine_mode *pmode)
4378 {
4379   enum rtx_code swapped = swap_condition (comparison);
4380   enum rtx_code reversed = reverse_condition_maybe_unordered (comparison);
4381   machine_mode orig_mode = GET_MODE (x);
4382   machine_mode mode, cmp_mode;
4383   rtx true_rtx, false_rtx;
4384   rtx value, target, equiv;
4385   rtx_insn *insns;
4386   rtx libfunc = 0;
4387   bool reversed_p = false;
4388   cmp_mode = targetm.libgcc_cmp_return_mode ();
4389
4390   for (mode = orig_mode;
4391        mode != VOIDmode;
4392        mode = GET_MODE_WIDER_MODE (mode))
4393     {
4394       if (code_to_optab (comparison)
4395           && (libfunc = optab_libfunc (code_to_optab (comparison), mode)))
4396         break;
4397
4398       if (code_to_optab (swapped)
4399           && (libfunc = optab_libfunc (code_to_optab (swapped), mode)))
4400         {
4401           rtx tmp;
4402           tmp = x; x = y; y = tmp;
4403           comparison = swapped;
4404           break;
4405         }
4406
4407       if (code_to_optab (reversed)
4408           && (libfunc = optab_libfunc (code_to_optab (reversed), mode)))
4409         {
4410           comparison = reversed;
4411           reversed_p = true;
4412           break;
4413         }
4414     }
4415
4416   gcc_assert (mode != VOIDmode);
4417
4418   if (mode != orig_mode)
4419     {
4420       x = convert_to_mode (mode, x, 0);
4421       y = convert_to_mode (mode, y, 0);
4422     }
4423
4424   /* Attach a REG_EQUAL note describing the semantics of the libcall to
4425      the RTL.  The allows the RTL optimizers to delete the libcall if the
4426      condition can be determined at compile-time.  */
4427   if (comparison == UNORDERED
4428       || FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison))
4429     {
4430       true_rtx = const_true_rtx;
4431       false_rtx = const0_rtx;
4432     }
4433   else
4434     {
4435       switch (comparison)
4436         {
4437         case EQ:
4438           true_rtx = const0_rtx;
4439           false_rtx = const_true_rtx;
4440           break;
4441
4442         case NE:
4443           true_rtx = const_true_rtx;
4444           false_rtx = const0_rtx;
4445           break;
4446
4447         case GT:
4448           true_rtx = const1_rtx;
4449           false_rtx = const0_rtx;
4450           break;
4451
4452         case GE:
4453           true_rtx = const0_rtx;
4454           false_rtx = constm1_rtx;
4455           break;
4456
4457         case LT:
4458           true_rtx = constm1_rtx;
4459           false_rtx = const0_rtx;
4460           break;
4461
4462         case LE:
4463           true_rtx = const0_rtx;
4464           false_rtx = const1_rtx;
4465           break;
4466
4467         default:
4468           gcc_unreachable ();
4469         }
4470     }
4471
4472   if (comparison == UNORDERED)
4473     {
4474       rtx temp = simplify_gen_relational (NE, cmp_mode, mode, x, x);
4475       equiv = simplify_gen_relational (NE, cmp_mode, mode, y, y);
4476       equiv = simplify_gen_ternary (IF_THEN_ELSE, cmp_mode, cmp_mode,
4477                                     temp, const_true_rtx, equiv);
4478     }
4479   else
4480     {
4481       equiv = simplify_gen_relational (comparison, cmp_mode, mode, x, y);
4482       if (! FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison))
4483         equiv = simplify_gen_ternary (IF_THEN_ELSE, cmp_mode, cmp_mode,
4484                                       equiv, true_rtx, false_rtx);
4485     }
4486
4487   start_sequence ();
4488   value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
4489                                    cmp_mode, 2, x, mode, y, mode);
4490   insns = get_insns ();
4491   end_sequence ();
4492
4493   target = gen_reg_rtx (cmp_mode);
4494   emit_libcall_block (insns, target, value, equiv);
4495
4496   if (comparison == UNORDERED
4497       || FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison)
4498       || reversed_p)
4499     *ptest = gen_rtx_fmt_ee (reversed_p ? EQ : NE, VOIDmode, target, false_rtx);
4500   else
4501     *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, target, const0_rtx);
4502
4503   *pmode = cmp_mode;
4504 }
4505 \f
4506 /* Generate code to indirectly jump to a location given in the rtx LOC.  */
4507
4508 void
4509 emit_indirect_jump (rtx loc ATTRIBUTE_UNUSED)
4510 {
4511 #ifndef HAVE_indirect_jump
4512   sorry ("indirect jumps are not available on this target");
4513 #else
4514   struct expand_operand ops[1];
4515   create_address_operand (&ops[0], loc);
4516   expand_jump_insn (CODE_FOR_indirect_jump, 1, ops);
4517   emit_barrier ();
4518 #endif
4519 }
4520 \f
4521 #ifdef HAVE_conditional_move
4522
4523 /* Emit a conditional move instruction if the machine supports one for that
4524    condition and machine mode.
4525
4526    OP0 and OP1 are the operands that should be compared using CODE.  CMODE is
4527    the mode to use should they be constants.  If it is VOIDmode, they cannot
4528    both be constants.
4529
4530    OP2 should be stored in TARGET if the comparison is true, otherwise OP3
4531    should be stored there.  MODE is the mode to use should they be constants.
4532    If it is VOIDmode, they cannot both be constants.
4533
4534    The result is either TARGET (perhaps modified) or NULL_RTX if the operation
4535    is not supported.  */
4536
4537 rtx
4538 emit_conditional_move (rtx target, enum rtx_code code, rtx op0, rtx op1,
4539                        machine_mode cmode, rtx op2, rtx op3,
4540                        machine_mode mode, int unsignedp)
4541 {
4542   rtx comparison;
4543   rtx_insn *last;
4544   enum insn_code icode;
4545   enum rtx_code reversed;
4546
4547   /* If one operand is constant, make it the second one.  Only do this
4548      if the other operand is not constant as well.  */
4549
4550   if (swap_commutative_operands_p (op0, op1))
4551     {
4552       std::swap (op0, op1);
4553       code = swap_condition (code);
4554     }
4555
4556   /* get_condition will prefer to generate LT and GT even if the old
4557      comparison was against zero, so undo that canonicalization here since
4558      comparisons against zero are cheaper.  */
4559   if (code == LT && op1 == const1_rtx)
4560     code = LE, op1 = const0_rtx;
4561   else if (code == GT && op1 == constm1_rtx)
4562     code = GE, op1 = const0_rtx;
4563
4564   if (cmode == VOIDmode)
4565     cmode = GET_MODE (op0);
4566
4567   if (swap_commutative_operands_p (op2, op3)
4568       && ((reversed = reversed_comparison_code_parts (code, op0, op1, NULL))
4569           != UNKNOWN))
4570     {
4571       std::swap (op2, op3);
4572       code = reversed;
4573     }
4574
4575   if (mode == VOIDmode)
4576     mode = GET_MODE (op2);
4577
4578   icode = direct_optab_handler (movcc_optab, mode);
4579
4580   if (icode == CODE_FOR_nothing)
4581     return 0;
4582
4583   if (!target)
4584     target = gen_reg_rtx (mode);
4585
4586   code = unsignedp ? unsigned_condition (code) : code;
4587   comparison = simplify_gen_relational (code, VOIDmode, cmode, op0, op1);
4588
4589   /* We can get const0_rtx or const_true_rtx in some circumstances.  Just
4590      return NULL and let the caller figure out how best to deal with this
4591      situation.  */
4592   if (!COMPARISON_P (comparison))
4593     return NULL_RTX;
4594
4595   saved_pending_stack_adjust save;
4596   save_pending_stack_adjust (&save);
4597   last = get_last_insn ();
4598   do_pending_stack_adjust ();
4599   prepare_cmp_insn (XEXP (comparison, 0), XEXP (comparison, 1),
4600                     GET_CODE (comparison), NULL_RTX, unsignedp, OPTAB_WIDEN,
4601                     &comparison, &cmode);
4602   if (comparison)
4603     {
4604       struct expand_operand ops[4];
4605
4606       create_output_operand (&ops[0], target, mode);
4607       create_fixed_operand (&ops[1], comparison);
4608       create_input_operand (&ops[2], op2, mode);
4609       create_input_operand (&ops[3], op3, mode);
4610       if (maybe_expand_insn (icode, 4, ops))
4611         {
4612           if (ops[0].value != target)
4613             convert_move (target, ops[0].value, false);
4614           return target;
4615         }
4616     }
4617   delete_insns_since (last);
4618   restore_pending_stack_adjust (&save);
4619   return NULL_RTX;
4620 }
4621
4622 /* Return nonzero if a conditional move of mode MODE is supported.
4623
4624    This function is for combine so it can tell whether an insn that looks
4625    like a conditional move is actually supported by the hardware.  If we
4626    guess wrong we lose a bit on optimization, but that's it.  */
4627 /* ??? sparc64 supports conditionally moving integers values based on fp
4628    comparisons, and vice versa.  How do we handle them?  */
4629
4630 int
4631 can_conditionally_move_p (machine_mode mode)
4632 {
4633   if (direct_optab_handler (movcc_optab, mode) != CODE_FOR_nothing)
4634     return 1;
4635
4636   return 0;
4637 }
4638
4639 #endif /* HAVE_conditional_move */
4640
4641 /* Emit a conditional addition instruction if the machine supports one for that
4642    condition and machine mode.
4643
4644    OP0 and OP1 are the operands that should be compared using CODE.  CMODE is
4645    the mode to use should they be constants.  If it is VOIDmode, they cannot
4646    both be constants.
4647
4648    OP2 should be stored in TARGET if the comparison is false, otherwise OP2+OP3
4649    should be stored there.  MODE is the mode to use should they be constants.
4650    If it is VOIDmode, they cannot both be constants.
4651
4652    The result is either TARGET (perhaps modified) or NULL_RTX if the operation
4653    is not supported.  */
4654
4655 rtx
4656 emit_conditional_add (rtx target, enum rtx_code code, rtx op0, rtx op1,
4657                       machine_mode cmode, rtx op2, rtx op3,
4658                       machine_mode mode, int unsignedp)
4659 {
4660   rtx comparison;
4661   rtx_insn *last;
4662   enum insn_code icode;
4663
4664   /* If one operand is constant, make it the second one.  Only do this
4665      if the other operand is not constant as well.  */
4666
4667   if (swap_commutative_operands_p (op0, op1))
4668     {
4669       std::swap (op0, op1);
4670       code = swap_condition (code);
4671     }
4672
4673   /* get_condition will prefer to generate LT and GT even if the old
4674      comparison was against zero, so undo that canonicalization here since
4675      comparisons against zero are cheaper.  */
4676   if (code == LT && op1 == const1_rtx)
4677     code = LE, op1 = const0_rtx;
4678   else if (code == GT && op1 == constm1_rtx)
4679     code = GE, op1 = const0_rtx;
4680
4681   if (cmode == VOIDmode)
4682     cmode = GET_MODE (op0);
4683
4684   if (mode == VOIDmode)
4685     mode = GET_MODE (op2);
4686
4687   icode = optab_handler (addcc_optab, mode);
4688
4689   if (icode == CODE_FOR_nothing)
4690     return 0;
4691
4692   if (!target)
4693     target = gen_reg_rtx (mode);
4694
4695   code = unsignedp ? unsigned_condition (code) : code;
4696   comparison = simplify_gen_relational (code, VOIDmode, cmode, op0, op1);
4697
4698   /* We can get const0_rtx or const_true_rtx in some circumstances.  Just
4699      return NULL and let the caller figure out how best to deal with this
4700      situation.  */
4701   if (!COMPARISON_P (comparison))
4702     return NULL_RTX;
4703
4704   do_pending_stack_adjust ();
4705   last = get_last_insn ();
4706   prepare_cmp_insn (XEXP (comparison, 0), XEXP (comparison, 1),
4707                     GET_CODE (comparison), NULL_RTX, unsignedp, OPTAB_WIDEN,
4708                     &comparison, &cmode);
4709   if (comparison)
4710     {
4711       struct expand_operand ops[4];
4712
4713       create_output_operand (&ops[0], target, mode);
4714       create_fixed_operand (&ops[1], comparison);
4715       create_input_operand (&ops[2], op2, mode);
4716       create_input_operand (&ops[3], op3, mode);
4717       if (maybe_expand_insn (icode, 4, ops))
4718         {
4719           if (ops[0].value != target)
4720             convert_move (target, ops[0].value, false);
4721           return target;
4722         }
4723     }
4724   delete_insns_since (last);
4725   return NULL_RTX;
4726 }
4727 \f
4728 /* These functions attempt to generate an insn body, rather than
4729    emitting the insn, but if the gen function already emits them, we
4730    make no attempt to turn them back into naked patterns.  */
4731
4732 /* Generate and return an insn body to add Y to X.  */
4733
4734 rtx
4735 gen_add2_insn (rtx x, rtx y)
4736 {
4737   enum insn_code icode = optab_handler (add_optab, GET_MODE (x));
4738
4739   gcc_assert (insn_operand_matches (icode, 0, x));
4740   gcc_assert (insn_operand_matches (icode, 1, x));
4741   gcc_assert (insn_operand_matches (icode, 2, y));
4742
4743   return GEN_FCN (icode) (x, x, y);
4744 }
4745
4746 /* Generate and return an insn body to add r1 and c,
4747    storing the result in r0.  */
4748
4749 rtx
4750 gen_add3_insn (rtx r0, rtx r1, rtx c)
4751 {
4752   enum insn_code icode = optab_handler (add_optab, GET_MODE (r0));
4753
4754   if (icode == CODE_FOR_nothing
4755       || !insn_operand_matches (icode, 0, r0)
4756       || !insn_operand_matches (icode, 1, r1)
4757       || !insn_operand_matches (icode, 2, c))
4758     return NULL_RTX;
4759
4760   return GEN_FCN (icode) (r0, r1, c);
4761 }
4762
4763 int
4764 have_add2_insn (rtx x, rtx y)
4765 {
4766   enum insn_code icode;
4767
4768   gcc_assert (GET_MODE (x) != VOIDmode);
4769
4770   icode = optab_handler (add_optab, GET_MODE (x));
4771
4772   if (icode == CODE_FOR_nothing)
4773     return 0;
4774
4775   if (!insn_operand_matches (icode, 0, x)
4776       || !insn_operand_matches (icode, 1, x)
4777       || !insn_operand_matches (icode, 2, y))
4778     return 0;
4779
4780   return 1;
4781 }
4782
4783 /* Generate and return an insn body to add Y to X.  */
4784
4785 rtx
4786 gen_addptr3_insn (rtx x, rtx y, rtx z)
4787 {
4788   enum insn_code icode = optab_handler (addptr3_optab, GET_MODE (x));
4789
4790   gcc_assert (insn_operand_matches (icode, 0, x));
4791   gcc_assert (insn_operand_matches (icode, 1, y));
4792   gcc_assert (insn_operand_matches (icode, 2, z));
4793
4794   return GEN_FCN (icode) (x, y, z);
4795 }
4796
4797 /* Return true if the target implements an addptr pattern and X, Y,
4798    and Z are valid for the pattern predicates.  */
4799
4800 int
4801 have_addptr3_insn (rtx x, rtx y, rtx z)
4802 {
4803   enum insn_code icode;
4804
4805   gcc_assert (GET_MODE (x) != VOIDmode);
4806
4807   icode = optab_handler (addptr3_optab, GET_MODE (x));
4808
4809   if (icode == CODE_FOR_nothing)
4810     return 0;
4811
4812   if (!insn_operand_matches (icode, 0, x)
4813       || !insn_operand_matches (icode, 1, y)
4814       || !insn_operand_matches (icode, 2, z))
4815     return 0;
4816
4817   return 1;
4818 }
4819
4820 /* Generate and return an insn body to subtract Y from X.  */
4821
4822 rtx
4823 gen_sub2_insn (rtx x, rtx y)
4824 {
4825   enum insn_code icode = optab_handler (sub_optab, GET_MODE (x));
4826
4827   gcc_assert (insn_operand_matches (icode, 0, x));
4828   gcc_assert (insn_operand_matches (icode, 1, x));
4829   gcc_assert (insn_operand_matches (icode, 2, y));
4830
4831   return GEN_FCN (icode) (x, x, y);
4832 }
4833
4834 /* Generate and return an insn body to subtract r1 and c,
4835    storing the result in r0.  */
4836
4837 rtx
4838 gen_sub3_insn (rtx r0, rtx r1, rtx c)
4839 {
4840   enum insn_code icode = optab_handler (sub_optab, GET_MODE (r0));
4841
4842   if (icode == CODE_FOR_nothing
4843       || !insn_operand_matches (icode, 0, r0)
4844       || !insn_operand_matches (icode, 1, r1)
4845       || !insn_operand_matches (icode, 2, c))
4846     return NULL_RTX;
4847
4848   return GEN_FCN (icode) (r0, r1, c);
4849 }
4850
4851 int
4852 have_sub2_insn (rtx x, rtx y)
4853 {
4854   enum insn_code icode;
4855
4856   gcc_assert (GET_MODE (x) != VOIDmode);
4857
4858   icode = optab_handler (sub_optab, GET_MODE (x));
4859
4860   if (icode == CODE_FOR_nothing)
4861     return 0;
4862
4863   if (!insn_operand_matches (icode, 0, x)
4864       || !insn_operand_matches (icode, 1, x)
4865       || !insn_operand_matches (icode, 2, y))
4866     return 0;
4867
4868   return 1;
4869 }
4870 \f
4871 /* Return the insn code used to extend FROM_MODE to TO_MODE.
4872    UNSIGNEDP specifies zero-extension instead of sign-extension.  If
4873    no such operation exists, CODE_FOR_nothing will be returned.  */
4874
4875 enum insn_code
4876 can_extend_p (machine_mode to_mode, machine_mode from_mode,
4877               int unsignedp)
4878 {
4879   convert_optab tab;
4880 #ifdef HAVE_ptr_extend
4881   if (unsignedp < 0)
4882     return CODE_FOR_ptr_extend;
4883 #endif
4884
4885   tab = unsignedp ? zext_optab : sext_optab;
4886   return convert_optab_handler (tab, to_mode, from_mode);
4887 }
4888
4889 /* Generate the body of an insn to extend Y (with mode MFROM)
4890    into X (with mode MTO).  Do zero-extension if UNSIGNEDP is nonzero.  */
4891
4892 rtx
4893 gen_extend_insn (rtx x, rtx y, machine_mode mto,
4894                  machine_mode mfrom, int unsignedp)
4895 {
4896   enum insn_code icode = can_extend_p (mto, mfrom, unsignedp);
4897   return GEN_FCN (icode) (x, y);
4898 }
4899 \f
4900 /* can_fix_p and can_float_p say whether the target machine
4901    can directly convert a given fixed point type to
4902    a given floating point type, or vice versa.
4903    The returned value is the CODE_FOR_... value to use,
4904    or CODE_FOR_nothing if these modes cannot be directly converted.
4905
4906    *TRUNCP_PTR is set to 1 if it is necessary to output
4907    an explicit FTRUNC insn before the fix insn; otherwise 0.  */
4908
4909 static enum insn_code
4910 can_fix_p (machine_mode fixmode, machine_mode fltmode,
4911            int unsignedp, int *truncp_ptr)
4912 {
4913   convert_optab tab;
4914   enum insn_code icode;
4915
4916   tab = unsignedp ? ufixtrunc_optab : sfixtrunc_optab;
4917   icode = convert_optab_handler (tab, fixmode, fltmode);
4918   if (icode != CODE_FOR_nothing)
4919     {
4920       *truncp_ptr = 0;
4921       return icode;
4922     }
4923
4924   /* FIXME: This requires a port to define both FIX and FTRUNC pattern
4925      for this to work. We need to rework the fix* and ftrunc* patterns
4926      and documentation.  */
4927   tab = unsignedp ? ufix_optab : sfix_optab;
4928   icode = convert_optab_handler (tab, fixmode, fltmode);
4929   if (icode != CODE_FOR_nothing
4930       && optab_handler (ftrunc_optab, fltmode) != CODE_FOR_nothing)
4931     {
4932       *truncp_ptr = 1;
4933       return icode;
4934     }
4935
4936   *truncp_ptr = 0;
4937   return CODE_FOR_nothing;
4938 }
4939
4940 enum insn_code
4941 can_float_p (machine_mode fltmode, machine_mode fixmode,
4942              int unsignedp)
4943 {
4944   convert_optab tab;
4945
4946   tab = unsignedp ? ufloat_optab : sfloat_optab;
4947   return convert_optab_handler (tab, fltmode, fixmode);
4948 }
4949
4950 /* Function supportable_convert_operation
4951
4952    Check whether an operation represented by the code CODE is a
4953    convert operation that is supported by the target platform in
4954    vector form (i.e., when operating on arguments of type VECTYPE_IN
4955    producing a result of type VECTYPE_OUT).
4956
4957    Convert operations we currently support directly are FIX_TRUNC and FLOAT.
4958    This function checks if these operations are supported
4959    by the target platform either directly (via vector tree-codes), or via
4960    target builtins.
4961
4962    Output:
4963    - CODE1 is code of vector operation to be used when
4964    vectorizing the operation, if available.
4965    - DECL is decl of target builtin functions to be used
4966    when vectorizing the operation, if available.  In this case,
4967    CODE1 is CALL_EXPR.  */
4968
4969 bool
4970 supportable_convert_operation (enum tree_code code,
4971                                     tree vectype_out, tree vectype_in,
4972                                     tree *decl, enum tree_code *code1)
4973 {
4974   machine_mode m1,m2;
4975   int truncp;
4976
4977   m1 = TYPE_MODE (vectype_out);
4978   m2 = TYPE_MODE (vectype_in);
4979
4980   /* First check if we can done conversion directly.  */
4981   if ((code == FIX_TRUNC_EXPR
4982        && can_fix_p (m1,m2,TYPE_UNSIGNED (vectype_out), &truncp)
4983           != CODE_FOR_nothing)
4984       || (code == FLOAT_EXPR
4985           && can_float_p (m1,m2,TYPE_UNSIGNED (vectype_in))
4986              != CODE_FOR_nothing))
4987     {
4988       *code1 = code;
4989       return true;
4990     }
4991
4992   /* Now check for builtin.  */
4993   if (targetm.vectorize.builtin_conversion
4994       && targetm.vectorize.builtin_conversion (code, vectype_out, vectype_in))
4995     {
4996       *code1 = CALL_EXPR;
4997       *decl = targetm.vectorize.builtin_conversion (code, vectype_out, vectype_in);
4998       return true;
4999     }
5000   return false;
5001 }
5002
5003 \f
5004 /* Generate code to convert FROM to floating point
5005    and store in TO.  FROM must be fixed point and not VOIDmode.
5006    UNSIGNEDP nonzero means regard FROM as unsigned.
5007    Normally this is done by correcting the final value
5008    if it is negative.  */
5009
5010 void
5011 expand_float (rtx to, rtx from, int unsignedp)
5012 {
5013   enum insn_code icode;
5014   rtx target = to;
5015   machine_mode fmode, imode;
5016   bool can_do_signed = false;
5017
5018   /* Crash now, because we won't be able to decide which mode to use.  */
5019   gcc_assert (GET_MODE (from) != VOIDmode);
5020
5021   /* Look for an insn to do the conversion.  Do it in the specified
5022      modes if possible; otherwise convert either input, output or both to
5023      wider mode.  If the integer mode is wider than the mode of FROM,
5024      we can do the conversion signed even if the input is unsigned.  */
5025
5026   for (fmode = GET_MODE (to); fmode != VOIDmode;
5027        fmode = GET_MODE_WIDER_MODE (fmode))
5028     for (imode = GET_MODE (from); imode != VOIDmode;
5029          imode = GET_MODE_WIDER_MODE (imode))
5030       {
5031         int doing_unsigned = unsignedp;
5032
5033         if (fmode != GET_MODE (to)
5034             && significand_size (fmode) < GET_MODE_PRECISION (GET_MODE (from)))
5035           continue;
5036
5037         icode = can_float_p (fmode, imode, unsignedp);
5038         if (icode == CODE_FOR_nothing && unsignedp)
5039           {
5040             enum insn_code scode = can_float_p (fmode, imode, 0);
5041             if (scode != CODE_FOR_nothing)
5042               can_do_signed = true;
5043             if (imode != GET_MODE (from))
5044               icode = scode, doing_unsigned = 0;
5045           }
5046
5047         if (icode != CODE_FOR_nothing)
5048           {
5049             if (imode != GET_MODE (from))
5050               from = convert_to_mode (imode, from, unsignedp);
5051
5052             if (fmode != GET_MODE (to))
5053               target = gen_reg_rtx (fmode);
5054
5055             emit_unop_insn (icode, target, from,
5056                             doing_unsigned ? UNSIGNED_FLOAT : FLOAT);
5057
5058             if (target != to)
5059               convert_move (to, target, 0);
5060             return;
5061           }
5062       }
5063
5064   /* Unsigned integer, and no way to convert directly.  Convert as signed,
5065      then unconditionally adjust the result.  */
5066   if (unsignedp && can_do_signed)
5067     {
5068       rtx_code_label *label = gen_label_rtx ();
5069       rtx temp;
5070       REAL_VALUE_TYPE offset;
5071
5072       /* Look for a usable floating mode FMODE wider than the source and at
5073          least as wide as the target.  Using FMODE will avoid rounding woes
5074          with unsigned values greater than the signed maximum value.  */
5075
5076       for (fmode = GET_MODE (to);  fmode != VOIDmode;
5077            fmode = GET_MODE_WIDER_MODE (fmode))
5078         if (GET_MODE_PRECISION (GET_MODE (from)) < GET_MODE_BITSIZE (fmode)
5079             && can_float_p (fmode, GET_MODE (from), 0) != CODE_FOR_nothing)
5080           break;
5081
5082       if (fmode == VOIDmode)
5083         {
5084           /* There is no such mode.  Pretend the target is wide enough.  */
5085           fmode = GET_MODE (to);
5086
5087           /* Avoid double-rounding when TO is narrower than FROM.  */
5088           if ((significand_size (fmode) + 1)
5089               < GET_MODE_PRECISION (GET_MODE (from)))
5090             {
5091               rtx temp1;
5092               rtx_code_label *neglabel = gen_label_rtx ();
5093
5094               /* Don't use TARGET if it isn't a register, is a hard register,
5095                  or is the wrong mode.  */
5096               if (!REG_P (target)
5097                   || REGNO (target) < FIRST_PSEUDO_REGISTER
5098                   || GET_MODE (target) != fmode)
5099                 target = gen_reg_rtx (fmode);
5100
5101               imode = GET_MODE (from);
5102               do_pending_stack_adjust ();
5103
5104               /* Test whether the sign bit is set.  */
5105               emit_cmp_and_jump_insns (from, const0_rtx, LT, NULL_RTX, imode,
5106                                        0, neglabel);
5107
5108               /* The sign bit is not set.  Convert as signed.  */
5109               expand_float (target, from, 0);
5110               emit_jump_insn (gen_jump (label));
5111               emit_barrier ();
5112
5113               /* The sign bit is set.
5114                  Convert to a usable (positive signed) value by shifting right
5115                  one bit, while remembering if a nonzero bit was shifted
5116                  out; i.e., compute  (from & 1) | (from >> 1).  */
5117
5118               emit_label (neglabel);
5119               temp = expand_binop (imode, and_optab, from, const1_rtx,
5120                                    NULL_RTX, 1, OPTAB_LIB_WIDEN);
5121               temp1 = expand_shift (RSHIFT_EXPR, imode, from, 1, NULL_RTX, 1);
5122               temp = expand_binop (imode, ior_optab, temp, temp1, temp, 1,
5123                                    OPTAB_LIB_WIDEN);
5124               expand_float (target, temp, 0);
5125
5126               /* Multiply by 2 to undo the shift above.  */
5127               temp = expand_binop (fmode, add_optab, target, target,
5128                                    target, 0, OPTAB_LIB_WIDEN);
5129               if (temp != target)
5130                 emit_move_insn (target, temp);
5131
5132               do_pending_stack_adjust ();
5133               emit_label (label);
5134               goto done;
5135             }
5136         }
5137
5138       /* If we are about to do some arithmetic to correct for an
5139          unsigned operand, do it in a pseudo-register.  */
5140
5141       if (GET_MODE (to) != fmode
5142           || !REG_P (to) || REGNO (to) < FIRST_PSEUDO_REGISTER)
5143         target = gen_reg_rtx (fmode);
5144
5145       /* Convert as signed integer to floating.  */
5146       expand_float (target, from, 0);
5147
5148       /* If FROM is negative (and therefore TO is negative),
5149          correct its value by 2**bitwidth.  */
5150
5151       do_pending_stack_adjust ();
5152       emit_cmp_and_jump_insns (from, const0_rtx, GE, NULL_RTX, GET_MODE (from),
5153                                0, label);
5154
5155
5156       real_2expN (&offset, GET_MODE_PRECISION (GET_MODE (from)), fmode);
5157       temp = expand_binop (fmode, add_optab, target,
5158                            CONST_DOUBLE_FROM_REAL_VALUE (offset, fmode),
5159                            target, 0, OPTAB_LIB_WIDEN);
5160       if (temp != target)
5161         emit_move_insn (target, temp);
5162
5163       do_pending_stack_adjust ();
5164       emit_label (label);
5165       goto done;
5166     }
5167
5168   /* No hardware instruction available; call a library routine.  */
5169     {
5170       rtx libfunc;
5171       rtx_insn *insns;
5172       rtx value;
5173       convert_optab tab = unsignedp ? ufloat_optab : sfloat_optab;
5174
5175       if (GET_MODE_PRECISION (GET_MODE (from)) < GET_MODE_PRECISION (SImode))
5176         from = convert_to_mode (SImode, from, unsignedp);
5177
5178       libfunc = convert_optab_libfunc (tab, GET_MODE (to), GET_MODE (from));
5179       gcc_assert (libfunc);
5180
5181       start_sequence ();
5182
5183       value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
5184                                        GET_MODE (to), 1, from,
5185                                        GET_MODE (from));
5186       insns = get_insns ();
5187       end_sequence ();
5188
5189       emit_libcall_block (insns, target, value,
5190                           gen_rtx_fmt_e (unsignedp ? UNSIGNED_FLOAT : FLOAT,
5191                                          GET_MODE (to), from));
5192     }
5193
5194  done:
5195
5196   /* Copy result to requested destination
5197      if we have been computing in a temp location.  */
5198
5199   if (target != to)
5200     {
5201       if (GET_MODE (target) == GET_MODE (to))
5202         emit_move_insn (to, target);
5203       else
5204         convert_move (to, target, 0);
5205     }
5206 }
5207 \f
5208 /* Generate code to convert FROM to fixed point and store in TO.  FROM
5209    must be floating point.  */
5210
5211 void
5212 expand_fix (rtx to, rtx from, int unsignedp)
5213 {
5214   enum insn_code icode;
5215   rtx target = to;
5216   machine_mode fmode, imode;
5217   int must_trunc = 0;
5218
5219   /* We first try to find a pair of modes, one real and one integer, at
5220      least as wide as FROM and TO, respectively, in which we can open-code
5221      this conversion.  If the integer mode is wider than the mode of TO,
5222      we can do the conversion either signed or unsigned.  */
5223
5224   for (fmode = GET_MODE (from); fmode != VOIDmode;
5225        fmode = GET_MODE_WIDER_MODE (fmode))
5226     for (imode = GET_MODE (to); imode != VOIDmode;
5227          imode = GET_MODE_WIDER_MODE (imode))
5228       {
5229         int doing_unsigned = unsignedp;
5230
5231         icode = can_fix_p (imode, fmode, unsignedp, &must_trunc);
5232         if (icode == CODE_FOR_nothing && imode != GET_MODE (to) && unsignedp)
5233           icode = can_fix_p (imode, fmode, 0, &must_trunc), doing_unsigned = 0;
5234
5235         if (icode != CODE_FOR_nothing)
5236           {
5237             rtx_insn *last = get_last_insn ();
5238             if (fmode != GET_MODE (from))
5239               from = convert_to_mode (fmode, from, 0);
5240
5241             if (must_trunc)
5242               {
5243                 rtx temp = gen_reg_rtx (GET_MODE (from));
5244                 from = expand_unop (GET_MODE (from), ftrunc_optab, from,
5245                                     temp, 0);
5246               }
5247
5248             if (imode != GET_MODE (to))
5249               target = gen_reg_rtx (imode);
5250
5251             if (maybe_emit_unop_insn (icode, target, from,
5252                                       doing_unsigned ? UNSIGNED_FIX : FIX))
5253               {
5254                 if (target != to)
5255                   convert_move (to, target, unsignedp);
5256                 return;
5257               }
5258             delete_insns_since (last);
5259           }
5260       }
5261
5262   /* For an unsigned conversion, there is one more way to do it.
5263      If we have a signed conversion, we generate code that compares
5264      the real value to the largest representable positive number.  If if
5265      is smaller, the conversion is done normally.  Otherwise, subtract
5266      one plus the highest signed number, convert, and add it back.
5267
5268      We only need to check all real modes, since we know we didn't find
5269      anything with a wider integer mode.
5270
5271      This code used to extend FP value into mode wider than the destination.
5272      This is needed for decimal float modes which cannot accurately
5273      represent one plus the highest signed number of the same size, but
5274      not for binary modes.  Consider, for instance conversion from SFmode
5275      into DImode.
5276
5277      The hot path through the code is dealing with inputs smaller than 2^63
5278      and doing just the conversion, so there is no bits to lose.
5279
5280      In the other path we know the value is positive in the range 2^63..2^64-1
5281      inclusive.  (as for other input overflow happens and result is undefined)
5282      So we know that the most important bit set in mantissa corresponds to
5283      2^63.  The subtraction of 2^63 should not generate any rounding as it
5284      simply clears out that bit.  The rest is trivial.  */
5285
5286   if (unsignedp && GET_MODE_PRECISION (GET_MODE (to)) <= HOST_BITS_PER_WIDE_INT)
5287     for (fmode = GET_MODE (from); fmode != VOIDmode;
5288          fmode = GET_MODE_WIDER_MODE (fmode))
5289       if (CODE_FOR_nothing != can_fix_p (GET_MODE (to), fmode, 0, &must_trunc)
5290           && (!DECIMAL_FLOAT_MODE_P (fmode)
5291               || GET_MODE_BITSIZE (fmode) > GET_MODE_PRECISION (GET_MODE (to))))
5292         {
5293           int bitsize;
5294           REAL_VALUE_TYPE offset;
5295           rtx limit;
5296           rtx_code_label *lab1, *lab2;
5297           rtx_insn *insn;
5298
5299           bitsize = GET_MODE_PRECISION (GET_MODE (to));
5300           real_2expN (&offset, bitsize - 1, fmode);
5301           limit = CONST_DOUBLE_FROM_REAL_VALUE (offset, fmode);
5302           lab1 = gen_label_rtx ();
5303           lab2 = gen_label_rtx ();
5304
5305           if (fmode != GET_MODE (from))
5306             from = convert_to_mode (fmode, from, 0);
5307
5308           /* See if we need to do the subtraction.  */
5309           do_pending_stack_adjust ();
5310           emit_cmp_and_jump_insns (from, limit, GE, NULL_RTX, GET_MODE (from),
5311                                    0, lab1);
5312
5313           /* If not, do the signed "fix" and branch around fixup code.  */
5314           expand_fix (to, from, 0);
5315           emit_jump_insn (gen_jump (lab2));
5316           emit_barrier ();
5317
5318           /* Otherwise, subtract 2**(N-1), convert to signed number,
5319              then add 2**(N-1).  Do the addition using XOR since this
5320              will often generate better code.  */
5321           emit_label (lab1);
5322           target = expand_binop (GET_MODE (from), sub_optab, from, limit,
5323                                  NULL_RTX, 0, OPTAB_LIB_WIDEN);
5324           expand_fix (to, target, 0);
5325           target = expand_binop (GET_MODE (to), xor_optab, to,
5326                                  gen_int_mode
5327                                  ((HOST_WIDE_INT) 1 << (bitsize - 1),
5328                                   GET_MODE (to)),
5329                                  to, 1, OPTAB_LIB_WIDEN);
5330
5331           if (target != to)
5332             emit_move_insn (to, target);
5333
5334           emit_label (lab2);
5335
5336           if (optab_handler (mov_optab, GET_MODE (to)) != CODE_FOR_nothing)
5337             {
5338               /* Make a place for a REG_NOTE and add it.  */
5339               insn = emit_move_insn (to, to);
5340               set_dst_reg_note (insn, REG_EQUAL,
5341                                 gen_rtx_fmt_e (UNSIGNED_FIX, GET_MODE (to),
5342                                                copy_rtx (from)),
5343                                 to);
5344             }
5345
5346           return;
5347         }
5348
5349   /* We can't do it with an insn, so use a library call.  But first ensure
5350      that the mode of TO is at least as wide as SImode, since those are the
5351      only library calls we know about.  */
5352
5353   if (GET_MODE_PRECISION (GET_MODE (to)) < GET_MODE_PRECISION (SImode))
5354     {
5355       target = gen_reg_rtx (SImode);
5356
5357       expand_fix (target, from, unsignedp);
5358     }
5359   else
5360     {
5361       rtx_insn *insns;
5362       rtx value;
5363       rtx libfunc;
5364
5365       convert_optab tab = unsignedp ? ufix_optab : sfix_optab;
5366       libfunc = convert_optab_libfunc (tab, GET_MODE (to), GET_MODE (from));
5367       gcc_assert (libfunc);
5368
5369       start_sequence ();
5370
5371       value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
5372                                        GET_MODE (to), 1, from,
5373                                        GET_MODE (from));
5374       insns = get_insns ();
5375       end_sequence ();
5376
5377       emit_libcall_block (insns, target, value,
5378                           gen_rtx_fmt_e (unsignedp ? UNSIGNED_FIX : FIX,
5379                                          GET_MODE (to), from));
5380     }
5381
5382   if (target != to)
5383     {
5384       if (GET_MODE (to) == GET_MODE (target))
5385         emit_move_insn (to, target);
5386       else
5387         convert_move (to, target, 0);
5388     }
5389 }
5390
5391 /* Generate code to convert FROM or TO a fixed-point.
5392    If UINTP is true, either TO or FROM is an unsigned integer.
5393    If SATP is true, we need to saturate the result.  */
5394
5395 void
5396 expand_fixed_convert (rtx to, rtx from, int uintp, int satp)
5397 {
5398   machine_mode to_mode = GET_MODE (to);
5399   machine_mode from_mode = GET_MODE (from);
5400   convert_optab tab;
5401   enum rtx_code this_code;
5402   enum insn_code code;
5403   rtx_insn *insns;
5404   rtx value;
5405   rtx libfunc;
5406
5407   if (to_mode == from_mode)
5408     {
5409       emit_move_insn (to, from);
5410       return;
5411     }
5412
5413   if (uintp)
5414     {
5415       tab = satp ? satfractuns_optab : fractuns_optab;
5416       this_code = satp ? UNSIGNED_SAT_FRACT : UNSIGNED_FRACT_CONVERT;
5417     }
5418   else
5419     {
5420       tab = satp ? satfract_optab : fract_optab;
5421       this_code = satp ? SAT_FRACT : FRACT_CONVERT;
5422     }
5423   code = convert_optab_handler (tab, to_mode, from_mode);
5424   if (code != CODE_FOR_nothing)
5425     {
5426       emit_unop_insn (code, to, from, this_code);
5427       return;
5428     }
5429
5430   libfunc = convert_optab_libfunc (tab, to_mode, from_mode);
5431   gcc_assert (libfunc);
5432
5433   start_sequence ();
5434   value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST, to_mode,
5435                                    1, from, from_mode);
5436   insns = get_insns ();
5437   end_sequence ();
5438
5439   emit_libcall_block (insns, to, value,
5440                       gen_rtx_fmt_e (optab_to_code (tab), to_mode, from));
5441 }
5442
5443 /* Generate code to convert FROM to fixed point and store in TO.  FROM
5444    must be floating point, TO must be signed.  Use the conversion optab
5445    TAB to do the conversion.  */
5446
5447 bool
5448 expand_sfix_optab (rtx to, rtx from, convert_optab tab)
5449 {
5450   enum insn_code icode;
5451   rtx target = to;
5452   machine_mode fmode, imode;
5453
5454   /* We first try to find a pair of modes, one real and one integer, at
5455      least as wide as FROM and TO, respectively, in which we can open-code
5456      this conversion.  If the integer mode is wider than the mode of TO,
5457      we can do the conversion either signed or unsigned.  */
5458
5459   for (fmode = GET_MODE (from); fmode != VOIDmode;
5460        fmode = GET_MODE_WIDER_MODE (fmode))
5461     for (imode = GET_MODE (to); imode != VOIDmode;
5462          imode = GET_MODE_WIDER_MODE (imode))
5463       {
5464         icode = convert_optab_handler (tab, imode, fmode);
5465         if (icode != CODE_FOR_nothing)
5466           {
5467             rtx_insn *last = get_last_insn ();
5468             if (fmode != GET_MODE (from))
5469               from = convert_to_mode (fmode, from, 0);
5470
5471             if (imode != GET_MODE (to))
5472               target = gen_reg_rtx (imode);
5473
5474             if (!maybe_emit_unop_insn (icode, target, from, UNKNOWN))
5475               {
5476                 delete_insns_since (last);
5477                 continue;
5478               }
5479             if (target != to)
5480               convert_move (to, target, 0);
5481             return true;
5482           }
5483       }
5484
5485   return false;
5486 }
5487 \f
5488 /* Report whether we have an instruction to perform the operation
5489    specified by CODE on operands of mode MODE.  */
5490 int
5491 have_insn_for (enum rtx_code code, machine_mode mode)
5492 {
5493   return (code_to_optab (code)
5494           && (optab_handler (code_to_optab (code), mode)
5495               != CODE_FOR_nothing));
5496 }
5497
5498 /* Initialize the libfunc fields of an entire group of entries in some
5499    optab.  Each entry is set equal to a string consisting of a leading
5500    pair of underscores followed by a generic operation name followed by
5501    a mode name (downshifted to lowercase) followed by a single character
5502    representing the number of operands for the given operation (which is
5503    usually one of the characters '2', '3', or '4').
5504
5505    OPTABLE is the table in which libfunc fields are to be initialized.
5506    OPNAME is the generic (string) name of the operation.
5507    SUFFIX is the character which specifies the number of operands for
5508      the given generic operation.
5509    MODE is the mode to generate for.
5510 */
5511
5512 static void
5513 gen_libfunc (optab optable, const char *opname, int suffix,
5514              machine_mode mode)
5515 {
5516   unsigned opname_len = strlen (opname);
5517   const char *mname = GET_MODE_NAME (mode);
5518   unsigned mname_len = strlen (mname);
5519   int prefix_len = targetm.libfunc_gnu_prefix ? 6 : 2;
5520   int len = prefix_len + opname_len + mname_len + 1 + 1;
5521   char *libfunc_name = XALLOCAVEC (char, len);
5522   char *p;
5523   const char *q;
5524
5525   p = libfunc_name;
5526   *p++ = '_';
5527   *p++ = '_';
5528   if (targetm.libfunc_gnu_prefix)
5529     {
5530       *p++ = 'g';
5531       *p++ = 'n';
5532       *p++ = 'u';
5533       *p++ = '_';
5534     }
5535   for (q = opname; *q; )
5536     *p++ = *q++;
5537   for (q = mname; *q; q++)
5538     *p++ = TOLOWER (*q);
5539   *p++ = suffix;
5540   *p = '\0';
5541
5542   set_optab_libfunc (optable, mode,
5543                      ggc_alloc_string (libfunc_name, p - libfunc_name));
5544 }
5545
5546 /* Like gen_libfunc, but verify that integer operation is involved.  */
5547
5548 void
5549 gen_int_libfunc (optab optable, const char *opname, char suffix,
5550                  machine_mode mode)
5551 {
5552   int maxsize = 2 * BITS_PER_WORD;
5553   int minsize = BITS_PER_WORD;
5554
5555   if (GET_MODE_CLASS (mode) != MODE_INT)
5556     return;
5557   if (maxsize < LONG_LONG_TYPE_SIZE)
5558     maxsize = LONG_LONG_TYPE_SIZE;
5559   if (minsize > INT_TYPE_SIZE
5560       && (trapv_binoptab_p (optable)
5561           || trapv_unoptab_p (optable)))
5562     minsize = INT_TYPE_SIZE;
5563   if (GET_MODE_BITSIZE (mode) < minsize
5564       || GET_MODE_BITSIZE (mode) > maxsize)
5565     return;
5566   gen_libfunc (optable, opname, suffix, mode);
5567 }
5568
5569 /* Like gen_libfunc, but verify that FP and set decimal prefix if needed.  */
5570
5571 void
5572 gen_fp_libfunc (optab optable, const char *opname, char suffix,
5573                 machine_mode mode)
5574 {
5575   char *dec_opname;
5576
5577   if (GET_MODE_CLASS (mode) == MODE_FLOAT)
5578     gen_libfunc (optable, opname, suffix, mode);
5579   if (DECIMAL_FLOAT_MODE_P (mode))
5580     {
5581       dec_opname = XALLOCAVEC (char, sizeof (DECIMAL_PREFIX) + strlen (opname));
5582       /* For BID support, change the name to have either a bid_ or dpd_ prefix
5583          depending on the low level floating format used.  */
5584       memcpy (dec_opname, DECIMAL_PREFIX, sizeof (DECIMAL_PREFIX) - 1);
5585       strcpy (dec_opname + sizeof (DECIMAL_PREFIX) - 1, opname);
5586       gen_libfunc (optable, dec_opname, suffix, mode);
5587     }
5588 }
5589
5590 /* Like gen_libfunc, but verify that fixed-point operation is involved.  */
5591
5592 void
5593 gen_fixed_libfunc (optab optable, const char *opname, char suffix,
5594                    machine_mode mode)
5595 {
5596   if (!ALL_FIXED_POINT_MODE_P (mode))
5597     return;
5598   gen_libfunc (optable, opname, suffix, mode);
5599 }
5600
5601 /* Like gen_libfunc, but verify that signed fixed-point operation is
5602    involved.  */
5603
5604 void
5605 gen_signed_fixed_libfunc (optab optable, const char *opname, char suffix,
5606                           machine_mode mode)
5607 {
5608   if (!SIGNED_FIXED_POINT_MODE_P (mode))
5609     return;
5610   gen_libfunc (optable, opname, suffix, mode);
5611 }
5612
5613 /* Like gen_libfunc, but verify that unsigned fixed-point operation is
5614    involved.  */
5615
5616 void
5617 gen_unsigned_fixed_libfunc (optab optable, const char *opname, char suffix,
5618                             machine_mode mode)
5619 {
5620   if (!UNSIGNED_FIXED_POINT_MODE_P (mode))
5621     return;
5622   gen_libfunc (optable, opname, suffix, mode);
5623 }
5624
5625 /* Like gen_libfunc, but verify that FP or INT operation is involved.  */
5626
5627 void
5628 gen_int_fp_libfunc (optab optable, const char *name, char suffix,
5629                     machine_mode mode)
5630 {
5631   if (DECIMAL_FLOAT_MODE_P (mode) || GET_MODE_CLASS (mode) == MODE_FLOAT)
5632     gen_fp_libfunc (optable, name, suffix, mode);
5633   if (INTEGRAL_MODE_P (mode))
5634     gen_int_libfunc (optable, name, suffix, mode);
5635 }
5636
5637 /* Like gen_libfunc, but verify that FP or INT operation is involved
5638    and add 'v' suffix for integer operation.  */
5639
5640 void
5641 gen_intv_fp_libfunc (optab optable, const char *name, char suffix,
5642                      machine_mode mode)
5643 {
5644   if (DECIMAL_FLOAT_MODE_P (mode) || GET_MODE_CLASS (mode) == MODE_FLOAT)
5645     gen_fp_libfunc (optable, name, suffix, mode);
5646   if (GET_MODE_CLASS (mode) == MODE_INT)
5647     {
5648       int len = strlen (name);
5649       char *v_name = XALLOCAVEC (char, len + 2);
5650       strcpy (v_name, name);
5651       v_name[len] = 'v';
5652       v_name[len + 1] = 0;
5653       gen_int_libfunc (optable, v_name, suffix, mode);
5654     }
5655 }
5656
5657 /* Like gen_libfunc, but verify that FP or INT or FIXED operation is
5658    involved.  */
5659
5660 void
5661 gen_int_fp_fixed_libfunc (optab optable, const char *name, char suffix,
5662                           machine_mode mode)
5663 {
5664   if (DECIMAL_FLOAT_MODE_P (mode) || GET_MODE_CLASS (mode) == MODE_FLOAT)
5665     gen_fp_libfunc (optable, name, suffix, mode);
5666   if (INTEGRAL_MODE_P (mode))
5667     gen_int_libfunc (optable, name, suffix, mode);
5668   if (ALL_FIXED_POINT_MODE_P (mode))
5669     gen_fixed_libfunc (optable, name, suffix, mode);
5670 }
5671
5672 /* Like gen_libfunc, but verify that FP or INT or signed FIXED operation is
5673    involved.  */
5674
5675 void
5676 gen_int_fp_signed_fixed_libfunc (optab optable, const char *name, char suffix,
5677                                  machine_mode mode)
5678 {
5679   if (DECIMAL_FLOAT_MODE_P (mode) || GET_MODE_CLASS (mode) == MODE_FLOAT)
5680     gen_fp_libfunc (optable, name, suffix, mode);
5681   if (INTEGRAL_MODE_P (mode))
5682     gen_int_libfunc (optable, name, suffix, mode);
5683   if (SIGNED_FIXED_POINT_MODE_P (mode))
5684     gen_signed_fixed_libfunc (optable, name, suffix, mode);
5685 }
5686
5687 /* Like gen_libfunc, but verify that INT or FIXED operation is
5688    involved.  */
5689
5690 void
5691 gen_int_fixed_libfunc (optab optable, const char *name, char suffix,
5692                        machine_mode mode)
5693 {
5694   if (INTEGRAL_MODE_P (mode))
5695     gen_int_libfunc (optable, name, suffix, mode);
5696   if (ALL_FIXED_POINT_MODE_P (mode))
5697     gen_fixed_libfunc (optable, name, suffix, mode);
5698 }
5699
5700 /* Like gen_libfunc, but verify that INT or signed FIXED operation is
5701    involved.  */
5702
5703 void
5704 gen_int_signed_fixed_libfunc (optab optable, const char *name, char suffix,
5705                               machine_mode mode)
5706 {
5707   if (INTEGRAL_MODE_P (mode))
5708     gen_int_libfunc (optable, name, suffix, mode);
5709   if (SIGNED_FIXED_POINT_MODE_P (mode))
5710     gen_signed_fixed_libfunc (optable, name, suffix, mode);
5711 }
5712
5713 /* Like gen_libfunc, but verify that INT or unsigned FIXED operation is
5714    involved.  */
5715
5716 void
5717 gen_int_unsigned_fixed_libfunc (optab optable, const char *name, char suffix,
5718                                 machine_mode mode)
5719 {
5720   if (INTEGRAL_MODE_P (mode))
5721     gen_int_libfunc (optable, name, suffix, mode);
5722   if (UNSIGNED_FIXED_POINT_MODE_P (mode))
5723     gen_unsigned_fixed_libfunc (optable, name, suffix, mode);
5724 }
5725
5726 /* Initialize the libfunc fields of an entire group of entries of an
5727    inter-mode-class conversion optab.  The string formation rules are
5728    similar to the ones for init_libfuncs, above, but instead of having
5729    a mode name and an operand count these functions have two mode names
5730    and no operand count.  */
5731
5732 void
5733 gen_interclass_conv_libfunc (convert_optab tab,
5734                              const char *opname,
5735                              machine_mode tmode,
5736                              machine_mode fmode)
5737 {
5738   size_t opname_len = strlen (opname);
5739   size_t mname_len = 0;
5740
5741   const char *fname, *tname;
5742   const char *q;
5743   int prefix_len = targetm.libfunc_gnu_prefix ? 6 : 2;
5744   char *libfunc_name, *suffix;
5745   char *nondec_name, *dec_name, *nondec_suffix, *dec_suffix;
5746   char *p;
5747
5748   /* If this is a decimal conversion, add the current BID vs. DPD prefix that
5749      depends on which underlying decimal floating point format is used.  */
5750   const size_t dec_len = sizeof (DECIMAL_PREFIX) - 1;
5751
5752   mname_len = strlen (GET_MODE_NAME (tmode)) + strlen (GET_MODE_NAME (fmode));
5753
5754   nondec_name = XALLOCAVEC (char, prefix_len + opname_len + mname_len + 1 + 1);
5755   nondec_name[0] = '_';
5756   nondec_name[1] = '_';
5757   if (targetm.libfunc_gnu_prefix)
5758     {
5759       nondec_name[2] = 'g';
5760       nondec_name[3] = 'n';
5761       nondec_name[4] = 'u';
5762       nondec_name[5] = '_';
5763     }
5764
5765   memcpy (&nondec_name[prefix_len], opname, opname_len);
5766   nondec_suffix = nondec_name + opname_len + prefix_len;
5767
5768   dec_name = XALLOCAVEC (char, 2 + dec_len + opname_len + mname_len + 1 + 1);
5769   dec_name[0] = '_';
5770   dec_name[1] = '_';
5771   memcpy (&dec_name[2], DECIMAL_PREFIX, dec_len);
5772   memcpy (&dec_name[2+dec_len], opname, opname_len);
5773   dec_suffix = dec_name + dec_len + opname_len + 2;
5774
5775   fname = GET_MODE_NAME (fmode);
5776   tname = GET_MODE_NAME (tmode);
5777
5778   if (DECIMAL_FLOAT_MODE_P (fmode) || DECIMAL_FLOAT_MODE_P (tmode))
5779     {
5780       libfunc_name = dec_name;
5781       suffix = dec_suffix;
5782     }
5783   else
5784     {
5785       libfunc_name = nondec_name;
5786       suffix = nondec_suffix;
5787     }
5788
5789   p = suffix;
5790   for (q = fname; *q; p++, q++)
5791     *p = TOLOWER (*q);
5792   for (q = tname; *q; p++, q++)
5793     *p = TOLOWER (*q);
5794
5795   *p = '\0';
5796
5797   set_conv_libfunc (tab, tmode, fmode,
5798                     ggc_alloc_string (libfunc_name, p - libfunc_name));
5799 }
5800
5801 /* Same as gen_interclass_conv_libfunc but verify that we are producing
5802    int->fp conversion.  */
5803
5804 void
5805 gen_int_to_fp_conv_libfunc (convert_optab tab,
5806                             const char *opname,
5807                             machine_mode tmode,
5808                             machine_mode fmode)
5809 {
5810   if (GET_MODE_CLASS (fmode) != MODE_INT)
5811     return;
5812   if (GET_MODE_CLASS (tmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (tmode))
5813     return;
5814   gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
5815 }
5816
5817 /* ufloat_optab is special by using floatun for FP and floatuns decimal fp
5818    naming scheme.  */
5819
5820 void
5821 gen_ufloat_conv_libfunc (convert_optab tab,
5822                          const char *opname ATTRIBUTE_UNUSED,
5823                          machine_mode tmode,
5824                          machine_mode fmode)
5825 {
5826   if (DECIMAL_FLOAT_MODE_P (tmode))
5827     gen_int_to_fp_conv_libfunc (tab, "floatuns", tmode, fmode);
5828   else
5829     gen_int_to_fp_conv_libfunc (tab, "floatun", tmode, fmode);
5830 }
5831
5832 /* Same as gen_interclass_conv_libfunc but verify that we are producing
5833    fp->int conversion.  */
5834
5835 void
5836 gen_int_to_fp_nondecimal_conv_libfunc (convert_optab tab,
5837                                        const char *opname,
5838                                        machine_mode tmode,
5839                                        machine_mode fmode)
5840 {
5841   if (GET_MODE_CLASS (fmode) != MODE_INT)
5842     return;
5843   if (GET_MODE_CLASS (tmode) != MODE_FLOAT)
5844     return;
5845   gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
5846 }
5847
5848 /* Same as gen_interclass_conv_libfunc but verify that we are producing
5849    fp->int conversion with no decimal floating point involved.  */
5850
5851 void
5852 gen_fp_to_int_conv_libfunc (convert_optab tab,
5853                             const char *opname,
5854                             machine_mode tmode,
5855                             machine_mode fmode)
5856 {
5857   if (GET_MODE_CLASS (fmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (fmode))
5858     return;
5859   if (GET_MODE_CLASS (tmode) != MODE_INT)
5860     return;
5861   gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
5862 }
5863
5864 /* Initialize the libfunc fields of an of an intra-mode-class conversion optab.
5865    The string formation rules are
5866    similar to the ones for init_libfunc, above.  */
5867
5868 void
5869 gen_intraclass_conv_libfunc (convert_optab tab, const char *opname,
5870                              machine_mode tmode, machine_mode fmode)
5871 {
5872   size_t opname_len = strlen (opname);
5873   size_t mname_len = 0;
5874
5875   const char *fname, *tname;
5876   const char *q;
5877   int prefix_len = targetm.libfunc_gnu_prefix ? 6 : 2;
5878   char *nondec_name, *dec_name, *nondec_suffix, *dec_suffix;
5879   char *libfunc_name, *suffix;
5880   char *p;
5881
5882   /* If this is a decimal conversion, add the current BID vs. DPD prefix that
5883      depends on which underlying decimal floating point format is used.  */
5884   const size_t dec_len = sizeof (DECIMAL_PREFIX) - 1;
5885
5886   mname_len = strlen (GET_MODE_NAME (tmode)) + strlen (GET_MODE_NAME (fmode));
5887
5888   nondec_name = XALLOCAVEC (char, 2 + opname_len + mname_len + 1 + 1);
5889   nondec_name[0] = '_';
5890   nondec_name[1] = '_';
5891   if (targetm.libfunc_gnu_prefix)
5892     {
5893       nondec_name[2] = 'g';
5894       nondec_name[3] = 'n';
5895       nondec_name[4] = 'u';
5896       nondec_name[5] = '_';
5897     }
5898   memcpy (&nondec_name[prefix_len], opname, opname_len);
5899   nondec_suffix = nondec_name + opname_len + prefix_len;
5900
5901   dec_name = XALLOCAVEC (char, 2 + dec_len + opname_len + mname_len + 1 + 1);
5902   dec_name[0] = '_';
5903   dec_name[1] = '_';
5904   memcpy (&dec_name[2], DECIMAL_PREFIX, dec_len);
5905   memcpy (&dec_name[2 + dec_len], opname, opname_len);
5906   dec_suffix = dec_name + dec_len + opname_len + 2;
5907
5908   fname = GET_MODE_NAME (fmode);
5909   tname = GET_MODE_NAME (tmode);
5910
5911   if (DECIMAL_FLOAT_MODE_P (fmode) || DECIMAL_FLOAT_MODE_P (tmode))
5912     {
5913       libfunc_name = dec_name;
5914       suffix = dec_suffix;
5915     }
5916   else
5917     {
5918       libfunc_name = nondec_name;
5919       suffix = nondec_suffix;
5920     }
5921
5922   p = suffix;
5923   for (q = fname; *q; p++, q++)
5924     *p = TOLOWER (*q);
5925   for (q = tname; *q; p++, q++)
5926     *p = TOLOWER (*q);
5927
5928   *p++ = '2';
5929   *p = '\0';
5930
5931   set_conv_libfunc (tab, tmode, fmode,
5932                     ggc_alloc_string (libfunc_name, p - libfunc_name));
5933 }
5934
5935 /* Pick proper libcall for trunc_optab.  We need to chose if we do
5936    truncation or extension and interclass or intraclass.  */
5937
5938 void
5939 gen_trunc_conv_libfunc (convert_optab tab,
5940                          const char *opname,
5941                          machine_mode tmode,
5942                          machine_mode fmode)
5943 {
5944   if (GET_MODE_CLASS (tmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (tmode))
5945     return;
5946   if (GET_MODE_CLASS (fmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (fmode))
5947     return;
5948   if (tmode == fmode)
5949     return;
5950
5951   if ((GET_MODE_CLASS (tmode) == MODE_FLOAT && DECIMAL_FLOAT_MODE_P (fmode))
5952       || (GET_MODE_CLASS (fmode) == MODE_FLOAT && DECIMAL_FLOAT_MODE_P (tmode)))
5953      gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
5954
5955   if (GET_MODE_PRECISION (fmode) <= GET_MODE_PRECISION (tmode))
5956     return;
5957
5958   if ((GET_MODE_CLASS (tmode) == MODE_FLOAT
5959        && GET_MODE_CLASS (fmode) == MODE_FLOAT)
5960       || (DECIMAL_FLOAT_MODE_P (fmode) && DECIMAL_FLOAT_MODE_P (tmode)))
5961     gen_intraclass_conv_libfunc (tab, opname, tmode, fmode);
5962 }
5963
5964 /* Pick proper libcall for extend_optab.  We need to chose if we do
5965    truncation or extension and interclass or intraclass.  */
5966
5967 void
5968 gen_extend_conv_libfunc (convert_optab tab,
5969                          const char *opname ATTRIBUTE_UNUSED,
5970                          machine_mode tmode,
5971                          machine_mode fmode)
5972 {
5973   if (GET_MODE_CLASS (tmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (tmode))
5974     return;
5975   if (GET_MODE_CLASS (fmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (fmode))
5976     return;
5977   if (tmode == fmode)
5978     return;
5979
5980   if ((GET_MODE_CLASS (tmode) == MODE_FLOAT && DECIMAL_FLOAT_MODE_P (fmode))
5981       || (GET_MODE_CLASS (fmode) == MODE_FLOAT && DECIMAL_FLOAT_MODE_P (tmode)))
5982      gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
5983
5984   if (GET_MODE_PRECISION (fmode) > GET_MODE_PRECISION (tmode))
5985     return;
5986
5987   if ((GET_MODE_CLASS (tmode) == MODE_FLOAT
5988        && GET_MODE_CLASS (fmode) == MODE_FLOAT)
5989       || (DECIMAL_FLOAT_MODE_P (fmode) && DECIMAL_FLOAT_MODE_P (tmode)))
5990     gen_intraclass_conv_libfunc (tab, opname, tmode, fmode);
5991 }
5992
5993 /* Pick proper libcall for fract_optab.  We need to chose if we do
5994    interclass or intraclass.  */
5995
5996 void
5997 gen_fract_conv_libfunc (convert_optab tab,
5998                         const char *opname,
5999                         machine_mode tmode,
6000                         machine_mode fmode)
6001 {
6002   if (tmode == fmode)
6003     return;
6004   if (!(ALL_FIXED_POINT_MODE_P (tmode) || ALL_FIXED_POINT_MODE_P (fmode)))
6005     return;
6006
6007   if (GET_MODE_CLASS (tmode) == GET_MODE_CLASS (fmode))
6008     gen_intraclass_conv_libfunc (tab, opname, tmode, fmode);
6009   else
6010     gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
6011 }
6012
6013 /* Pick proper libcall for fractuns_optab.  */
6014
6015 void
6016 gen_fractuns_conv_libfunc (convert_optab tab,
6017                            const char *opname,
6018                            machine_mode tmode,
6019                            machine_mode fmode)
6020 {
6021   if (tmode == fmode)
6022     return;
6023   /* One mode must be a fixed-point mode, and the other must be an integer
6024      mode. */
6025   if (!((ALL_FIXED_POINT_MODE_P (tmode) && GET_MODE_CLASS (fmode) == MODE_INT)
6026         || (ALL_FIXED_POINT_MODE_P (fmode)
6027             && GET_MODE_CLASS (tmode) == MODE_INT)))
6028     return;
6029
6030   gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
6031 }
6032
6033 /* Pick proper libcall for satfract_optab.  We need to chose if we do
6034    interclass or intraclass.  */
6035
6036 void
6037 gen_satfract_conv_libfunc (convert_optab tab,
6038                            const char *opname,
6039                            machine_mode tmode,
6040                            machine_mode fmode)
6041 {
6042   if (tmode == fmode)
6043     return;
6044   /* TMODE must be a fixed-point mode.  */
6045   if (!ALL_FIXED_POINT_MODE_P (tmode))
6046     return;
6047
6048   if (GET_MODE_CLASS (tmode) == GET_MODE_CLASS (fmode))
6049     gen_intraclass_conv_libfunc (tab, opname, tmode, fmode);
6050   else
6051     gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
6052 }
6053
6054 /* Pick proper libcall for satfractuns_optab.  */
6055
6056 void
6057 gen_satfractuns_conv_libfunc (convert_optab tab,
6058                               const char *opname,
6059                               machine_mode tmode,
6060                               machine_mode fmode)
6061 {
6062   if (tmode == fmode)
6063     return;
6064   /* TMODE must be a fixed-point mode, and FMODE must be an integer mode. */
6065   if (!(ALL_FIXED_POINT_MODE_P (tmode) && GET_MODE_CLASS (fmode) == MODE_INT))
6066     return;
6067
6068   gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
6069 }
6070
6071 /* Hashtable callbacks for libfunc_decls.  */
6072
6073 struct libfunc_decl_hasher : ggc_hasher<tree>
6074 {
6075   static hashval_t
6076   hash (tree entry)
6077   {
6078     return IDENTIFIER_HASH_VALUE (DECL_NAME (entry));
6079   }
6080
6081   static bool
6082   equal (tree decl, tree name)
6083   {
6084     return DECL_NAME (decl) == name;
6085   }
6086 };
6087
6088 /* A table of previously-created libfuncs, hashed by name.  */
6089 static GTY (()) hash_table<libfunc_decl_hasher> *libfunc_decls;
6090
6091 /* Build a decl for a libfunc named NAME. */
6092
6093 tree
6094 build_libfunc_function (const char *name)
6095 {
6096   tree decl = build_decl (UNKNOWN_LOCATION, FUNCTION_DECL,
6097                           get_identifier (name),
6098                           build_function_type (integer_type_node, NULL_TREE));
6099   /* ??? We don't have any type information except for this is
6100      a function.  Pretend this is "int foo()".  */
6101   DECL_ARTIFICIAL (decl) = 1;
6102   DECL_EXTERNAL (decl) = 1;
6103   TREE_PUBLIC (decl) = 1;
6104   gcc_assert (DECL_ASSEMBLER_NAME (decl));
6105
6106   /* Zap the nonsensical SYMBOL_REF_DECL for this.  What we're left with
6107      are the flags assigned by targetm.encode_section_info.  */
6108   SET_SYMBOL_REF_DECL (XEXP (DECL_RTL (decl), 0), NULL);
6109
6110   return decl;
6111 }
6112
6113 rtx
6114 init_one_libfunc (const char *name)
6115 {
6116   tree id, decl;
6117   hashval_t hash;
6118
6119   if (libfunc_decls == NULL)
6120     libfunc_decls = hash_table<libfunc_decl_hasher>::create_ggc (37);
6121
6122   /* See if we have already created a libfunc decl for this function.  */
6123   id = get_identifier (name);
6124   hash = IDENTIFIER_HASH_VALUE (id);
6125   tree *slot = libfunc_decls->find_slot_with_hash (id, hash, INSERT);
6126   decl = *slot;
6127   if (decl == NULL)
6128     {
6129       /* Create a new decl, so that it can be passed to
6130          targetm.encode_section_info.  */
6131       decl = build_libfunc_function (name);
6132       *slot = decl;
6133     }
6134   return XEXP (DECL_RTL (decl), 0);
6135 }
6136
6137 /* Adjust the assembler name of libfunc NAME to ASMSPEC.  */
6138
6139 rtx
6140 set_user_assembler_libfunc (const char *name, const char *asmspec)
6141 {
6142   tree id, decl;
6143   hashval_t hash;
6144
6145   id = get_identifier (name);
6146   hash = IDENTIFIER_HASH_VALUE (id);
6147   tree *slot = libfunc_decls->find_slot_with_hash (id, hash, NO_INSERT);
6148   gcc_assert (slot);
6149   decl = (tree) *slot;
6150   set_user_assembler_name (decl, asmspec);
6151   return XEXP (DECL_RTL (decl), 0);
6152 }
6153
6154 /* Call this to reset the function entry for one optab (OPTABLE) in mode
6155    MODE to NAME, which should be either 0 or a string constant.  */
6156 void
6157 set_optab_libfunc (optab op, machine_mode mode, const char *name)
6158 {
6159   rtx val;
6160   struct libfunc_entry e;
6161   struct libfunc_entry **slot;
6162
6163   e.op = op;
6164   e.mode1 = mode;
6165   e.mode2 = VOIDmode;
6166
6167   if (name)
6168     val = init_one_libfunc (name);
6169   else
6170     val = 0;
6171   slot = libfunc_hash->find_slot (&e, INSERT);
6172   if (*slot == NULL)
6173     *slot = ggc_alloc<libfunc_entry> ();
6174   (*slot)->op = op;
6175   (*slot)->mode1 = mode;
6176   (*slot)->mode2 = VOIDmode;
6177   (*slot)->libfunc = val;
6178 }
6179
6180 /* Call this to reset the function entry for one conversion optab
6181    (OPTABLE) from mode FMODE to mode TMODE to NAME, which should be
6182    either 0 or a string constant.  */
6183 void
6184 set_conv_libfunc (convert_optab optab, machine_mode tmode,
6185                   machine_mode fmode, const char *name)
6186 {
6187   rtx val;
6188   struct libfunc_entry e;
6189   struct libfunc_entry **slot;
6190
6191   e.op = optab;
6192   e.mode1 = tmode;
6193   e.mode2 = fmode;
6194
6195   if (name)
6196     val = init_one_libfunc (name);
6197   else
6198     val = 0;
6199   slot = libfunc_hash->find_slot (&e, INSERT);
6200   if (*slot == NULL)
6201     *slot = ggc_alloc<libfunc_entry> ();
6202   (*slot)->op = optab;
6203   (*slot)->mode1 = tmode;
6204   (*slot)->mode2 = fmode;
6205   (*slot)->libfunc = val;
6206 }
6207
6208 /* Call this to initialize the contents of the optabs
6209    appropriately for the current target machine.  */
6210
6211 void
6212 init_optabs (void)
6213 {
6214   if (libfunc_hash)
6215     libfunc_hash->empty ();
6216   else
6217     libfunc_hash = hash_table<libfunc_hasher>::create_ggc (10);
6218
6219   /* Fill in the optabs with the insns we support.  */
6220   init_all_optabs (this_fn_optabs);
6221
6222   /* The ffs function operates on `int'.  Fall back on it if we do not
6223      have a libgcc2 function for that width.  */
6224   if (INT_TYPE_SIZE < BITS_PER_WORD)
6225     set_optab_libfunc (ffs_optab, mode_for_size (INT_TYPE_SIZE, MODE_INT, 0),
6226                        "ffs");
6227
6228   /* Explicitly initialize the bswap libfuncs since we need them to be
6229      valid for things other than word_mode.  */
6230   if (targetm.libfunc_gnu_prefix)
6231     {
6232       set_optab_libfunc (bswap_optab, SImode, "__gnu_bswapsi2");
6233       set_optab_libfunc (bswap_optab, DImode, "__gnu_bswapdi2");
6234     }
6235   else
6236     {
6237       set_optab_libfunc (bswap_optab, SImode, "__bswapsi2");
6238       set_optab_libfunc (bswap_optab, DImode, "__bswapdi2");
6239     }
6240
6241   /* Use cabs for double complex abs, since systems generally have cabs.
6242      Don't define any libcall for float complex, so that cabs will be used.  */
6243   if (complex_double_type_node)
6244     set_optab_libfunc (abs_optab, TYPE_MODE (complex_double_type_node),
6245                        "cabs");
6246
6247   abort_libfunc = init_one_libfunc ("abort");
6248   memcpy_libfunc = init_one_libfunc ("memcpy");
6249   memmove_libfunc = init_one_libfunc ("memmove");
6250   memcmp_libfunc = init_one_libfunc ("memcmp");
6251   memset_libfunc = init_one_libfunc ("memset");
6252   setbits_libfunc = init_one_libfunc ("__setbits");
6253
6254 #ifndef DONT_USE_BUILTIN_SETJMP
6255   setjmp_libfunc = init_one_libfunc ("__builtin_setjmp");
6256   longjmp_libfunc = init_one_libfunc ("__builtin_longjmp");
6257 #else
6258   setjmp_libfunc = init_one_libfunc ("setjmp");
6259   longjmp_libfunc = init_one_libfunc ("longjmp");
6260 #endif
6261   unwind_sjlj_register_libfunc = init_one_libfunc ("_Unwind_SjLj_Register");
6262   unwind_sjlj_unregister_libfunc
6263     = init_one_libfunc ("_Unwind_SjLj_Unregister");
6264
6265   /* For function entry/exit instrumentation.  */
6266   profile_function_entry_libfunc
6267     = init_one_libfunc ("__cyg_profile_func_enter");
6268   profile_function_exit_libfunc
6269     = init_one_libfunc ("__cyg_profile_func_exit");
6270
6271   gcov_flush_libfunc = init_one_libfunc ("__gcov_flush");
6272
6273   /* Allow the target to add more libcalls or rename some, etc.  */
6274   targetm.init_libfuncs ();
6275 }
6276
6277 /* Use the current target and options to initialize
6278    TREE_OPTIMIZATION_OPTABS (OPTNODE).  */
6279
6280 void
6281 init_tree_optimization_optabs (tree optnode)
6282 {
6283   /* Quick exit if we have already computed optabs for this target.  */
6284   if (TREE_OPTIMIZATION_BASE_OPTABS (optnode) == this_target_optabs)
6285     return;
6286
6287   /* Forget any previous information and set up for the current target.  */
6288   TREE_OPTIMIZATION_BASE_OPTABS (optnode) = this_target_optabs;
6289   struct target_optabs *tmp_optabs = (struct target_optabs *)
6290     TREE_OPTIMIZATION_OPTABS (optnode);
6291   if (tmp_optabs)
6292     memset (tmp_optabs, 0, sizeof (struct target_optabs));
6293   else
6294     tmp_optabs = ggc_alloc<target_optabs> ();
6295
6296   /* Generate a new set of optabs into tmp_optabs.  */
6297   init_all_optabs (tmp_optabs);
6298
6299   /* If the optabs changed, record it.  */
6300   if (memcmp (tmp_optabs, this_target_optabs, sizeof (struct target_optabs)))
6301     TREE_OPTIMIZATION_OPTABS (optnode) = tmp_optabs;
6302   else
6303     {
6304       TREE_OPTIMIZATION_OPTABS (optnode) = NULL;
6305       ggc_free (tmp_optabs);
6306     }
6307 }
6308
6309 /* A helper function for init_sync_libfuncs.  Using the basename BASE,
6310    install libfuncs into TAB for BASE_N for 1 <= N <= MAX.  */
6311
6312 static void
6313 init_sync_libfuncs_1 (optab tab, const char *base, int max)
6314 {
6315   machine_mode mode;
6316   char buf[64];
6317   size_t len = strlen (base);
6318   int i;
6319
6320   gcc_assert (max <= 8);
6321   gcc_assert (len + 3 < sizeof (buf));
6322
6323   memcpy (buf, base, len);
6324   buf[len] = '_';
6325   buf[len + 1] = '0';
6326   buf[len + 2] = '\0';
6327
6328   mode = QImode;
6329   for (i = 1; i <= max; i *= 2)
6330     {
6331       buf[len + 1] = '0' + i;
6332       set_optab_libfunc (tab, mode, buf);
6333       mode = GET_MODE_2XWIDER_MODE (mode);
6334     }
6335 }
6336
6337 void
6338 init_sync_libfuncs (int max)
6339 {
6340   if (!flag_sync_libcalls)
6341     return;
6342
6343   init_sync_libfuncs_1 (sync_compare_and_swap_optab,
6344                         "__sync_val_compare_and_swap", max);
6345   init_sync_libfuncs_1 (sync_lock_test_and_set_optab,
6346                         "__sync_lock_test_and_set", max);
6347
6348   init_sync_libfuncs_1 (sync_old_add_optab, "__sync_fetch_and_add", max);
6349   init_sync_libfuncs_1 (sync_old_sub_optab, "__sync_fetch_and_sub", max);
6350   init_sync_libfuncs_1 (sync_old_ior_optab, "__sync_fetch_and_or", max);
6351   init_sync_libfuncs_1 (sync_old_and_optab, "__sync_fetch_and_and", max);
6352   init_sync_libfuncs_1 (sync_old_xor_optab, "__sync_fetch_and_xor", max);
6353   init_sync_libfuncs_1 (sync_old_nand_optab, "__sync_fetch_and_nand", max);
6354
6355   init_sync_libfuncs_1 (sync_new_add_optab, "__sync_add_and_fetch", max);
6356   init_sync_libfuncs_1 (sync_new_sub_optab, "__sync_sub_and_fetch", max);
6357   init_sync_libfuncs_1 (sync_new_ior_optab, "__sync_or_and_fetch", max);
6358   init_sync_libfuncs_1 (sync_new_and_optab, "__sync_and_and_fetch", max);
6359   init_sync_libfuncs_1 (sync_new_xor_optab, "__sync_xor_and_fetch", max);
6360   init_sync_libfuncs_1 (sync_new_nand_optab, "__sync_nand_and_fetch", max);
6361 }
6362
6363 /* Print information about the current contents of the optabs on
6364    STDERR.  */
6365
6366 DEBUG_FUNCTION void
6367 debug_optab_libfuncs (void)
6368 {
6369   int i, j, k;
6370
6371   /* Dump the arithmetic optabs.  */
6372   for (i = FIRST_NORM_OPTAB; i <= LAST_NORMLIB_OPTAB; ++i)
6373     for (j = 0; j < NUM_MACHINE_MODES; ++j)
6374       {
6375         rtx l = optab_libfunc ((optab) i, (machine_mode) j);
6376         if (l)
6377           {
6378             gcc_assert (GET_CODE (l) == SYMBOL_REF);
6379             fprintf (stderr, "%s\t%s:\t%s\n",
6380                      GET_RTX_NAME (optab_to_code ((optab) i)),
6381                      GET_MODE_NAME (j),
6382                      XSTR (l, 0));
6383           }
6384       }
6385
6386   /* Dump the conversion optabs.  */
6387   for (i = FIRST_CONV_OPTAB; i <= LAST_CONVLIB_OPTAB; ++i)
6388     for (j = 0; j < NUM_MACHINE_MODES; ++j)
6389       for (k = 0; k < NUM_MACHINE_MODES; ++k)
6390         {
6391           rtx l = convert_optab_libfunc ((optab) i, (machine_mode) j,
6392                                          (machine_mode) k);
6393           if (l)
6394             {
6395               gcc_assert (GET_CODE (l) == SYMBOL_REF);
6396               fprintf (stderr, "%s\t%s\t%s:\t%s\n",
6397                        GET_RTX_NAME (optab_to_code ((optab) i)),
6398                        GET_MODE_NAME (j),
6399                        GET_MODE_NAME (k),
6400                        XSTR (l, 0));
6401             }
6402         }
6403 }
6404
6405 \f
6406 /* Generate insns to trap with code TCODE if OP1 and OP2 satisfy condition
6407    CODE.  Return 0 on failure.  */
6408
6409 rtx
6410 gen_cond_trap (enum rtx_code code, rtx op1, rtx op2, rtx tcode)
6411 {
6412   machine_mode mode = GET_MODE (op1);
6413   enum insn_code icode;
6414   rtx insn;
6415   rtx trap_rtx;
6416
6417   if (mode == VOIDmode)
6418     return 0;
6419
6420   icode = optab_handler (ctrap_optab, mode);
6421   if (icode == CODE_FOR_nothing)
6422     return 0;
6423
6424   /* Some targets only accept a zero trap code.  */
6425   if (!insn_operand_matches (icode, 3, tcode))
6426     return 0;
6427
6428   do_pending_stack_adjust ();
6429   start_sequence ();
6430   prepare_cmp_insn (op1, op2, code, NULL_RTX, false, OPTAB_DIRECT,
6431                     &trap_rtx, &mode);
6432   if (!trap_rtx)
6433     insn = NULL_RTX;
6434   else
6435     insn = GEN_FCN (icode) (trap_rtx, XEXP (trap_rtx, 0), XEXP (trap_rtx, 1),
6436                             tcode);
6437
6438   /* If that failed, then give up.  */
6439   if (insn == 0)
6440     {
6441       end_sequence ();
6442       return 0;
6443     }
6444
6445   emit_insn (insn);
6446   insn = get_insns ();
6447   end_sequence ();
6448   return insn;
6449 }
6450
6451 /* Return rtx code for TCODE. Use UNSIGNEDP to select signed
6452    or unsigned operation code.  */
6453
6454 enum rtx_code
6455 get_rtx_code (enum tree_code tcode, bool unsignedp)
6456 {
6457   enum rtx_code code;
6458   switch (tcode)
6459     {
6460     case EQ_EXPR:
6461       code = EQ;
6462       break;
6463     case NE_EXPR:
6464       code = NE;
6465       break;
6466     case LT_EXPR:
6467       code = unsignedp ? LTU : LT;
6468       break;
6469     case LE_EXPR:
6470       code = unsignedp ? LEU : LE;
6471       break;
6472     case GT_EXPR:
6473       code = unsignedp ? GTU : GT;
6474       break;
6475     case GE_EXPR:
6476       code = unsignedp ? GEU : GE;
6477       break;
6478
6479     case UNORDERED_EXPR:
6480       code = UNORDERED;
6481       break;
6482     case ORDERED_EXPR:
6483       code = ORDERED;
6484       break;
6485     case UNLT_EXPR:
6486       code = UNLT;
6487       break;
6488     case UNLE_EXPR:
6489       code = UNLE;
6490       break;
6491     case UNGT_EXPR:
6492       code = UNGT;
6493       break;
6494     case UNGE_EXPR:
6495       code = UNGE;
6496       break;
6497     case UNEQ_EXPR:
6498       code = UNEQ;
6499       break;
6500     case LTGT_EXPR:
6501       code = LTGT;
6502       break;
6503
6504     case BIT_AND_EXPR:
6505       code = AND;
6506       break;
6507
6508     case BIT_IOR_EXPR:
6509       code = IOR;
6510       break;
6511
6512     default:
6513       gcc_unreachable ();
6514     }
6515   return code;
6516 }
6517
6518 /* Return comparison rtx for COND. Use UNSIGNEDP to select signed or
6519    unsigned operators. Do not generate compare instruction.  */
6520
6521 static rtx
6522 vector_compare_rtx (enum tree_code tcode, tree t_op0, tree t_op1,
6523                     bool unsignedp, enum insn_code icode)
6524 {
6525   struct expand_operand ops[2];
6526   rtx rtx_op0, rtx_op1;
6527   machine_mode m0, m1;
6528   enum rtx_code rcode = get_rtx_code (tcode, unsignedp);
6529
6530   gcc_assert (TREE_CODE_CLASS (tcode) == tcc_comparison);
6531
6532   /* Expand operands.  For vector types with scalar modes, e.g. where int64x1_t
6533      has mode DImode, this can produce a constant RTX of mode VOIDmode; in such
6534      cases, use the original mode.  */
6535   rtx_op0 = expand_expr (t_op0, NULL_RTX, TYPE_MODE (TREE_TYPE (t_op0)),
6536                          EXPAND_STACK_PARM);
6537   m0 = GET_MODE (rtx_op0);
6538   if (m0 == VOIDmode)
6539     m0 = TYPE_MODE (TREE_TYPE (t_op0));
6540
6541   rtx_op1 = expand_expr (t_op1, NULL_RTX, TYPE_MODE (TREE_TYPE (t_op1)),
6542                          EXPAND_STACK_PARM);
6543   m1 = GET_MODE (rtx_op1);
6544   if (m1 == VOIDmode)
6545     m1 = TYPE_MODE (TREE_TYPE (t_op1));
6546
6547   create_input_operand (&ops[0], rtx_op0, m0);
6548   create_input_operand (&ops[1], rtx_op1, m1);
6549   if (!maybe_legitimize_operands (icode, 4, 2, ops))
6550     gcc_unreachable ();
6551   return gen_rtx_fmt_ee (rcode, VOIDmode, ops[0].value, ops[1].value);
6552 }
6553
6554 /* Return true if VEC_PERM_EXPR of arbitrary input vectors can be expanded using
6555    SIMD extensions of the CPU.  SEL may be NULL, which stands for an unknown
6556    constant.  Note that additional permutations representing whole-vector shifts
6557    may also be handled via the vec_shr optab, but only where the second input
6558    vector is entirely constant zeroes; this case is not dealt with here.  */
6559
6560 bool
6561 can_vec_perm_p (machine_mode mode, bool variable,
6562                 const unsigned char *sel)
6563 {
6564   machine_mode qimode;
6565
6566   /* If the target doesn't implement a vector mode for the vector type,
6567      then no operations are supported.  */
6568   if (!VECTOR_MODE_P (mode))
6569     return false;
6570
6571   if (!variable)
6572     {
6573       if (direct_optab_handler (vec_perm_const_optab, mode) != CODE_FOR_nothing
6574           && (sel == NULL
6575               || targetm.vectorize.vec_perm_const_ok == NULL
6576               || targetm.vectorize.vec_perm_const_ok (mode, sel)))
6577         return true;
6578     }
6579
6580   if (direct_optab_handler (vec_perm_optab, mode) != CODE_FOR_nothing)
6581     return true;
6582
6583   /* We allow fallback to a QI vector mode, and adjust the mask.  */
6584   if (GET_MODE_INNER (mode) == QImode)
6585     return false;
6586   qimode = mode_for_vector (QImode, GET_MODE_SIZE (mode));
6587   if (!VECTOR_MODE_P (qimode))
6588     return false;
6589
6590   /* ??? For completeness, we ought to check the QImode version of
6591       vec_perm_const_optab.  But all users of this implicit lowering
6592       feature implement the variable vec_perm_optab.  */
6593   if (direct_optab_handler (vec_perm_optab, qimode) == CODE_FOR_nothing)
6594     return false;
6595
6596   /* In order to support the lowering of variable permutations,
6597      we need to support shifts and adds.  */
6598   if (variable)
6599     {
6600       if (GET_MODE_UNIT_SIZE (mode) > 2
6601           && optab_handler (ashl_optab, mode) == CODE_FOR_nothing
6602           && optab_handler (vashl_optab, mode) == CODE_FOR_nothing)
6603         return false;
6604       if (optab_handler (add_optab, qimode) == CODE_FOR_nothing)
6605         return false;
6606     }
6607
6608   return true;
6609 }
6610
6611 /* Checks if vec_perm mask SEL is a constant equivalent to a shift of the first
6612    vec_perm operand, assuming the second operand is a constant vector of zeroes.
6613    Return the shift distance in bits if so, or NULL_RTX if the vec_perm is not a
6614    shift.  */
6615 static rtx
6616 shift_amt_for_vec_perm_mask (rtx sel)
6617 {
6618   unsigned int i, first, nelt = GET_MODE_NUNITS (GET_MODE (sel));
6619   unsigned int bitsize = GET_MODE_BITSIZE (GET_MODE_INNER (GET_MODE (sel)));
6620
6621   if (GET_CODE (sel) != CONST_VECTOR)
6622     return NULL_RTX;
6623
6624   first = INTVAL (CONST_VECTOR_ELT (sel, 0));
6625   if (first >= 2*nelt)
6626     return NULL_RTX;
6627   for (i = 1; i < nelt; i++)
6628     {
6629       int idx = INTVAL (CONST_VECTOR_ELT (sel, i));
6630       unsigned int expected = (i + first) & (2 * nelt - 1);
6631       /* Indices into the second vector are all equivalent.  */
6632       if (idx < 0 || (MIN (nelt, (unsigned) idx) != MIN (nelt, expected)))
6633         return NULL_RTX;
6634     }
6635
6636   return GEN_INT (first * bitsize);
6637 }
6638
6639 /* A subroutine of expand_vec_perm for expanding one vec_perm insn.  */
6640
6641 static rtx
6642 expand_vec_perm_1 (enum insn_code icode, rtx target,
6643                    rtx v0, rtx v1, rtx sel)
6644 {
6645   machine_mode tmode = GET_MODE (target);
6646   machine_mode smode = GET_MODE (sel);
6647   struct expand_operand ops[4];
6648
6649   create_output_operand (&ops[0], target, tmode);
6650   create_input_operand (&ops[3], sel, smode);
6651
6652   /* Make an effort to preserve v0 == v1.  The target expander is able to
6653      rely on this to determine if we're permuting a single input operand.  */
6654   if (rtx_equal_p (v0, v1))
6655     {
6656       if (!insn_operand_matches (icode, 1, v0))
6657         v0 = force_reg (tmode, v0);
6658       gcc_checking_assert (insn_operand_matches (icode, 1, v0));
6659       gcc_checking_assert (insn_operand_matches (icode, 2, v0));
6660
6661       create_fixed_operand (&ops[1], v0);
6662       create_fixed_operand (&ops[2], v0);
6663     }
6664   else
6665     {
6666       create_input_operand (&ops[1], v0, tmode);
6667       /* See if this can be handled with a vec_shr.  We only do this if the
6668          second vector is all zeroes.  */
6669       enum insn_code shift_code = optab_handler (vec_shr_optab, GET_MODE (v0));
6670       if (v1 == CONST0_RTX (GET_MODE (v1)) && shift_code)
6671         if (rtx shift_amt = shift_amt_for_vec_perm_mask (sel))
6672           {
6673             create_convert_operand_from_type (&ops[2], shift_amt,
6674                                               sizetype_tab[(int) stk_sizetype]);
6675             if (maybe_expand_insn (shift_code, 3, ops))
6676               return ops[0].value;
6677           }
6678       create_input_operand (&ops[2], v1, tmode);
6679     }
6680
6681   if (maybe_expand_insn (icode, 4, ops))
6682     return ops[0].value;
6683   return NULL_RTX;
6684 }
6685
6686 /* Generate instructions for vec_perm optab given its mode
6687    and three operands.  */
6688
6689 rtx
6690 expand_vec_perm (machine_mode mode, rtx v0, rtx v1, rtx sel, rtx target)
6691 {
6692   enum insn_code icode;
6693   machine_mode qimode;
6694   unsigned int i, w, e, u;
6695   rtx tmp, sel_qi = NULL;
6696   rtvec vec;
6697
6698   if (!target || GET_MODE (target) != mode)
6699     target = gen_reg_rtx (mode);
6700
6701   w = GET_MODE_SIZE (mode);
6702   e = GET_MODE_NUNITS (mode);
6703   u = GET_MODE_UNIT_SIZE (mode);
6704
6705   /* Set QIMODE to a different vector mode with byte elements.
6706      If no such mode, or if MODE already has byte elements, use VOIDmode.  */
6707   qimode = VOIDmode;
6708   if (GET_MODE_INNER (mode) != QImode)
6709     {
6710       qimode = mode_for_vector (QImode, w);
6711       if (!VECTOR_MODE_P (qimode))
6712         qimode = VOIDmode;
6713     }
6714
6715   /* If the input is a constant, expand it specially.  */
6716   gcc_assert (GET_MODE_CLASS (GET_MODE (sel)) == MODE_VECTOR_INT);
6717   if (GET_CODE (sel) == CONST_VECTOR)
6718     {
6719       icode = direct_optab_handler (vec_perm_const_optab, mode);
6720       if (icode != CODE_FOR_nothing)
6721         {
6722           tmp = expand_vec_perm_1 (icode, target, v0, v1, sel);
6723           if (tmp)
6724             return tmp;
6725         }
6726
6727       /* Fall back to a constant byte-based permutation.  */
6728       if (qimode != VOIDmode)
6729         {
6730           vec = rtvec_alloc (w);
6731           for (i = 0; i < e; ++i)
6732             {
6733               unsigned int j, this_e;
6734
6735               this_e = INTVAL (CONST_VECTOR_ELT (sel, i));
6736               this_e &= 2 * e - 1;
6737               this_e *= u;
6738
6739               for (j = 0; j < u; ++j)
6740                 RTVEC_ELT (vec, i * u + j) = GEN_INT (this_e + j);
6741             }
6742           sel_qi = gen_rtx_CONST_VECTOR (qimode, vec);
6743
6744           icode = direct_optab_handler (vec_perm_const_optab, qimode);
6745           if (icode != CODE_FOR_nothing)
6746             {
6747               tmp = mode != qimode ? gen_reg_rtx (qimode) : target;
6748               tmp = expand_vec_perm_1 (icode, tmp, gen_lowpart (qimode, v0),
6749                                        gen_lowpart (qimode, v1), sel_qi);
6750               if (tmp)
6751                 return gen_lowpart (mode, tmp);
6752             }
6753         }
6754     }
6755
6756   /* Otherwise expand as a fully variable permuation.  */
6757   icode = direct_optab_handler (vec_perm_optab, mode);
6758   if (icode != CODE_FOR_nothing)
6759     {
6760       tmp = expand_vec_perm_1 (icode, target, v0, v1, sel);
6761       if (tmp)
6762         return tmp;
6763     }
6764
6765   /* As a special case to aid several targets, lower the element-based
6766      permutation to a byte-based permutation and try again.  */
6767   if (qimode == VOIDmode)
6768     return NULL_RTX;
6769   icode = direct_optab_handler (vec_perm_optab, qimode);
6770   if (icode == CODE_FOR_nothing)
6771     return NULL_RTX;
6772
6773   if (sel_qi == NULL)
6774     {
6775       /* Multiply each element by its byte size.  */
6776       machine_mode selmode = GET_MODE (sel);
6777       if (u == 2)
6778         sel = expand_simple_binop (selmode, PLUS, sel, sel,
6779                                    NULL, 0, OPTAB_DIRECT);
6780       else
6781         sel = expand_simple_binop (selmode, ASHIFT, sel,
6782                                    GEN_INT (exact_log2 (u)),
6783                                    NULL, 0, OPTAB_DIRECT);
6784       gcc_assert (sel != NULL);
6785
6786       /* Broadcast the low byte each element into each of its bytes.  */
6787       vec = rtvec_alloc (w);
6788       for (i = 0; i < w; ++i)
6789         {
6790           int this_e = i / u * u;
6791           if (BYTES_BIG_ENDIAN)
6792             this_e += u - 1;
6793           RTVEC_ELT (vec, i) = GEN_INT (this_e);
6794         }
6795       tmp = gen_rtx_CONST_VECTOR (qimode, vec);
6796       sel = gen_lowpart (qimode, sel);
6797       sel = expand_vec_perm (qimode, sel, sel, tmp, NULL);
6798       gcc_assert (sel != NULL);
6799
6800       /* Add the byte offset to each byte element.  */
6801       /* Note that the definition of the indicies here is memory ordering,
6802          so there should be no difference between big and little endian.  */
6803       vec = rtvec_alloc (w);
6804       for (i = 0; i < w; ++i)
6805         RTVEC_ELT (vec, i) = GEN_INT (i % u);
6806       tmp = gen_rtx_CONST_VECTOR (qimode, vec);
6807       sel_qi = expand_simple_binop (qimode, PLUS, sel, tmp,
6808                                     sel, 0, OPTAB_DIRECT);
6809       gcc_assert (sel_qi != NULL);
6810     }
6811
6812   tmp = mode != qimode ? gen_reg_rtx (qimode) : target;
6813   tmp = expand_vec_perm_1 (icode, tmp, gen_lowpart (qimode, v0),
6814                            gen_lowpart (qimode, v1), sel_qi);
6815   if (tmp)
6816     tmp = gen_lowpart (mode, tmp);
6817   return tmp;
6818 }
6819
6820 /* Return insn code for a conditional operator with a comparison in
6821    mode CMODE, unsigned if UNS is true, resulting in a value of mode VMODE.  */
6822
6823 static inline enum insn_code
6824 get_vcond_icode (machine_mode vmode, machine_mode cmode, bool uns)
6825 {
6826   enum insn_code icode = CODE_FOR_nothing;
6827   if (uns)
6828     icode = convert_optab_handler (vcondu_optab, vmode, cmode);
6829   else
6830     icode = convert_optab_handler (vcond_optab, vmode, cmode);
6831   return icode;
6832 }
6833
6834 /* Return TRUE iff, appropriate vector insns are available
6835    for vector cond expr with vector type VALUE_TYPE and a comparison
6836    with operand vector types in CMP_OP_TYPE.  */
6837
6838 bool
6839 expand_vec_cond_expr_p (tree value_type, tree cmp_op_type)
6840 {
6841   machine_mode value_mode = TYPE_MODE (value_type);
6842   machine_mode cmp_op_mode = TYPE_MODE (cmp_op_type);
6843   if (GET_MODE_SIZE (value_mode) != GET_MODE_SIZE (cmp_op_mode)
6844       || GET_MODE_NUNITS (value_mode) != GET_MODE_NUNITS (cmp_op_mode)
6845       || get_vcond_icode (TYPE_MODE (value_type), TYPE_MODE (cmp_op_type),
6846                           TYPE_UNSIGNED (cmp_op_type)) == CODE_FOR_nothing)
6847     return false;
6848   return true;
6849 }
6850
6851 /* Generate insns for a VEC_COND_EXPR, given its TYPE and its
6852    three operands.  */
6853
6854 rtx
6855 expand_vec_cond_expr (tree vec_cond_type, tree op0, tree op1, tree op2,
6856                       rtx target)
6857 {
6858   struct expand_operand ops[6];
6859   enum insn_code icode;
6860   rtx comparison, rtx_op1, rtx_op2;
6861   machine_mode mode = TYPE_MODE (vec_cond_type);
6862   machine_mode cmp_op_mode;
6863   bool unsignedp;
6864   tree op0a, op0b;
6865   enum tree_code tcode;
6866
6867   if (COMPARISON_CLASS_P (op0))
6868     {
6869       op0a = TREE_OPERAND (op0, 0);
6870       op0b = TREE_OPERAND (op0, 1);
6871       tcode = TREE_CODE (op0);
6872     }
6873   else
6874     {
6875       /* Fake op0 < 0.  */
6876       gcc_assert (!TYPE_UNSIGNED (TREE_TYPE (op0)));
6877       op0a = op0;
6878       op0b = build_zero_cst (TREE_TYPE (op0));
6879       tcode = LT_EXPR;
6880     }
6881   unsignedp = TYPE_UNSIGNED (TREE_TYPE (op0a));
6882   cmp_op_mode = TYPE_MODE (TREE_TYPE (op0a));
6883
6884
6885   gcc_assert (GET_MODE_SIZE (mode) == GET_MODE_SIZE (cmp_op_mode)
6886               && GET_MODE_NUNITS (mode) == GET_MODE_NUNITS (cmp_op_mode));
6887
6888   icode = get_vcond_icode (mode, cmp_op_mode, unsignedp);
6889   if (icode == CODE_FOR_nothing)
6890     return 0;
6891
6892   comparison = vector_compare_rtx (tcode, op0a, op0b, unsignedp, icode);
6893   rtx_op1 = expand_normal (op1);
6894   rtx_op2 = expand_normal (op2);
6895
6896   create_output_operand (&ops[0], target, mode);
6897   create_input_operand (&ops[1], rtx_op1, mode);
6898   create_input_operand (&ops[2], rtx_op2, mode);
6899   create_fixed_operand (&ops[3], comparison);
6900   create_fixed_operand (&ops[4], XEXP (comparison, 0));
6901   create_fixed_operand (&ops[5], XEXP (comparison, 1));
6902   expand_insn (icode, 6, ops);
6903   return ops[0].value;
6904 }
6905
6906 /* Return non-zero if a highpart multiply is supported of can be synthisized.
6907    For the benefit of expand_mult_highpart, the return value is 1 for direct,
6908    2 for even/odd widening, and 3 for hi/lo widening.  */
6909
6910 int
6911 can_mult_highpart_p (machine_mode mode, bool uns_p)
6912 {
6913   optab op;
6914   unsigned char *sel;
6915   unsigned i, nunits;
6916
6917   op = uns_p ? umul_highpart_optab : smul_highpart_optab;
6918   if (optab_handler (op, mode) != CODE_FOR_nothing)
6919     return 1;
6920
6921   /* If the mode is an integral vector, synth from widening operations.  */
6922   if (GET_MODE_CLASS (mode) != MODE_VECTOR_INT)
6923     return 0;
6924
6925   nunits = GET_MODE_NUNITS (mode);
6926   sel = XALLOCAVEC (unsigned char, nunits);
6927
6928   op = uns_p ? vec_widen_umult_even_optab : vec_widen_smult_even_optab;
6929   if (optab_handler (op, mode) != CODE_FOR_nothing)
6930     {
6931       op = uns_p ? vec_widen_umult_odd_optab : vec_widen_smult_odd_optab;
6932       if (optab_handler (op, mode) != CODE_FOR_nothing)
6933         {
6934           for (i = 0; i < nunits; ++i)
6935             sel[i] = !BYTES_BIG_ENDIAN + (i & ~1) + ((i & 1) ? nunits : 0);
6936           if (can_vec_perm_p (mode, false, sel))
6937             return 2;
6938         }
6939     }
6940
6941   op = uns_p ? vec_widen_umult_hi_optab : vec_widen_smult_hi_optab;
6942   if (optab_handler (op, mode) != CODE_FOR_nothing)
6943     {
6944       op = uns_p ? vec_widen_umult_lo_optab : vec_widen_smult_lo_optab;
6945       if (optab_handler (op, mode) != CODE_FOR_nothing)
6946         {
6947           for (i = 0; i < nunits; ++i)
6948             sel[i] = 2 * i + (BYTES_BIG_ENDIAN ? 0 : 1);
6949           if (can_vec_perm_p (mode, false, sel))
6950             return 3;
6951         }
6952     }
6953
6954   return 0;
6955 }
6956
6957 /* Expand a highpart multiply.  */
6958
6959 rtx
6960 expand_mult_highpart (machine_mode mode, rtx op0, rtx op1,
6961                       rtx target, bool uns_p)
6962 {
6963   struct expand_operand eops[3];
6964   enum insn_code icode;
6965   int method, i, nunits;
6966   machine_mode wmode;
6967   rtx m1, m2, perm;
6968   optab tab1, tab2;
6969   rtvec v;
6970
6971   method = can_mult_highpart_p (mode, uns_p);
6972   switch (method)
6973     {
6974     case 0:
6975       return NULL_RTX;
6976     case 1:
6977       tab1 = uns_p ? umul_highpart_optab : smul_highpart_optab;
6978       return expand_binop (mode, tab1, op0, op1, target, uns_p,
6979                            OPTAB_LIB_WIDEN);
6980     case 2:
6981       tab1 = uns_p ? vec_widen_umult_even_optab : vec_widen_smult_even_optab;
6982       tab2 = uns_p ? vec_widen_umult_odd_optab : vec_widen_smult_odd_optab;
6983       break;
6984     case 3:
6985       tab1 = uns_p ? vec_widen_umult_lo_optab : vec_widen_smult_lo_optab;
6986       tab2 = uns_p ? vec_widen_umult_hi_optab : vec_widen_smult_hi_optab;
6987       if (BYTES_BIG_ENDIAN)
6988         {
6989           optab t = tab1;
6990           tab1 = tab2;
6991           tab2 = t;
6992         }
6993       break;
6994     default:
6995       gcc_unreachable ();
6996     }
6997
6998   icode = optab_handler (tab1, mode);
6999   nunits = GET_MODE_NUNITS (mode);
7000   wmode = insn_data[icode].operand[0].mode;
7001   gcc_checking_assert (2 * GET_MODE_NUNITS (wmode) == nunits);
7002   gcc_checking_assert (GET_MODE_SIZE (wmode) == GET_MODE_SIZE (mode));
7003
7004   create_output_operand (&eops[0], gen_reg_rtx (wmode), wmode);
7005   create_input_operand (&eops[1], op0, mode);
7006   create_input_operand (&eops[2], op1, mode);
7007   expand_insn (icode, 3, eops);
7008   m1 = gen_lowpart (mode, eops[0].value);
7009
7010   create_output_operand (&eops[0], gen_reg_rtx (wmode), wmode);
7011   create_input_operand (&eops[1], op0, mode);
7012   create_input_operand (&eops[2], op1, mode);
7013   expand_insn (optab_handler (tab2, mode), 3, eops);
7014   m2 = gen_lowpart (mode, eops[0].value);
7015
7016   v = rtvec_alloc (nunits);
7017   if (method == 2)
7018     {
7019       for (i = 0; i < nunits; ++i)
7020         RTVEC_ELT (v, i) = GEN_INT (!BYTES_BIG_ENDIAN + (i & ~1)
7021                                     + ((i & 1) ? nunits : 0));
7022     }
7023   else
7024     {
7025       for (i = 0; i < nunits; ++i)
7026         RTVEC_ELT (v, i) = GEN_INT (2 * i + (BYTES_BIG_ENDIAN ? 0 : 1));
7027     }
7028   perm = gen_rtx_CONST_VECTOR (mode, v);
7029
7030   return expand_vec_perm (mode, m1, m2, perm, target);
7031 }
7032
7033 /* Return true if target supports vector masked load/store for mode.  */
7034 bool
7035 can_vec_mask_load_store_p (machine_mode mode, bool is_load)
7036 {
7037   optab op = is_load ? maskload_optab : maskstore_optab;
7038   machine_mode vmode;
7039   unsigned int vector_sizes;
7040
7041   /* If mode is vector mode, check it directly.  */
7042   if (VECTOR_MODE_P (mode))
7043     return optab_handler (op, mode) != CODE_FOR_nothing;
7044
7045   /* Otherwise, return true if there is some vector mode with
7046      the mask load/store supported.  */
7047
7048   /* See if there is any chance the mask load or store might be
7049      vectorized.  If not, punt.  */
7050   vmode = targetm.vectorize.preferred_simd_mode (mode);
7051   if (!VECTOR_MODE_P (vmode))
7052     return false;
7053
7054   if (optab_handler (op, vmode) != CODE_FOR_nothing)
7055     return true;
7056
7057   vector_sizes = targetm.vectorize.autovectorize_vector_sizes ();
7058   while (vector_sizes != 0)
7059     {
7060       unsigned int cur = 1 << floor_log2 (vector_sizes);
7061       vector_sizes &= ~cur;
7062       if (cur <= GET_MODE_SIZE (mode))
7063         continue;
7064       vmode = mode_for_vector (mode, cur / GET_MODE_SIZE (mode));
7065       if (VECTOR_MODE_P (vmode)
7066           && optab_handler (op, vmode) != CODE_FOR_nothing)
7067         return true;
7068     }
7069   return false;
7070 }
7071 \f
7072 /* Return true if there is a compare_and_swap pattern.  */
7073
7074 bool
7075 can_compare_and_swap_p (machine_mode mode, bool allow_libcall)
7076 {
7077   enum insn_code icode;
7078
7079   /* Check for __atomic_compare_and_swap.  */
7080   icode = direct_optab_handler (atomic_compare_and_swap_optab, mode);
7081   if (icode != CODE_FOR_nothing)
7082     return true;
7083
7084   /* Check for __sync_compare_and_swap.  */
7085   icode = optab_handler (sync_compare_and_swap_optab, mode);
7086   if (icode != CODE_FOR_nothing)
7087     return true;
7088   if (allow_libcall && optab_libfunc (sync_compare_and_swap_optab, mode))
7089     return true;
7090
7091   /* No inline compare and swap.  */
7092   return false;
7093 }
7094
7095 /* Return true if an atomic exchange can be performed.  */
7096
7097 bool
7098 can_atomic_exchange_p (machine_mode mode, bool allow_libcall)
7099 {
7100   enum insn_code icode;
7101
7102   /* Check for __atomic_exchange.  */
7103   icode = direct_optab_handler (atomic_exchange_optab, mode);
7104   if (icode != CODE_FOR_nothing)
7105     return true;
7106
7107   /* Don't check __sync_test_and_set, as on some platforms that
7108      has reduced functionality.  Targets that really do support
7109      a proper exchange should simply be updated to the __atomics.  */
7110
7111   return can_compare_and_swap_p (mode, allow_libcall);
7112 }
7113
7114
7115 /* Helper function to find the MODE_CC set in a sync_compare_and_swap
7116    pattern.  */
7117
7118 static void
7119 find_cc_set (rtx x, const_rtx pat, void *data)
7120 {
7121   if (REG_P (x) && GET_MODE_CLASS (GET_MODE (x)) == MODE_CC
7122       && GET_CODE (pat) == SET)
7123     {
7124       rtx *p_cc_reg = (rtx *) data;
7125       gcc_assert (!*p_cc_reg);
7126       *p_cc_reg = x;
7127     }
7128 }
7129
7130 /* This is a helper function for the other atomic operations.  This function
7131    emits a loop that contains SEQ that iterates until a compare-and-swap
7132    operation at the end succeeds.  MEM is the memory to be modified.  SEQ is
7133    a set of instructions that takes a value from OLD_REG as an input and
7134    produces a value in NEW_REG as an output.  Before SEQ, OLD_REG will be
7135    set to the current contents of MEM.  After SEQ, a compare-and-swap will
7136    attempt to update MEM with NEW_REG.  The function returns true when the
7137    loop was generated successfully.  */
7138
7139 static bool
7140 expand_compare_and_swap_loop (rtx mem, rtx old_reg, rtx new_reg, rtx seq)
7141 {
7142   machine_mode mode = GET_MODE (mem);
7143   rtx_code_label *label;
7144   rtx cmp_reg, success, oldval;
7145
7146   /* The loop we want to generate looks like
7147
7148         cmp_reg = mem;
7149       label:
7150         old_reg = cmp_reg;
7151         seq;
7152         (success, cmp_reg) = compare-and-swap(mem, old_reg, new_reg)
7153         if (success)
7154           goto label;
7155
7156      Note that we only do the plain load from memory once.  Subsequent
7157      iterations use the value loaded by the compare-and-swap pattern.  */
7158
7159   label = gen_label_rtx ();
7160   cmp_reg = gen_reg_rtx (mode);
7161
7162   emit_move_insn (cmp_reg, mem);
7163   emit_label (label);
7164   emit_move_insn (old_reg, cmp_reg);
7165   if (seq)
7166     emit_insn (seq);
7167
7168   success = NULL_RTX;
7169   oldval = cmp_reg;
7170   if (!expand_atomic_compare_and_swap (&success, &oldval, mem, old_reg,
7171                                        new_reg, false, MEMMODEL_SYNC_SEQ_CST,
7172                                        MEMMODEL_RELAXED))
7173     return false;
7174
7175   if (oldval != cmp_reg)
7176     emit_move_insn (cmp_reg, oldval);
7177
7178   /* Mark this jump predicted not taken.  */
7179   emit_cmp_and_jump_insns (success, const0_rtx, EQ, const0_rtx,
7180                            GET_MODE (success), 1, label, 0);
7181   return true;
7182 }
7183
7184
7185 /* This function tries to emit an atomic_exchange intruction.  VAL is written
7186    to *MEM using memory model MODEL. The previous contents of *MEM are returned,
7187    using TARGET if possible.  */
7188
7189 static rtx
7190 maybe_emit_atomic_exchange (rtx target, rtx mem, rtx val, enum memmodel model)
7191 {
7192   machine_mode mode = GET_MODE (mem);
7193   enum insn_code icode;
7194
7195   /* If the target supports the exchange directly, great.  */
7196   icode = direct_optab_handler (atomic_exchange_optab, mode);
7197   if (icode != CODE_FOR_nothing)
7198     {
7199       struct expand_operand ops[4];
7200
7201       create_output_operand (&ops[0], target, mode);
7202       create_fixed_operand (&ops[1], mem);
7203       create_input_operand (&ops[2], val, mode);
7204       create_integer_operand (&ops[3], model);
7205       if (maybe_expand_insn (icode, 4, ops))
7206         return ops[0].value;
7207     }
7208
7209   return NULL_RTX;
7210 }
7211
7212 /* This function tries to implement an atomic exchange operation using
7213    __sync_lock_test_and_set. VAL is written to *MEM using memory model MODEL.
7214    The previous contents of *MEM are returned, using TARGET if possible.
7215    Since this instructionn is an acquire barrier only, stronger memory
7216    models may require additional barriers to be emitted.  */
7217
7218 static rtx
7219 maybe_emit_sync_lock_test_and_set (rtx target, rtx mem, rtx val,
7220                                    enum memmodel model)
7221 {
7222   machine_mode mode = GET_MODE (mem);
7223   enum insn_code icode;
7224   rtx_insn *last_insn = get_last_insn ();
7225
7226   icode = optab_handler (sync_lock_test_and_set_optab, mode);
7227
7228   /* Legacy sync_lock_test_and_set is an acquire barrier.  If the pattern
7229      exists, and the memory model is stronger than acquire, add a release
7230      barrier before the instruction.  */
7231
7232   if (is_mm_seq_cst (model) || is_mm_release (model) || is_mm_acq_rel (model))
7233     expand_mem_thread_fence (model);
7234
7235   if (icode != CODE_FOR_nothing)
7236     {
7237       struct expand_operand ops[3];
7238       create_output_operand (&ops[0], target, mode);
7239       create_fixed_operand (&ops[1], mem);
7240       create_input_operand (&ops[2], val, mode);
7241       if (maybe_expand_insn (icode, 3, ops))
7242         return ops[0].value;
7243     }
7244
7245   /* If an external test-and-set libcall is provided, use that instead of
7246      any external compare-and-swap that we might get from the compare-and-
7247      swap-loop expansion later.  */
7248   if (!can_compare_and_swap_p (mode, false))
7249     {
7250       rtx libfunc = optab_libfunc (sync_lock_test_and_set_optab, mode);
7251       if (libfunc != NULL)
7252         {
7253           rtx addr;
7254
7255           addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
7256           return emit_library_call_value (libfunc, NULL_RTX, LCT_NORMAL,
7257                                           mode, 2, addr, ptr_mode,
7258                                           val, mode);
7259         }
7260     }
7261
7262   /* If the test_and_set can't be emitted, eliminate any barrier that might
7263      have been emitted.  */
7264   delete_insns_since (last_insn);
7265   return NULL_RTX;
7266 }
7267
7268 /* This function tries to implement an atomic exchange operation using a
7269    compare_and_swap loop. VAL is written to *MEM.  The previous contents of
7270    *MEM are returned, using TARGET if possible.  No memory model is required
7271    since a compare_and_swap loop is seq-cst.  */
7272
7273 static rtx
7274 maybe_emit_compare_and_swap_exchange_loop (rtx target, rtx mem, rtx val)
7275 {
7276   machine_mode mode = GET_MODE (mem);
7277
7278   if (can_compare_and_swap_p (mode, true))
7279     {
7280       if (!target || !register_operand (target, mode))
7281         target = gen_reg_rtx (mode);
7282       if (expand_compare_and_swap_loop (mem, target, val, NULL_RTX))
7283         return target;
7284     }
7285
7286   return NULL_RTX;
7287 }
7288
7289 /* This function tries to implement an atomic test-and-set operation
7290    using the atomic_test_and_set instruction pattern.  A boolean value
7291    is returned from the operation, using TARGET if possible.  */
7292
7293 #ifndef HAVE_atomic_test_and_set
7294 #define HAVE_atomic_test_and_set 0
7295 #define CODE_FOR_atomic_test_and_set CODE_FOR_nothing
7296 #endif
7297
7298 static rtx
7299 maybe_emit_atomic_test_and_set (rtx target, rtx mem, enum memmodel model)
7300 {
7301   machine_mode pat_bool_mode;
7302   struct expand_operand ops[3];
7303
7304   if (!HAVE_atomic_test_and_set)
7305     return NULL_RTX;
7306
7307   /* While we always get QImode from __atomic_test_and_set, we get
7308      other memory modes from __sync_lock_test_and_set.  Note that we
7309      use no endian adjustment here.  This matches the 4.6 behavior
7310      in the Sparc backend.  */
7311   gcc_checking_assert
7312     (insn_data[CODE_FOR_atomic_test_and_set].operand[1].mode == QImode);
7313   if (GET_MODE (mem) != QImode)
7314     mem = adjust_address_nv (mem, QImode, 0);
7315
7316   pat_bool_mode = insn_data[CODE_FOR_atomic_test_and_set].operand[0].mode;
7317   create_output_operand (&ops[0], target, pat_bool_mode);
7318   create_fixed_operand (&ops[1], mem);
7319   create_integer_operand (&ops[2], model);
7320
7321   if (maybe_expand_insn (CODE_FOR_atomic_test_and_set, 3, ops))
7322     return ops[0].value;
7323   return NULL_RTX;
7324 }
7325
7326 /* This function expands the legacy _sync_lock test_and_set operation which is
7327    generally an atomic exchange.  Some limited targets only allow the
7328    constant 1 to be stored.  This is an ACQUIRE operation.
7329
7330    TARGET is an optional place to stick the return value.
7331    MEM is where VAL is stored.  */
7332
7333 rtx
7334 expand_sync_lock_test_and_set (rtx target, rtx mem, rtx val)
7335 {
7336   rtx ret;
7337
7338   /* Try an atomic_exchange first.  */
7339   ret = maybe_emit_atomic_exchange (target, mem, val, MEMMODEL_SYNC_ACQUIRE);
7340   if (ret)
7341     return ret;
7342
7343   ret = maybe_emit_sync_lock_test_and_set (target, mem, val,
7344                                            MEMMODEL_SYNC_ACQUIRE);
7345   if (ret)
7346     return ret;
7347
7348   ret = maybe_emit_compare_and_swap_exchange_loop (target, mem, val);
7349   if (ret)
7350     return ret;
7351
7352   /* If there are no other options, try atomic_test_and_set if the value
7353      being stored is 1.  */
7354   if (val == const1_rtx)
7355     ret = maybe_emit_atomic_test_and_set (target, mem, MEMMODEL_SYNC_ACQUIRE);
7356
7357   return ret;
7358 }
7359
7360 /* This function expands the atomic test_and_set operation:
7361    atomically store a boolean TRUE into MEM and return the previous value.
7362
7363    MEMMODEL is the memory model variant to use.
7364    TARGET is an optional place to stick the return value.  */
7365
7366 rtx
7367 expand_atomic_test_and_set (rtx target, rtx mem, enum memmodel model)
7368 {
7369   machine_mode mode = GET_MODE (mem);
7370   rtx ret, trueval, subtarget;
7371
7372   ret = maybe_emit_atomic_test_and_set (target, mem, model);
7373   if (ret)
7374     return ret;
7375
7376   /* Be binary compatible with non-default settings of trueval, and different
7377      cpu revisions.  E.g. one revision may have atomic-test-and-set, but
7378      another only has atomic-exchange.  */
7379   if (targetm.atomic_test_and_set_trueval == 1)
7380     {
7381       trueval = const1_rtx;
7382       subtarget = target ? target : gen_reg_rtx (mode);
7383     }
7384   else
7385     {
7386       trueval = gen_int_mode (targetm.atomic_test_and_set_trueval, mode);
7387       subtarget = gen_reg_rtx (mode);
7388     }
7389
7390   /* Try the atomic-exchange optab...  */
7391   ret = maybe_emit_atomic_exchange (subtarget, mem, trueval, model);
7392
7393   /* ... then an atomic-compare-and-swap loop ... */
7394   if (!ret)
7395     ret = maybe_emit_compare_and_swap_exchange_loop (subtarget, mem, trueval);
7396
7397   /* ... before trying the vaguely defined legacy lock_test_and_set. */
7398   if (!ret)
7399     ret = maybe_emit_sync_lock_test_and_set (subtarget, mem, trueval, model);
7400
7401   /* Recall that the legacy lock_test_and_set optab was allowed to do magic
7402      things with the value 1.  Thus we try again without trueval.  */
7403   if (!ret && targetm.atomic_test_and_set_trueval != 1)
7404     ret = maybe_emit_sync_lock_test_and_set (subtarget, mem, const1_rtx, model);
7405
7406   /* Failing all else, assume a single threaded environment and simply
7407      perform the operation.  */
7408   if (!ret)
7409     {
7410       /* If the result is ignored skip the move to target.  */
7411       if (subtarget != const0_rtx)
7412         emit_move_insn (subtarget, mem);
7413
7414       emit_move_insn (mem, trueval);
7415       ret = subtarget;
7416     }
7417
7418   /* Recall that have to return a boolean value; rectify if trueval
7419      is not exactly one.  */
7420   if (targetm.atomic_test_and_set_trueval != 1)
7421     ret = emit_store_flag_force (target, NE, ret, const0_rtx, mode, 0, 1);
7422
7423   return ret;
7424 }
7425
7426 /* This function expands the atomic exchange operation:
7427    atomically store VAL in MEM and return the previous value in MEM.
7428
7429    MEMMODEL is the memory model variant to use.
7430    TARGET is an optional place to stick the return value.  */
7431
7432 rtx
7433 expand_atomic_exchange (rtx target, rtx mem, rtx val, enum memmodel model)
7434 {
7435   rtx ret;
7436
7437   ret = maybe_emit_atomic_exchange (target, mem, val, model);
7438
7439   /* Next try a compare-and-swap loop for the exchange.  */
7440   if (!ret)
7441     ret = maybe_emit_compare_and_swap_exchange_loop (target, mem, val);
7442
7443   return ret;
7444 }
7445
7446 /* This function expands the atomic compare exchange operation:
7447
7448    *PTARGET_BOOL is an optional place to store the boolean success/failure.
7449    *PTARGET_OVAL is an optional place to store the old value from memory.
7450    Both target parameters may be NULL to indicate that we do not care about
7451    that return value.  Both target parameters are updated on success to
7452    the actual location of the corresponding result.
7453
7454    MEMMODEL is the memory model variant to use.
7455
7456    The return value of the function is true for success.  */
7457
7458 bool
7459 expand_atomic_compare_and_swap (rtx *ptarget_bool, rtx *ptarget_oval,
7460                                 rtx mem, rtx expected, rtx desired,
7461                                 bool is_weak, enum memmodel succ_model,
7462                                 enum memmodel fail_model)
7463 {
7464   machine_mode mode = GET_MODE (mem);
7465   struct expand_operand ops[8];
7466   enum insn_code icode;
7467   rtx target_oval, target_bool = NULL_RTX;
7468   rtx libfunc;
7469
7470   /* Load expected into a register for the compare and swap.  */
7471   if (MEM_P (expected))
7472     expected = copy_to_reg (expected);
7473
7474   /* Make sure we always have some place to put the return oldval.
7475      Further, make sure that place is distinct from the input expected,
7476      just in case we need that path down below.  */
7477   if (ptarget_oval == NULL
7478       || (target_oval = *ptarget_oval) == NULL
7479       || reg_overlap_mentioned_p (expected, target_oval))
7480     target_oval = gen_reg_rtx (mode);
7481
7482   icode = direct_optab_handler (atomic_compare_and_swap_optab, mode);
7483   if (icode != CODE_FOR_nothing)
7484     {
7485       machine_mode bool_mode = insn_data[icode].operand[0].mode;
7486
7487       /* Make sure we always have a place for the bool operand.  */
7488       if (ptarget_bool == NULL
7489           || (target_bool = *ptarget_bool) == NULL
7490           || GET_MODE (target_bool) != bool_mode)
7491         target_bool = gen_reg_rtx (bool_mode);
7492
7493       /* Emit the compare_and_swap.  */
7494       create_output_operand (&ops[0], target_bool, bool_mode);
7495       create_output_operand (&ops[1], target_oval, mode);
7496       create_fixed_operand (&ops[2], mem);
7497       create_input_operand (&ops[3], expected, mode);
7498       create_input_operand (&ops[4], desired, mode);
7499       create_integer_operand (&ops[5], is_weak);
7500       create_integer_operand (&ops[6], succ_model);
7501       create_integer_operand (&ops[7], fail_model);
7502       if (maybe_expand_insn (icode, 8, ops))
7503         {
7504           /* Return success/failure.  */
7505           target_bool = ops[0].value;
7506           target_oval = ops[1].value;
7507           goto success;
7508         }
7509     }
7510
7511   /* Otherwise fall back to the original __sync_val_compare_and_swap
7512      which is always seq-cst.  */
7513   icode = optab_handler (sync_compare_and_swap_optab, mode);
7514   if (icode != CODE_FOR_nothing)
7515     {
7516       rtx cc_reg;
7517
7518       create_output_operand (&ops[0], target_oval, mode);
7519       create_fixed_operand (&ops[1], mem);
7520       create_input_operand (&ops[2], expected, mode);
7521       create_input_operand (&ops[3], desired, mode);
7522       if (!maybe_expand_insn (icode, 4, ops))
7523         return false;
7524
7525       target_oval = ops[0].value;
7526
7527       /* If the caller isn't interested in the boolean return value,
7528          skip the computation of it.  */
7529       if (ptarget_bool == NULL)
7530         goto success;
7531
7532       /* Otherwise, work out if the compare-and-swap succeeded.  */
7533       cc_reg = NULL_RTX;
7534       if (have_insn_for (COMPARE, CCmode))
7535         note_stores (PATTERN (get_last_insn ()), find_cc_set, &cc_reg);
7536       if (cc_reg)
7537         {
7538           target_bool = emit_store_flag_force (target_bool, EQ, cc_reg,
7539                                                const0_rtx, VOIDmode, 0, 1);
7540           goto success;
7541         }
7542       goto success_bool_from_val;
7543     }
7544
7545   /* Also check for library support for __sync_val_compare_and_swap.  */
7546   libfunc = optab_libfunc (sync_compare_and_swap_optab, mode);
7547   if (libfunc != NULL)
7548     {
7549       rtx addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
7550       target_oval = emit_library_call_value (libfunc, NULL_RTX, LCT_NORMAL,
7551                                              mode, 3, addr, ptr_mode,
7552                                              expected, mode, desired, mode);
7553
7554       /* Compute the boolean return value only if requested.  */
7555       if (ptarget_bool)
7556         goto success_bool_from_val;
7557       else
7558         goto success;
7559     }
7560
7561   /* Failure.  */
7562   return false;
7563
7564  success_bool_from_val:
7565    target_bool = emit_store_flag_force (target_bool, EQ, target_oval,
7566                                         expected, VOIDmode, 1, 1);
7567  success:
7568   /* Make sure that the oval output winds up where the caller asked.  */
7569   if (ptarget_oval)
7570     *ptarget_oval = target_oval;
7571   if (ptarget_bool)
7572     *ptarget_bool = target_bool;
7573   return true;
7574 }
7575
7576 /* Generate asm volatile("" : : : "memory") as the memory barrier.  */
7577
7578 static void
7579 expand_asm_memory_barrier (void)
7580 {
7581   rtx asm_op, clob;
7582
7583   asm_op = gen_rtx_ASM_OPERANDS (VOIDmode, empty_string, empty_string, 0,
7584                                  rtvec_alloc (0), rtvec_alloc (0),
7585                                  rtvec_alloc (0), UNKNOWN_LOCATION);
7586   MEM_VOLATILE_P (asm_op) = 1;
7587
7588   clob = gen_rtx_SCRATCH (VOIDmode);
7589   clob = gen_rtx_MEM (BLKmode, clob);
7590   clob = gen_rtx_CLOBBER (VOIDmode, clob);
7591
7592   emit_insn (gen_rtx_PARALLEL (VOIDmode, gen_rtvec (2, asm_op, clob)));
7593 }
7594
7595 /* This routine will either emit the mem_thread_fence pattern or issue a
7596    sync_synchronize to generate a fence for memory model MEMMODEL.  */
7597
7598 #ifndef HAVE_mem_thread_fence
7599 # define HAVE_mem_thread_fence 0
7600 # define gen_mem_thread_fence(x) (gcc_unreachable (), NULL_RTX)
7601 #endif
7602 #ifndef HAVE_memory_barrier
7603 # define HAVE_memory_barrier 0
7604 # define gen_memory_barrier()  (gcc_unreachable (), NULL_RTX)
7605 #endif
7606
7607 void
7608 expand_mem_thread_fence (enum memmodel model)
7609 {
7610   if (HAVE_mem_thread_fence)
7611     emit_insn (gen_mem_thread_fence (GEN_INT (model)));
7612   else if (!is_mm_relaxed (model))
7613     {
7614       if (HAVE_memory_barrier)
7615         emit_insn (gen_memory_barrier ());
7616       else if (synchronize_libfunc != NULL_RTX)
7617         emit_library_call (synchronize_libfunc, LCT_NORMAL, VOIDmode, 0);
7618       else
7619         expand_asm_memory_barrier ();
7620     }
7621 }
7622
7623 /* This routine will either emit the mem_signal_fence pattern or issue a
7624    sync_synchronize to generate a fence for memory model MEMMODEL.  */
7625
7626 #ifndef HAVE_mem_signal_fence
7627 # define HAVE_mem_signal_fence 0
7628 # define gen_mem_signal_fence(x) (gcc_unreachable (), NULL_RTX)
7629 #endif
7630
7631 void
7632 expand_mem_signal_fence (enum memmodel model)
7633 {
7634   if (HAVE_mem_signal_fence)
7635     emit_insn (gen_mem_signal_fence (GEN_INT (model)));
7636   else if (!is_mm_relaxed (model))
7637     {
7638       /* By default targets are coherent between a thread and the signal
7639          handler running on the same thread.  Thus this really becomes a
7640          compiler barrier, in that stores must not be sunk past
7641          (or raised above) a given point.  */
7642       expand_asm_memory_barrier ();
7643     }
7644 }
7645
7646 /* This function expands the atomic load operation:
7647    return the atomically loaded value in MEM.
7648
7649    MEMMODEL is the memory model variant to use.
7650    TARGET is an option place to stick the return value.  */
7651
7652 rtx
7653 expand_atomic_load (rtx target, rtx mem, enum memmodel model)
7654 {
7655   machine_mode mode = GET_MODE (mem);
7656   enum insn_code icode;
7657
7658   /* If the target supports the load directly, great.  */
7659   icode = direct_optab_handler (atomic_load_optab, mode);
7660   if (icode != CODE_FOR_nothing)
7661     {
7662       struct expand_operand ops[3];
7663
7664       create_output_operand (&ops[0], target, mode);
7665       create_fixed_operand (&ops[1], mem);
7666       create_integer_operand (&ops[2], model);
7667       if (maybe_expand_insn (icode, 3, ops))
7668         return ops[0].value;
7669     }
7670
7671   /* If the size of the object is greater than word size on this target,
7672      then we assume that a load will not be atomic.  */
7673   if (GET_MODE_PRECISION (mode) > BITS_PER_WORD)
7674     {
7675       /* Issue val = compare_and_swap (mem, 0, 0).
7676          This may cause the occasional harmless store of 0 when the value is
7677          already 0, but it seems to be OK according to the standards guys.  */
7678       if (expand_atomic_compare_and_swap (NULL, &target, mem, const0_rtx,
7679                                           const0_rtx, false, model, model))
7680         return target;
7681       else
7682       /* Otherwise there is no atomic load, leave the library call.  */
7683         return NULL_RTX;
7684     }
7685
7686   /* Otherwise assume loads are atomic, and emit the proper barriers.  */
7687   if (!target || target == const0_rtx)
7688     target = gen_reg_rtx (mode);
7689
7690   /* For SEQ_CST, emit a barrier before the load.  */
7691   if (is_mm_seq_cst (model))
7692     expand_mem_thread_fence (model);
7693
7694   emit_move_insn (target, mem);
7695
7696   /* Emit the appropriate barrier after the load.  */
7697   expand_mem_thread_fence (model);
7698
7699   return target;
7700 }
7701
7702 /* This function expands the atomic store operation:
7703    Atomically store VAL in MEM.
7704    MEMMODEL is the memory model variant to use.
7705    USE_RELEASE is true if __sync_lock_release can be used as a fall back.
7706    function returns const0_rtx if a pattern was emitted.  */
7707
7708 rtx
7709 expand_atomic_store (rtx mem, rtx val, enum memmodel model, bool use_release)
7710 {
7711   machine_mode mode = GET_MODE (mem);
7712   enum insn_code icode;
7713   struct expand_operand ops[3];
7714
7715   /* If the target supports the store directly, great.  */
7716   icode = direct_optab_handler (atomic_store_optab, mode);
7717   if (icode != CODE_FOR_nothing)
7718     {
7719       create_fixed_operand (&ops[0], mem);
7720       create_input_operand (&ops[1], val, mode);
7721       create_integer_operand (&ops[2], model);
7722       if (maybe_expand_insn (icode, 3, ops))
7723         return const0_rtx;
7724     }
7725
7726   /* If using __sync_lock_release is a viable alternative, try it.  */
7727   if (use_release)
7728     {
7729       icode = direct_optab_handler (sync_lock_release_optab, mode);
7730       if (icode != CODE_FOR_nothing)
7731         {
7732           create_fixed_operand (&ops[0], mem);
7733           create_input_operand (&ops[1], const0_rtx, mode);
7734           if (maybe_expand_insn (icode, 2, ops))
7735             {
7736               /* lock_release is only a release barrier.  */
7737               if (is_mm_seq_cst (model))
7738                 expand_mem_thread_fence (model);
7739               return const0_rtx;
7740             }
7741         }
7742     }
7743
7744   /* If the size of the object is greater than word size on this target,
7745      a default store will not be atomic, Try a mem_exchange and throw away
7746      the result.  If that doesn't work, don't do anything.  */
7747   if (GET_MODE_PRECISION (mode) > BITS_PER_WORD)
7748     {
7749       rtx target = maybe_emit_atomic_exchange (NULL_RTX, mem, val, model);
7750       if (!target)
7751         target = maybe_emit_compare_and_swap_exchange_loop (NULL_RTX, mem, val);
7752       if (target)
7753         return const0_rtx;
7754       else
7755         return NULL_RTX;
7756     }
7757
7758   /* Otherwise assume stores are atomic, and emit the proper barriers.  */
7759   expand_mem_thread_fence (model);
7760
7761   emit_move_insn (mem, val);
7762
7763   /* For SEQ_CST, also emit a barrier after the store.  */
7764   if (is_mm_seq_cst (model))
7765     expand_mem_thread_fence (model);
7766
7767   return const0_rtx;
7768 }
7769
7770
7771 /* Structure containing the pointers and values required to process the
7772    various forms of the atomic_fetch_op and atomic_op_fetch builtins.  */
7773
7774 struct atomic_op_functions
7775 {
7776   direct_optab mem_fetch_before;
7777   direct_optab mem_fetch_after;
7778   direct_optab mem_no_result;
7779   optab fetch_before;
7780   optab fetch_after;
7781   direct_optab no_result;
7782   enum rtx_code reverse_code;
7783 };
7784
7785
7786 /* Fill in structure pointed to by OP with the various optab entries for an
7787    operation of type CODE.  */
7788
7789 static void
7790 get_atomic_op_for_code (struct atomic_op_functions *op, enum rtx_code code)
7791 {
7792   gcc_assert (op!= NULL);
7793
7794   /* If SWITCHABLE_TARGET is defined, then subtargets can be switched
7795      in the source code during compilation, and the optab entries are not
7796      computable until runtime.  Fill in the values at runtime.  */
7797   switch (code)
7798     {
7799     case PLUS:
7800       op->mem_fetch_before = atomic_fetch_add_optab;
7801       op->mem_fetch_after = atomic_add_fetch_optab;
7802       op->mem_no_result = atomic_add_optab;
7803       op->fetch_before = sync_old_add_optab;
7804       op->fetch_after = sync_new_add_optab;
7805       op->no_result = sync_add_optab;
7806       op->reverse_code = MINUS;
7807       break;
7808     case MINUS:
7809       op->mem_fetch_before = atomic_fetch_sub_optab;
7810       op->mem_fetch_after = atomic_sub_fetch_optab;
7811       op->mem_no_result = atomic_sub_optab;
7812       op->fetch_before = sync_old_sub_optab;
7813       op->fetch_after = sync_new_sub_optab;
7814       op->no_result = sync_sub_optab;
7815       op->reverse_code = PLUS;
7816       break;
7817     case XOR:
7818       op->mem_fetch_before = atomic_fetch_xor_optab;
7819       op->mem_fetch_after = atomic_xor_fetch_optab;
7820       op->mem_no_result = atomic_xor_optab;
7821       op->fetch_before = sync_old_xor_optab;
7822       op->fetch_after = sync_new_xor_optab;
7823       op->no_result = sync_xor_optab;
7824       op->reverse_code = XOR;
7825       break;
7826     case AND:
7827       op->mem_fetch_before = atomic_fetch_and_optab;
7828       op->mem_fetch_after = atomic_and_fetch_optab;
7829       op->mem_no_result = atomic_and_optab;
7830       op->fetch_before = sync_old_and_optab;
7831       op->fetch_after = sync_new_and_optab;
7832       op->no_result = sync_and_optab;
7833       op->reverse_code = UNKNOWN;
7834       break;
7835     case IOR:
7836       op->mem_fetch_before = atomic_fetch_or_optab;
7837       op->mem_fetch_after = atomic_or_fetch_optab;
7838       op->mem_no_result = atomic_or_optab;
7839       op->fetch_before = sync_old_ior_optab;
7840       op->fetch_after = sync_new_ior_optab;
7841       op->no_result = sync_ior_optab;
7842       op->reverse_code = UNKNOWN;
7843       break;
7844     case NOT:
7845       op->mem_fetch_before = atomic_fetch_nand_optab;
7846       op->mem_fetch_after = atomic_nand_fetch_optab;
7847       op->mem_no_result = atomic_nand_optab;
7848       op->fetch_before = sync_old_nand_optab;
7849       op->fetch_after = sync_new_nand_optab;
7850       op->no_result = sync_nand_optab;
7851       op->reverse_code = UNKNOWN;
7852       break;
7853     default:
7854       gcc_unreachable ();
7855     }
7856 }
7857
7858 /* See if there is a more optimal way to implement the operation "*MEM CODE VAL"
7859    using memory order MODEL.  If AFTER is true the operation needs to return
7860    the value of *MEM after the operation, otherwise the previous value.
7861    TARGET is an optional place to place the result.  The result is unused if
7862    it is const0_rtx.
7863    Return the result if there is a better sequence, otherwise NULL_RTX.  */
7864
7865 static rtx
7866 maybe_optimize_fetch_op (rtx target, rtx mem, rtx val, enum rtx_code code,
7867                          enum memmodel model, bool after)
7868 {
7869   /* If the value is prefetched, or not used, it may be possible to replace
7870      the sequence with a native exchange operation.  */
7871   if (!after || target == const0_rtx)
7872     {
7873       /* fetch_and (&x, 0, m) can be replaced with exchange (&x, 0, m).  */
7874       if (code == AND && val == const0_rtx)
7875         {
7876           if (target == const0_rtx)
7877             target = gen_reg_rtx (GET_MODE (mem));
7878           return maybe_emit_atomic_exchange (target, mem, val, model);
7879         }
7880
7881       /* fetch_or (&x, -1, m) can be replaced with exchange (&x, -1, m).  */
7882       if (code == IOR && val == constm1_rtx)
7883         {
7884           if (target == const0_rtx)
7885             target = gen_reg_rtx (GET_MODE (mem));
7886           return maybe_emit_atomic_exchange (target, mem, val, model);
7887         }
7888     }
7889
7890   return NULL_RTX;
7891 }
7892
7893 /* Try to emit an instruction for a specific operation varaition.
7894    OPTAB contains the OP functions.
7895    TARGET is an optional place to return the result. const0_rtx means unused.
7896    MEM is the memory location to operate on.
7897    VAL is the value to use in the operation.
7898    USE_MEMMODEL is TRUE if the variation with a memory model should be tried.
7899    MODEL is the memory model, if used.
7900    AFTER is true if the returned result is the value after the operation.  */
7901
7902 static rtx
7903 maybe_emit_op (const struct atomic_op_functions *optab, rtx target, rtx mem,
7904                rtx val, bool use_memmodel, enum memmodel model, bool after)
7905 {
7906   machine_mode mode = GET_MODE (mem);
7907   struct expand_operand ops[4];
7908   enum insn_code icode;
7909   int op_counter = 0;
7910   int num_ops;
7911
7912   /* Check to see if there is a result returned.  */
7913   if (target == const0_rtx)
7914     {
7915       if (use_memmodel)
7916         {
7917           icode = direct_optab_handler (optab->mem_no_result, mode);
7918           create_integer_operand (&ops[2], model);
7919           num_ops = 3;
7920         }
7921       else
7922         {
7923           icode = direct_optab_handler (optab->no_result, mode);
7924           num_ops = 2;
7925         }
7926     }
7927   /* Otherwise, we need to generate a result.  */
7928   else
7929     {
7930       if (use_memmodel)
7931         {
7932           icode = direct_optab_handler (after ? optab->mem_fetch_after
7933                                         : optab->mem_fetch_before, mode);
7934           create_integer_operand (&ops[3], model);
7935           num_ops = 4;
7936         }
7937       else
7938         {
7939           icode = optab_handler (after ? optab->fetch_after
7940                                  : optab->fetch_before, mode);
7941           num_ops = 3;
7942         }
7943       create_output_operand (&ops[op_counter++], target, mode);
7944     }
7945   if (icode == CODE_FOR_nothing)
7946     return NULL_RTX;
7947
7948   create_fixed_operand (&ops[op_counter++], mem);
7949   /* VAL may have been promoted to a wider mode.  Shrink it if so.  */
7950   create_convert_operand_to (&ops[op_counter++], val, mode, true);
7951
7952   if (maybe_expand_insn (icode, num_ops, ops))
7953     return (target == const0_rtx ? const0_rtx : ops[0].value);
7954
7955   return NULL_RTX;
7956 }
7957
7958
7959 /* This function expands an atomic fetch_OP or OP_fetch operation:
7960    TARGET is an option place to stick the return value.  const0_rtx indicates
7961    the result is unused.
7962    atomically fetch MEM, perform the operation with VAL and return it to MEM.
7963    CODE is the operation being performed (OP)
7964    MEMMODEL is the memory model variant to use.
7965    AFTER is true to return the result of the operation (OP_fetch).
7966    AFTER is false to return the value before the operation (fetch_OP).
7967
7968    This function will *only* generate instructions if there is a direct
7969    optab. No compare and swap loops or libcalls will be generated. */
7970
7971 static rtx
7972 expand_atomic_fetch_op_no_fallback (rtx target, rtx mem, rtx val,
7973                                     enum rtx_code code, enum memmodel model,
7974                                     bool after)
7975 {
7976   machine_mode mode = GET_MODE (mem);
7977   struct atomic_op_functions optab;
7978   rtx result;
7979   bool unused_result = (target == const0_rtx);
7980
7981   get_atomic_op_for_code (&optab, code);
7982
7983   /* Check to see if there are any better instructions.  */
7984   result = maybe_optimize_fetch_op (target, mem, val, code, model, after);
7985   if (result)
7986     return result;
7987
7988   /* Check for the case where the result isn't used and try those patterns.  */
7989   if (unused_result)
7990     {
7991       /* Try the memory model variant first.  */
7992       result = maybe_emit_op (&optab, target, mem, val, true, model, true);
7993       if (result)
7994         return result;
7995
7996       /* Next try the old style withuot a memory model.  */
7997       result = maybe_emit_op (&optab, target, mem, val, false, model, true);
7998       if (result)
7999         return result;
8000
8001       /* There is no no-result pattern, so try patterns with a result.  */
8002       target = NULL_RTX;
8003     }
8004
8005   /* Try the __atomic version.  */
8006   result = maybe_emit_op (&optab, target, mem, val, true, model, after);
8007   if (result)
8008     return result;
8009
8010   /* Try the older __sync version.  */
8011   result = maybe_emit_op (&optab, target, mem, val, false, model, after);
8012   if (result)
8013     return result;
8014
8015   /* If the fetch value can be calculated from the other variation of fetch,
8016      try that operation.  */
8017   if (after || unused_result || optab.reverse_code != UNKNOWN)
8018     {
8019       /* Try the __atomic version, then the older __sync version.  */
8020       result = maybe_emit_op (&optab, target, mem, val, true, model, !after);
8021       if (!result)
8022         result = maybe_emit_op (&optab, target, mem, val, false, model, !after);
8023
8024       if (result)
8025         {
8026           /* If the result isn't used, no need to do compensation code.  */
8027           if (unused_result)
8028             return result;
8029
8030           /* Issue compensation code.  Fetch_after  == fetch_before OP val.
8031              Fetch_before == after REVERSE_OP val.  */
8032           if (!after)
8033             code = optab.reverse_code;
8034           if (code == NOT)
8035             {
8036               result = expand_simple_binop (mode, AND, result, val, NULL_RTX,
8037                                             true, OPTAB_LIB_WIDEN);
8038               result = expand_simple_unop (mode, NOT, result, target, true);
8039             }
8040           else
8041             result = expand_simple_binop (mode, code, result, val, target,
8042                                           true, OPTAB_LIB_WIDEN);
8043           return result;
8044         }
8045     }
8046
8047   /* No direct opcode can be generated.  */
8048   return NULL_RTX;
8049 }
8050
8051
8052
8053 /* This function expands an atomic fetch_OP or OP_fetch operation:
8054    TARGET is an option place to stick the return value.  const0_rtx indicates
8055    the result is unused.
8056    atomically fetch MEM, perform the operation with VAL and return it to MEM.
8057    CODE is the operation being performed (OP)
8058    MEMMODEL is the memory model variant to use.
8059    AFTER is true to return the result of the operation (OP_fetch).
8060    AFTER is false to return the value before the operation (fetch_OP).  */
8061 rtx
8062 expand_atomic_fetch_op (rtx target, rtx mem, rtx val, enum rtx_code code,
8063                         enum memmodel model, bool after)
8064 {
8065   machine_mode mode = GET_MODE (mem);
8066   rtx result;
8067   bool unused_result = (target == const0_rtx);
8068
8069   result = expand_atomic_fetch_op_no_fallback (target, mem, val, code, model,
8070                                                after);
8071
8072   if (result)
8073     return result;
8074
8075   /* Add/sub can be implemented by doing the reverse operation with -(val).  */
8076   if (code == PLUS || code == MINUS)
8077     {
8078       rtx tmp;
8079       enum rtx_code reverse = (code == PLUS ? MINUS : PLUS);
8080
8081       start_sequence ();
8082       tmp = expand_simple_unop (mode, NEG, val, NULL_RTX, true);
8083       result = expand_atomic_fetch_op_no_fallback (target, mem, tmp, reverse,
8084                                                    model, after);
8085       if (result)
8086         {
8087           /* PLUS worked so emit the insns and return.  */
8088           tmp = get_insns ();
8089           end_sequence ();
8090           emit_insn (tmp);
8091           return result;
8092         }
8093
8094       /* PLUS did not work, so throw away the negation code and continue.  */
8095       end_sequence ();
8096     }
8097
8098   /* Try the __sync libcalls only if we can't do compare-and-swap inline.  */
8099   if (!can_compare_and_swap_p (mode, false))
8100     {
8101       rtx libfunc;
8102       bool fixup = false;
8103       enum rtx_code orig_code = code;
8104       struct atomic_op_functions optab;
8105
8106       get_atomic_op_for_code (&optab, code);
8107       libfunc = optab_libfunc (after ? optab.fetch_after
8108                                : optab.fetch_before, mode);
8109       if (libfunc == NULL
8110           && (after || unused_result || optab.reverse_code != UNKNOWN))
8111         {
8112           fixup = true;
8113           if (!after)
8114             code = optab.reverse_code;
8115           libfunc = optab_libfunc (after ? optab.fetch_before
8116                                    : optab.fetch_after, mode);
8117         }
8118       if (libfunc != NULL)
8119         {
8120           rtx addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
8121           result = emit_library_call_value (libfunc, NULL, LCT_NORMAL, mode,
8122                                             2, addr, ptr_mode, val, mode);
8123
8124           if (!unused_result && fixup)
8125             result = expand_simple_binop (mode, code, result, val, target,
8126                                           true, OPTAB_LIB_WIDEN);
8127           return result;
8128         }
8129
8130       /* We need the original code for any further attempts.  */
8131       code = orig_code;
8132     }
8133
8134   /* If nothing else has succeeded, default to a compare and swap loop.  */
8135   if (can_compare_and_swap_p (mode, true))
8136     {
8137       rtx_insn *insn;
8138       rtx t0 = gen_reg_rtx (mode), t1;
8139
8140       start_sequence ();
8141
8142       /* If the result is used, get a register for it.  */
8143       if (!unused_result)
8144         {
8145           if (!target || !register_operand (target, mode))
8146             target = gen_reg_rtx (mode);
8147           /* If fetch_before, copy the value now.  */
8148           if (!after)
8149             emit_move_insn (target, t0);
8150         }
8151       else
8152         target = const0_rtx;
8153
8154       t1 = t0;
8155       if (code == NOT)
8156         {
8157           t1 = expand_simple_binop (mode, AND, t1, val, NULL_RTX,
8158                                     true, OPTAB_LIB_WIDEN);
8159           t1 = expand_simple_unop (mode, code, t1, NULL_RTX, true);
8160         }
8161       else
8162         t1 = expand_simple_binop (mode, code, t1, val, NULL_RTX, true,
8163                                   OPTAB_LIB_WIDEN);
8164
8165       /* For after, copy the value now.  */
8166       if (!unused_result && after)
8167         emit_move_insn (target, t1);
8168       insn = get_insns ();
8169       end_sequence ();
8170
8171       if (t1 != NULL && expand_compare_and_swap_loop (mem, t0, t1, insn))
8172         return target;
8173     }
8174
8175   return NULL_RTX;
8176 }
8177 \f
8178 /* Return true if OPERAND is suitable for operand number OPNO of
8179    instruction ICODE.  */
8180
8181 bool
8182 insn_operand_matches (enum insn_code icode, unsigned int opno, rtx operand)
8183 {
8184   return (!insn_data[(int) icode].operand[opno].predicate
8185           || (insn_data[(int) icode].operand[opno].predicate
8186               (operand, insn_data[(int) icode].operand[opno].mode)));
8187 }
8188 \f
8189 /* TARGET is a target of a multiword operation that we are going to
8190    implement as a series of word-mode operations.  Return true if
8191    TARGET is suitable for this purpose.  */
8192
8193 bool
8194 valid_multiword_target_p (rtx target)
8195 {
8196   machine_mode mode;
8197   int i;
8198
8199   mode = GET_MODE (target);
8200   for (i = 0; i < GET_MODE_SIZE (mode); i += UNITS_PER_WORD)
8201     if (!validate_subreg (word_mode, mode, target, i))
8202       return false;
8203   return true;
8204 }
8205
8206 /* Like maybe_legitimize_operand, but do not change the code of the
8207    current rtx value.  */
8208
8209 static bool
8210 maybe_legitimize_operand_same_code (enum insn_code icode, unsigned int opno,
8211                                     struct expand_operand *op)
8212 {
8213   /* See if the operand matches in its current form.  */
8214   if (insn_operand_matches (icode, opno, op->value))
8215     return true;
8216
8217   /* If the operand is a memory whose address has no side effects,
8218      try forcing the address into a non-virtual pseudo register.
8219      The check for side effects is important because copy_to_mode_reg
8220      cannot handle things like auto-modified addresses.  */
8221   if (insn_data[(int) icode].operand[opno].allows_mem && MEM_P (op->value))
8222     {
8223       rtx addr, mem;
8224
8225       mem = op->value;
8226       addr = XEXP (mem, 0);
8227       if (!(REG_P (addr) && REGNO (addr) > LAST_VIRTUAL_REGISTER)
8228           && !side_effects_p (addr))
8229         {
8230           rtx_insn *last;
8231           machine_mode mode;
8232
8233           last = get_last_insn ();
8234           mode = get_address_mode (mem);
8235           mem = replace_equiv_address (mem, copy_to_mode_reg (mode, addr));
8236           if (insn_operand_matches (icode, opno, mem))
8237             {
8238               op->value = mem;
8239               return true;
8240             }
8241           delete_insns_since (last);
8242         }
8243     }
8244
8245   return false;
8246 }
8247
8248 /* Try to make OP match operand OPNO of instruction ICODE.  Return true
8249    on success, storing the new operand value back in OP.  */
8250
8251 static bool
8252 maybe_legitimize_operand (enum insn_code icode, unsigned int opno,
8253                           struct expand_operand *op)
8254 {
8255   machine_mode mode, imode;
8256   bool old_volatile_ok, result;
8257
8258   mode = op->mode;
8259   switch (op->type)
8260     {
8261     case EXPAND_FIXED:
8262       old_volatile_ok = volatile_ok;
8263       volatile_ok = true;
8264       result = maybe_legitimize_operand_same_code (icode, opno, op);
8265       volatile_ok = old_volatile_ok;
8266       return result;
8267
8268     case EXPAND_OUTPUT:
8269       gcc_assert (mode != VOIDmode);
8270       if (op->value
8271           && op->value != const0_rtx
8272           && GET_MODE (op->value) == mode
8273           && maybe_legitimize_operand_same_code (icode, opno, op))
8274         return true;
8275
8276       op->value = gen_reg_rtx (mode);
8277       break;
8278
8279     case EXPAND_INPUT:
8280     input:
8281       gcc_assert (mode != VOIDmode);
8282       gcc_assert (GET_MODE (op->value) == VOIDmode
8283                   || GET_MODE (op->value) == mode);
8284       if (maybe_legitimize_operand_same_code (icode, opno, op))
8285         return true;
8286
8287       op->value = copy_to_mode_reg (mode, op->value);
8288       break;
8289
8290     case EXPAND_CONVERT_TO:
8291       gcc_assert (mode != VOIDmode);
8292       op->value = convert_to_mode (mode, op->value, op->unsigned_p);
8293       goto input;
8294
8295     case EXPAND_CONVERT_FROM:
8296       if (GET_MODE (op->value) != VOIDmode)
8297         mode = GET_MODE (op->value);
8298       else
8299         /* The caller must tell us what mode this value has.  */
8300         gcc_assert (mode != VOIDmode);
8301
8302       imode = insn_data[(int) icode].operand[opno].mode;
8303       if (imode != VOIDmode && imode != mode)
8304         {
8305           op->value = convert_modes (imode, mode, op->value, op->unsigned_p);
8306           mode = imode;
8307         }
8308       goto input;
8309
8310     case EXPAND_ADDRESS:
8311       gcc_assert (mode != VOIDmode);
8312       op->value = convert_memory_address (mode, op->value);
8313       goto input;
8314
8315     case EXPAND_INTEGER:
8316       mode = insn_data[(int) icode].operand[opno].mode;
8317       if (mode != VOIDmode && const_int_operand (op->value, mode))
8318         goto input;
8319       break;
8320     }
8321   return insn_operand_matches (icode, opno, op->value);
8322 }
8323
8324 /* Make OP describe an input operand that should have the same value
8325    as VALUE, after any mode conversion that the target might request.
8326    TYPE is the type of VALUE.  */
8327
8328 void
8329 create_convert_operand_from_type (struct expand_operand *op,
8330                                   rtx value, tree type)
8331 {
8332   create_convert_operand_from (op, value, TYPE_MODE (type),
8333                                TYPE_UNSIGNED (type));
8334 }
8335
8336 /* Try to make operands [OPS, OPS + NOPS) match operands [OPNO, OPNO + NOPS)
8337    of instruction ICODE.  Return true on success, leaving the new operand
8338    values in the OPS themselves.  Emit no code on failure.  */
8339
8340 bool
8341 maybe_legitimize_operands (enum insn_code icode, unsigned int opno,
8342                            unsigned int nops, struct expand_operand *ops)
8343 {
8344   rtx_insn *last;
8345   unsigned int i;
8346
8347   last = get_last_insn ();
8348   for (i = 0; i < nops; i++)
8349     if (!maybe_legitimize_operand (icode, opno + i, &ops[i]))
8350       {
8351         delete_insns_since (last);
8352         return false;
8353       }
8354   return true;
8355 }
8356
8357 /* Try to generate instruction ICODE, using operands [OPS, OPS + NOPS)
8358    as its operands.  Return the instruction pattern on success,
8359    and emit any necessary set-up code.  Return null and emit no
8360    code on failure.  */
8361
8362 rtx_insn *
8363 maybe_gen_insn (enum insn_code icode, unsigned int nops,
8364                 struct expand_operand *ops)
8365 {
8366   gcc_assert (nops == (unsigned int) insn_data[(int) icode].n_generator_args);
8367   if (!maybe_legitimize_operands (icode, 0, nops, ops))
8368     return NULL;
8369
8370   switch (nops)
8371     {
8372     case 1:
8373       return GEN_FCN (icode) (ops[0].value);
8374     case 2:
8375       return GEN_FCN (icode) (ops[0].value, ops[1].value);
8376     case 3:
8377       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value);
8378     case 4:
8379       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8380                               ops[3].value);
8381     case 5:
8382       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8383                               ops[3].value, ops[4].value);
8384     case 6:
8385       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8386                               ops[3].value, ops[4].value, ops[5].value);
8387     case 7:
8388       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8389                               ops[3].value, ops[4].value, ops[5].value,
8390                               ops[6].value);
8391     case 8:
8392       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8393                               ops[3].value, ops[4].value, ops[5].value,
8394                               ops[6].value, ops[7].value);
8395     case 9:
8396       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8397                               ops[3].value, ops[4].value, ops[5].value,
8398                               ops[6].value, ops[7].value, ops[8].value);
8399     }
8400   gcc_unreachable ();
8401 }
8402
8403 /* Try to emit instruction ICODE, using operands [OPS, OPS + NOPS)
8404    as its operands.  Return true on success and emit no code on failure.  */
8405
8406 bool
8407 maybe_expand_insn (enum insn_code icode, unsigned int nops,
8408                    struct expand_operand *ops)
8409 {
8410   rtx pat = maybe_gen_insn (icode, nops, ops);
8411   if (pat)
8412     {
8413       emit_insn (pat);
8414       return true;
8415     }
8416   return false;
8417 }
8418
8419 /* Like maybe_expand_insn, but for jumps.  */
8420
8421 bool
8422 maybe_expand_jump_insn (enum insn_code icode, unsigned int nops,
8423                         struct expand_operand *ops)
8424 {
8425   rtx pat = maybe_gen_insn (icode, nops, ops);
8426   if (pat)
8427     {
8428       emit_jump_insn (pat);
8429       return true;
8430     }
8431   return false;
8432 }
8433
8434 /* Emit instruction ICODE, using operands [OPS, OPS + NOPS)
8435    as its operands.  */
8436
8437 void
8438 expand_insn (enum insn_code icode, unsigned int nops,
8439              struct expand_operand *ops)
8440 {
8441   if (!maybe_expand_insn (icode, nops, ops))
8442     gcc_unreachable ();
8443 }
8444
8445 /* Like expand_insn, but for jumps.  */
8446
8447 void
8448 expand_jump_insn (enum insn_code icode, unsigned int nops,
8449                   struct expand_operand *ops)
8450 {
8451   if (!maybe_expand_jump_insn (icode, nops, ops))
8452     gcc_unreachable ();
8453 }
8454
8455 /* Reduce conditional compilation elsewhere.  */
8456 #ifndef HAVE_insv
8457 #define HAVE_insv       0
8458 #define CODE_FOR_insv   CODE_FOR_nothing
8459 #endif
8460 #ifndef HAVE_extv
8461 #define HAVE_extv       0
8462 #define CODE_FOR_extv   CODE_FOR_nothing
8463 #endif
8464 #ifndef HAVE_extzv
8465 #define HAVE_extzv      0
8466 #define CODE_FOR_extzv  CODE_FOR_nothing
8467 #endif
8468
8469 /* Enumerates the possible types of structure operand to an
8470    extraction_insn.  */
8471 enum extraction_type { ET_unaligned_mem, ET_reg };
8472
8473 /* Check whether insv, extv or extzv pattern ICODE can be used for an
8474    insertion or extraction of type TYPE on a structure of mode MODE.
8475    Return true if so and fill in *INSN accordingly.  STRUCT_OP is the
8476    operand number of the structure (the first sign_extract or zero_extract
8477    operand) and FIELD_OP is the operand number of the field (the other
8478    side of the set from the sign_extract or zero_extract).  */
8479
8480 static bool
8481 get_traditional_extraction_insn (extraction_insn *insn,
8482                                  enum extraction_type type,
8483                                  machine_mode mode,
8484                                  enum insn_code icode,
8485                                  int struct_op, int field_op)
8486 {
8487   const struct insn_data_d *data = &insn_data[icode];
8488
8489   machine_mode struct_mode = data->operand[struct_op].mode;
8490   if (struct_mode == VOIDmode)
8491     struct_mode = word_mode;
8492   if (mode != struct_mode)
8493     return false;
8494
8495   machine_mode field_mode = data->operand[field_op].mode;
8496   if (field_mode == VOIDmode)
8497     field_mode = word_mode;
8498
8499   machine_mode pos_mode = data->operand[struct_op + 2].mode;
8500   if (pos_mode == VOIDmode)
8501     pos_mode = word_mode;
8502
8503   insn->icode = icode;
8504   insn->field_mode = field_mode;
8505   insn->struct_mode = (type == ET_unaligned_mem ? byte_mode : struct_mode);
8506   insn->pos_mode = pos_mode;
8507   return true;
8508 }
8509
8510 /* Return true if an optab exists to perform an insertion or extraction
8511    of type TYPE in mode MODE.  Describe the instruction in *INSN if so.
8512
8513    REG_OPTAB is the optab to use for register structures and
8514    MISALIGN_OPTAB is the optab to use for misaligned memory structures.
8515    POS_OP is the operand number of the bit position.  */
8516
8517 static bool
8518 get_optab_extraction_insn (struct extraction_insn *insn,
8519                            enum extraction_type type,
8520                            machine_mode mode, direct_optab reg_optab,
8521                            direct_optab misalign_optab, int pos_op)
8522 {
8523   direct_optab optab = (type == ET_unaligned_mem ? misalign_optab : reg_optab);
8524   enum insn_code icode = direct_optab_handler (optab, mode);
8525   if (icode == CODE_FOR_nothing)
8526     return false;
8527
8528   const struct insn_data_d *data = &insn_data[icode];
8529
8530   insn->icode = icode;
8531   insn->field_mode = mode;
8532   insn->struct_mode = (type == ET_unaligned_mem ? BLKmode : mode);
8533   insn->pos_mode = data->operand[pos_op].mode;
8534   if (insn->pos_mode == VOIDmode)
8535     insn->pos_mode = word_mode;
8536   return true;
8537 }
8538
8539 /* Return true if an instruction exists to perform an insertion or
8540    extraction (PATTERN says which) of type TYPE in mode MODE.
8541    Describe the instruction in *INSN if so.  */
8542
8543 static bool
8544 get_extraction_insn (extraction_insn *insn,
8545                      enum extraction_pattern pattern,
8546                      enum extraction_type type,
8547                      machine_mode mode)
8548 {
8549   switch (pattern)
8550     {
8551     case EP_insv:
8552       if (HAVE_insv
8553           && get_traditional_extraction_insn (insn, type, mode,
8554                                               CODE_FOR_insv, 0, 3))
8555         return true;
8556       return get_optab_extraction_insn (insn, type, mode, insv_optab,
8557                                         insvmisalign_optab, 2);
8558
8559     case EP_extv:
8560       if (HAVE_extv
8561           && get_traditional_extraction_insn (insn, type, mode,
8562                                               CODE_FOR_extv, 1, 0))
8563         return true;
8564       return get_optab_extraction_insn (insn, type, mode, extv_optab,
8565                                         extvmisalign_optab, 3);
8566
8567     case EP_extzv:
8568       if (HAVE_extzv
8569           && get_traditional_extraction_insn (insn, type, mode,
8570                                               CODE_FOR_extzv, 1, 0))
8571         return true;
8572       return get_optab_extraction_insn (insn, type, mode, extzv_optab,
8573                                         extzvmisalign_optab, 3);
8574
8575     default:
8576       gcc_unreachable ();
8577     }
8578 }
8579
8580 /* Return true if an instruction exists to access a field of mode
8581    FIELDMODE in a structure that has STRUCT_BITS significant bits.
8582    Describe the "best" such instruction in *INSN if so.  PATTERN and
8583    TYPE describe the type of insertion or extraction we want to perform.
8584
8585    For an insertion, the number of significant structure bits includes
8586    all bits of the target.  For an extraction, it need only include the
8587    most significant bit of the field.  Larger widths are acceptable
8588    in both cases.  */
8589
8590 static bool
8591 get_best_extraction_insn (extraction_insn *insn,
8592                           enum extraction_pattern pattern,
8593                           enum extraction_type type,
8594                           unsigned HOST_WIDE_INT struct_bits,
8595                           machine_mode field_mode)
8596 {
8597   machine_mode mode = smallest_mode_for_size (struct_bits, MODE_INT);
8598   while (mode != VOIDmode)
8599     {
8600       if (get_extraction_insn (insn, pattern, type, mode))
8601         {
8602           while (mode != VOIDmode
8603                  && GET_MODE_SIZE (mode) <= GET_MODE_SIZE (field_mode)
8604                  && !TRULY_NOOP_TRUNCATION_MODES_P (insn->field_mode,
8605                                                     field_mode))
8606             {
8607               get_extraction_insn (insn, pattern, type, mode);
8608               mode = GET_MODE_WIDER_MODE (mode);
8609             }
8610           return true;
8611         }
8612       mode = GET_MODE_WIDER_MODE (mode);
8613     }
8614   return false;
8615 }
8616
8617 /* Return true if an instruction exists to access a field of mode
8618    FIELDMODE in a register structure that has STRUCT_BITS significant bits.
8619    Describe the "best" such instruction in *INSN if so.  PATTERN describes
8620    the type of insertion or extraction we want to perform.
8621
8622    For an insertion, the number of significant structure bits includes
8623    all bits of the target.  For an extraction, it need only include the
8624    most significant bit of the field.  Larger widths are acceptable
8625    in both cases.  */
8626
8627 bool
8628 get_best_reg_extraction_insn (extraction_insn *insn,
8629                               enum extraction_pattern pattern,
8630                               unsigned HOST_WIDE_INT struct_bits,
8631                               machine_mode field_mode)
8632 {
8633   return get_best_extraction_insn (insn, pattern, ET_reg, struct_bits,
8634                                    field_mode);
8635 }
8636
8637 /* Return true if an instruction exists to access a field of BITSIZE
8638    bits starting BITNUM bits into a memory structure.  Describe the
8639    "best" such instruction in *INSN if so.  PATTERN describes the type
8640    of insertion or extraction we want to perform and FIELDMODE is the
8641    natural mode of the extracted field.
8642
8643    The instructions considered here only access bytes that overlap
8644    the bitfield; they do not touch any surrounding bytes.  */
8645
8646 bool
8647 get_best_mem_extraction_insn (extraction_insn *insn,
8648                               enum extraction_pattern pattern,
8649                               HOST_WIDE_INT bitsize, HOST_WIDE_INT bitnum,
8650                               machine_mode field_mode)
8651 {
8652   unsigned HOST_WIDE_INT struct_bits = (bitnum % BITS_PER_UNIT
8653                                         + bitsize
8654                                         + BITS_PER_UNIT - 1);
8655   struct_bits -= struct_bits % BITS_PER_UNIT;
8656   return get_best_extraction_insn (insn, pattern, ET_unaligned_mem,
8657                                    struct_bits, field_mode);
8658 }
8659
8660 /* Determine whether "1 << x" is relatively cheap in word_mode.  */
8661
8662 bool
8663 lshift_cheap_p (bool speed_p)
8664 {
8665   /* FIXME: This should be made target dependent via this "this_target"
8666      mechanism, similar to e.g. can_copy_init_p in gcse.c.  */
8667   static bool init[2] = { false, false };
8668   static bool cheap[2] = { true, true };
8669
8670   /* If the targer has no lshift in word_mode, the operation will most
8671      probably not be cheap.  ??? Does GCC even work for such targets?  */
8672   if (optab_handler (ashl_optab, word_mode) == CODE_FOR_nothing)
8673     return false;
8674
8675   if (!init[speed_p])
8676     {
8677       rtx reg = gen_raw_REG (word_mode, 10000);
8678       int cost = set_src_cost (gen_rtx_ASHIFT (word_mode, const1_rtx, reg),
8679                                speed_p);
8680       cheap[speed_p] = cost < COSTS_N_INSNS (3);
8681       init[speed_p] = true;
8682     }
8683
8684   return cheap[speed_p];
8685 }
8686
8687 #include "gt-optabs.h"