Add support for in-order addition reduction using SVE FADDA
[official-gcc.git] / gcc / internal-fn.c
blob 42cdf1345e560b297cf1b83e3fcc5b88e2109c84
1 /* Internal functions.
2 Copyright (C) 2011-2018 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify it under
7 the terms of the GNU General Public License as published by the Free
8 Software Foundation; either version 3, or (at your option) any later
9 version.
11 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
13 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
14 for more details.
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
20 #include "config.h"
21 #include "system.h"
22 #include "coretypes.h"
23 #include "backend.h"
24 #include "target.h"
25 #include "rtl.h"
26 #include "tree.h"
27 #include "gimple.h"
28 #include "predict.h"
29 #include "stringpool.h"
30 #include "tree-vrp.h"
31 #include "tree-ssanames.h"
32 #include "expmed.h"
33 #include "memmodel.h"
34 #include "optabs.h"
35 #include "emit-rtl.h"
36 #include "diagnostic-core.h"
37 #include "fold-const.h"
38 #include "internal-fn.h"
39 #include "stor-layout.h"
40 #include "dojump.h"
41 #include "expr.h"
42 #include "stringpool.h"
43 #include "attribs.h"
44 #include "asan.h"
45 #include "ubsan.h"
46 #include "recog.h"
47 #include "builtins.h"
48 #include "optabs-tree.h"
49 #include "gimple-ssa.h"
50 #include "tree-phinodes.h"
51 #include "ssa-iterators.h"
53 /* The names of each internal function, indexed by function number. */
54 const char *const internal_fn_name_array[] = {
55 #define DEF_INTERNAL_FN(CODE, FLAGS, FNSPEC) #CODE,
56 #include "internal-fn.def"
57 "<invalid-fn>"
60 /* The ECF_* flags of each internal function, indexed by function number. */
61 const int internal_fn_flags_array[] = {
62 #define DEF_INTERNAL_FN(CODE, FLAGS, FNSPEC) FLAGS,
63 #include "internal-fn.def"
67 /* Fnspec of each internal function, indexed by function number. */
68 const_tree internal_fn_fnspec_array[IFN_LAST + 1];
70 void
71 init_internal_fns ()
73 #define DEF_INTERNAL_FN(CODE, FLAGS, FNSPEC) \
74 if (FNSPEC) internal_fn_fnspec_array[IFN_##CODE] = \
75 build_string ((int) sizeof (FNSPEC), FNSPEC ? FNSPEC : "");
76 #include "internal-fn.def"
77 internal_fn_fnspec_array[IFN_LAST] = 0;
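/* A minimal sketch of how the X-macro pattern above expands, assuming a
   hypothetical entry DEF_INTERNAL_FN (FOO, ECF_CONST | ECF_LEAF, NULL)
   in internal-fn.def (the real entries live in that file):
     internal_fn_name_array[]  gains the string "FOO",
     internal_fn_flags_array[] gains ECF_CONST | ECF_LEAF, and
     init_internal_fns leaves internal_fn_fnspec_array[IFN_FOO] null,
     because the FNSPEC argument is NULL.  */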
80 /* Create static initializers for the information returned by
81 direct_internal_fn. */
82 #define not_direct { -2, -2, false }
83 #define mask_load_direct { -1, 2, false }
84 #define load_lanes_direct { -1, -1, false }
85 #define mask_load_lanes_direct { -1, -1, false }
86 #define mask_store_direct { 3, 2, false }
87 #define store_lanes_direct { 0, 0, false }
88 #define mask_store_lanes_direct { 0, 0, false }
89 #define unary_direct { 0, 0, true }
90 #define binary_direct { 0, 0, true }
91 #define cond_unary_direct { 1, 1, true }
92 #define cond_binary_direct { 1, 1, true }
93 #define while_direct { 0, 2, false }
94 #define fold_extract_direct { 2, 2, false }
95 #define fold_left_direct { 1, 1, false }
97 const direct_internal_fn_info direct_internal_fn_array[IFN_LAST + 1] = {
98 #define DEF_INTERNAL_FN(CODE, FLAGS, FNSPEC) not_direct,
99 #define DEF_INTERNAL_OPTAB_FN(CODE, FLAGS, OPTAB, TYPE) TYPE##_direct,
100 #define DEF_INTERNAL_SIGNED_OPTAB_FN(CODE, FLAGS, SELECTOR, SIGNED_OPTAB, \
101 UNSIGNED_OPTAB, TYPE) TYPE##_direct,
102 #include "internal-fn.def"
103 not_direct
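/* Illustrative reading of the { type0, type1, vectorizable } triplets above,
   following the description of direct_internal_fn_info in internal-fn.h:
   -1 means the optab mode is taken from the return type, a non-negative
   value names the call argument that supplies it, and the flag says whether
   the function can be vectorized pointwise.  For instance,
   mask_load_direct { -1, 2, false } takes its first mode from the lhs and
   its second from argument 2 (the mask), while fold_left_direct { 1, 1, false }
   (used by the in-order addition reduction named in this change) keys both
   modes off argument 1, the vector being reduced.  */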
106 /* ARRAY_TYPE is an array of vector modes. Return the associated insn
107 for load-lanes-style optab OPTAB, or CODE_FOR_nothing if none. */
109 static enum insn_code
110 get_multi_vector_move (tree array_type, convert_optab optab)
112 machine_mode imode;
113 machine_mode vmode;
115 gcc_assert (TREE_CODE (array_type) == ARRAY_TYPE);
116 imode = TYPE_MODE (array_type);
117 vmode = TYPE_MODE (TREE_TYPE (array_type));
119 return convert_optab_handler (optab, imode, vmode);
122 /* Expand LOAD_LANES call STMT using optab OPTAB. */
124 static void
125 expand_load_lanes_optab_fn (internal_fn, gcall *stmt, convert_optab optab)
127 struct expand_operand ops[2];
128 tree type, lhs, rhs;
129 rtx target, mem;
131 lhs = gimple_call_lhs (stmt);
132 rhs = gimple_call_arg (stmt, 0);
133 type = TREE_TYPE (lhs);
135 target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
136 mem = expand_normal (rhs);
138 gcc_assert (MEM_P (mem));
139 PUT_MODE (mem, TYPE_MODE (type));
141 create_output_operand (&ops[0], target, TYPE_MODE (type));
142 create_fixed_operand (&ops[1], mem);
143 expand_insn (get_multi_vector_move (type, optab), 2, ops);
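/* As a rough illustration (target-dependent, not from this file): on a
   target whose vec_load_lanes pattern maps to something like AArch64 LD3,
   a call whose lhs has an array-of-three-vectors type expands here to a
   single multi-register load that de-interleaves x[0], x[1], x[2], ...
   into the three destination vectors.  */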
146 /* Expand STORE_LANES call STMT using optab OPTAB. */
148 static void
149 expand_store_lanes_optab_fn (internal_fn, gcall *stmt, convert_optab optab)
151 struct expand_operand ops[2];
152 tree type, lhs, rhs;
153 rtx target, reg;
155 lhs = gimple_call_lhs (stmt);
156 rhs = gimple_call_arg (stmt, 0);
157 type = TREE_TYPE (rhs);
159 target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
160 reg = expand_normal (rhs);
162 gcc_assert (MEM_P (target));
163 PUT_MODE (target, TYPE_MODE (type));
165 create_fixed_operand (&ops[0], target);
166 create_input_operand (&ops[1], reg, TYPE_MODE (type));
167 expand_insn (get_multi_vector_move (type, optab), 2, ops);
170 static void
171 expand_ANNOTATE (internal_fn, gcall *)
173 gcc_unreachable ();
176 /* This should get expanded in omp_device_lower pass. */
178 static void
179 expand_GOMP_USE_SIMT (internal_fn, gcall *)
181 gcc_unreachable ();
184 /* This should get expanded in omp_device_lower pass. */
186 static void
187 expand_GOMP_SIMT_ENTER (internal_fn, gcall *)
189 gcc_unreachable ();
192 /* Allocate per-lane storage and begin non-uniform execution region. */
194 static void
195 expand_GOMP_SIMT_ENTER_ALLOC (internal_fn, gcall *stmt)
197 rtx target;
198 tree lhs = gimple_call_lhs (stmt);
199 if (lhs)
200 target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
201 else
202 target = gen_reg_rtx (Pmode);
203 rtx size = expand_normal (gimple_call_arg (stmt, 0));
204 rtx align = expand_normal (gimple_call_arg (stmt, 1));
205 struct expand_operand ops[3];
206 create_output_operand (&ops[0], target, Pmode);
207 create_input_operand (&ops[1], size, Pmode);
208 create_input_operand (&ops[2], align, Pmode);
209 gcc_assert (targetm.have_omp_simt_enter ());
210 expand_insn (targetm.code_for_omp_simt_enter, 3, ops);
213 /* Deallocate per-lane storage and leave non-uniform execution region. */
215 static void
216 expand_GOMP_SIMT_EXIT (internal_fn, gcall *stmt)
218 gcc_checking_assert (!gimple_call_lhs (stmt));
219 rtx arg = expand_normal (gimple_call_arg (stmt, 0));
220 struct expand_operand ops[1];
221 create_input_operand (&ops[0], arg, Pmode);
222 gcc_assert (targetm.have_omp_simt_exit ());
223 expand_insn (targetm.code_for_omp_simt_exit, 1, ops);
226 /* Lane index on SIMT targets: thread index in the warp on NVPTX. On targets
227 without SIMT execution this should be expanded in omp_device_lower pass. */
229 static void
230 expand_GOMP_SIMT_LANE (internal_fn, gcall *stmt)
232 tree lhs = gimple_call_lhs (stmt);
233 if (!lhs)
234 return;
236 rtx target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
237 gcc_assert (targetm.have_omp_simt_lane ());
238 emit_insn (targetm.gen_omp_simt_lane (target));
241 /* This should get expanded in omp_device_lower pass. */
243 static void
244 expand_GOMP_SIMT_VF (internal_fn, gcall *)
246 gcc_unreachable ();
249 /* Lane index of the first SIMT lane that supplies a non-zero argument.
250 This is a SIMT counterpart to GOMP_SIMD_LAST_LANE, used to represent the
251 lane that executed the last iteration for handling OpenMP lastprivate. */
253 static void
254 expand_GOMP_SIMT_LAST_LANE (internal_fn, gcall *stmt)
256 tree lhs = gimple_call_lhs (stmt);
257 if (!lhs)
258 return;
260 rtx target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
261 rtx cond = expand_normal (gimple_call_arg (stmt, 0));
262 machine_mode mode = TYPE_MODE (TREE_TYPE (lhs));
263 struct expand_operand ops[2];
264 create_output_operand (&ops[0], target, mode);
265 create_input_operand (&ops[1], cond, mode);
266 gcc_assert (targetm.have_omp_simt_last_lane ());
267 expand_insn (targetm.code_for_omp_simt_last_lane, 2, ops);
270 /* Non-transparent predicate used in SIMT lowering of OpenMP "ordered". */
272 static void
273 expand_GOMP_SIMT_ORDERED_PRED (internal_fn, gcall *stmt)
275 tree lhs = gimple_call_lhs (stmt);
276 if (!lhs)
277 return;
279 rtx target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
280 rtx ctr = expand_normal (gimple_call_arg (stmt, 0));
281 machine_mode mode = TYPE_MODE (TREE_TYPE (lhs));
282 struct expand_operand ops[2];
283 create_output_operand (&ops[0], target, mode);
284 create_input_operand (&ops[1], ctr, mode);
285 gcc_assert (targetm.have_omp_simt_ordered ());
286 expand_insn (targetm.code_for_omp_simt_ordered, 2, ops);
289 /* "Or" boolean reduction across SIMT lanes: return non-zero in all lanes if
290 any lane supplies a non-zero argument. */
292 static void
293 expand_GOMP_SIMT_VOTE_ANY (internal_fn, gcall *stmt)
295 tree lhs = gimple_call_lhs (stmt);
296 if (!lhs)
297 return;
299 rtx target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
300 rtx cond = expand_normal (gimple_call_arg (stmt, 0));
301 machine_mode mode = TYPE_MODE (TREE_TYPE (lhs));
302 struct expand_operand ops[2];
303 create_output_operand (&ops[0], target, mode);
304 create_input_operand (&ops[1], cond, mode);
305 gcc_assert (targetm.have_omp_simt_vote_any ());
306 expand_insn (targetm.code_for_omp_simt_vote_any, 2, ops);
309 /* Exchange between SIMT lanes with a "butterfly" pattern: source lane index
310 is destination lane index XOR given offset. */
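/* For instance, with offset 1 the exchange pairs lanes 0<->1, 2<->3, and so
   on; with offset 2 it pairs 0<->2, 1<->3 (illustrative only, the actual
   data movement is whatever the target's omp_simt_xchg_bfly pattern does).  */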
312 static void
313 expand_GOMP_SIMT_XCHG_BFLY (internal_fn, gcall *stmt)
315 tree lhs = gimple_call_lhs (stmt);
316 if (!lhs)
317 return;
319 rtx target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
320 rtx src = expand_normal (gimple_call_arg (stmt, 0));
321 rtx idx = expand_normal (gimple_call_arg (stmt, 1));
322 machine_mode mode = TYPE_MODE (TREE_TYPE (lhs));
323 struct expand_operand ops[3];
324 create_output_operand (&ops[0], target, mode);
325 create_input_operand (&ops[1], src, mode);
326 create_input_operand (&ops[2], idx, SImode);
327 gcc_assert (targetm.have_omp_simt_xchg_bfly ());
328 expand_insn (targetm.code_for_omp_simt_xchg_bfly, 3, ops);
331 /* Exchange between SIMT lanes according to given source lane index. */
333 static void
334 expand_GOMP_SIMT_XCHG_IDX (internal_fn, gcall *stmt)
336 tree lhs = gimple_call_lhs (stmt);
337 if (!lhs)
338 return;
340 rtx target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
341 rtx src = expand_normal (gimple_call_arg (stmt, 0));
342 rtx idx = expand_normal (gimple_call_arg (stmt, 1));
343 machine_mode mode = TYPE_MODE (TREE_TYPE (lhs));
344 struct expand_operand ops[3];
345 create_output_operand (&ops[0], target, mode);
346 create_input_operand (&ops[1], src, mode);
347 create_input_operand (&ops[2], idx, SImode);
348 gcc_assert (targetm.have_omp_simt_xchg_idx ());
349 expand_insn (targetm.code_for_omp_simt_xchg_idx, 3, ops);
352 /* This should get expanded in adjust_simduid_builtins. */
354 static void
355 expand_GOMP_SIMD_LANE (internal_fn, gcall *)
357 gcc_unreachable ();
360 /* This should get expanded in adjust_simduid_builtins. */
362 static void
363 expand_GOMP_SIMD_VF (internal_fn, gcall *)
365 gcc_unreachable ();
368 /* This should get expanded in adjust_simduid_builtins. */
370 static void
371 expand_GOMP_SIMD_LAST_LANE (internal_fn, gcall *)
373 gcc_unreachable ();
376 /* This should get expanded in adjust_simduid_builtins. */
378 static void
379 expand_GOMP_SIMD_ORDERED_START (internal_fn, gcall *)
381 gcc_unreachable ();
384 /* This should get expanded in adjust_simduid_builtins. */
386 static void
387 expand_GOMP_SIMD_ORDERED_END (internal_fn, gcall *)
389 gcc_unreachable ();
392 /* This should get expanded in the sanopt pass. */
394 static void
395 expand_UBSAN_NULL (internal_fn, gcall *)
397 gcc_unreachable ();
400 /* This should get expanded in the sanopt pass. */
402 static void
403 expand_UBSAN_BOUNDS (internal_fn, gcall *)
405 gcc_unreachable ();
408 /* This should get expanded in the sanopt pass. */
410 static void
411 expand_UBSAN_VPTR (internal_fn, gcall *)
413 gcc_unreachable ();
416 /* This should get expanded in the sanopt pass. */
418 static void
419 expand_UBSAN_PTR (internal_fn, gcall *)
421 gcc_unreachable ();
424 /* This should get expanded in the sanopt pass. */
426 static void
427 expand_UBSAN_OBJECT_SIZE (internal_fn, gcall *)
429 gcc_unreachable ();
432 /* This should get expanded in the sanopt pass. */
434 static void
435 expand_ASAN_CHECK (internal_fn, gcall *)
437 gcc_unreachable ();
440 /* This should get expanded in the sanopt pass. */
442 static void
443 expand_ASAN_MARK (internal_fn, gcall *)
445 gcc_unreachable ();
448 /* This should get expanded in the sanopt pass. */
450 static void
451 expand_ASAN_POISON (internal_fn, gcall *)
453 gcc_unreachable ();
456 /* This should get expanded in the sanopt pass. */
458 static void
459 expand_ASAN_POISON_USE (internal_fn, gcall *)
461 gcc_unreachable ();
464 /* This should get expanded in the tsan pass. */
466 static void
467 expand_TSAN_FUNC_EXIT (internal_fn, gcall *)
469 gcc_unreachable ();
472 /* This should get expanded in the lower pass. */
474 static void
475 expand_FALLTHROUGH (internal_fn, gcall *call)
477 error_at (gimple_location (call),
478 "invalid use of attribute %<fallthrough%>");
481 /* Return minimum precision needed to represent all values
482 of ARG in SIGNed integral type. */
484 static int
485 get_min_precision (tree arg, signop sign)
487 int prec = TYPE_PRECISION (TREE_TYPE (arg));
488 int cnt = 0;
489 signop orig_sign = sign;
490 if (TREE_CODE (arg) == INTEGER_CST)
492 int p;
493 if (TYPE_SIGN (TREE_TYPE (arg)) != sign)
495 widest_int w = wi::to_widest (arg);
496 w = wi::ext (w, prec, sign);
497 p = wi::min_precision (w, sign);
499 else
500 p = wi::min_precision (wi::to_wide (arg), sign);
501 return MIN (p, prec);
503 while (CONVERT_EXPR_P (arg)
504 && INTEGRAL_TYPE_P (TREE_TYPE (TREE_OPERAND (arg, 0)))
505 && TYPE_PRECISION (TREE_TYPE (TREE_OPERAND (arg, 0))) <= prec)
507 arg = TREE_OPERAND (arg, 0);
508 if (TYPE_PRECISION (TREE_TYPE (arg)) < prec)
510 if (TYPE_UNSIGNED (TREE_TYPE (arg)))
511 sign = UNSIGNED;
512 else if (sign == UNSIGNED && get_range_pos_neg (arg) != 1)
513 return prec + (orig_sign != sign);
514 prec = TYPE_PRECISION (TREE_TYPE (arg));
516 if (++cnt > 30)
517 return prec + (orig_sign != sign);
519 if (TREE_CODE (arg) != SSA_NAME)
520 return prec + (orig_sign != sign);
521 wide_int arg_min, arg_max;
522 while (get_range_info (arg, &arg_min, &arg_max) != VR_RANGE)
524 gimple *g = SSA_NAME_DEF_STMT (arg);
525 if (is_gimple_assign (g)
526 && CONVERT_EXPR_CODE_P (gimple_assign_rhs_code (g)))
528 tree t = gimple_assign_rhs1 (g);
529 if (INTEGRAL_TYPE_P (TREE_TYPE (t))
530 && TYPE_PRECISION (TREE_TYPE (t)) <= prec)
532 arg = t;
533 if (TYPE_PRECISION (TREE_TYPE (arg)) < prec)
535 if (TYPE_UNSIGNED (TREE_TYPE (arg)))
536 sign = UNSIGNED;
537 else if (sign == UNSIGNED && get_range_pos_neg (arg) != 1)
538 return prec + (orig_sign != sign);
539 prec = TYPE_PRECISION (TREE_TYPE (arg));
541 if (++cnt > 30)
542 return prec + (orig_sign != sign);
543 continue;
546 return prec + (orig_sign != sign);
548 if (sign == TYPE_SIGN (TREE_TYPE (arg)))
550 int p1 = wi::min_precision (arg_min, sign);
551 int p2 = wi::min_precision (arg_max, sign);
552 p1 = MAX (p1, p2);
553 prec = MIN (prec, p1);
555 else if (sign == UNSIGNED && !wi::neg_p (arg_min, SIGNED))
557 int p = wi::min_precision (arg_max, UNSIGNED);
558 prec = MIN (prec, p);
560 return prec + (orig_sign != sign);
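/* Worked examples with assumed values: for an unsigned char SSA name with a
   recorded value range of [0, 100], get_min_precision (arg, UNSIGNED)
   returns 7, since 100 needs seven bits; for the signed char constant -3
   with SIGNED requested, it returns 3.  The various
   "return prec + (orig_sign != sign)" paths add one extra bit whenever the
   tracked signedness had to change from the sign the caller asked for.  */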
563 /* Helper for expand_*_overflow. Set the __imag__ part to true
564 (1 except for signed:1 type, in which case store -1). */
566 static void
567 expand_arith_set_overflow (tree lhs, rtx target)
569 if (TYPE_PRECISION (TREE_TYPE (TREE_TYPE (lhs))) == 1
570 && !TYPE_UNSIGNED (TREE_TYPE (TREE_TYPE (lhs))))
571 write_complex_part (target, constm1_rtx, true);
572 else
573 write_complex_part (target, const1_rtx, true);
576 /* Helper for expand_*_overflow. Store RES into the __real__ part
577 of TARGET. If RES has larger MODE than __real__ part of TARGET,
578 set the __imag__ part to 1 if RES doesn't fit into it. Similarly
579 if LHS has smaller precision than its mode. */
581 static void
582 expand_arith_overflow_result_store (tree lhs, rtx target,
583 scalar_int_mode mode, rtx res)
585 scalar_int_mode tgtmode
586 = as_a <scalar_int_mode> (GET_MODE_INNER (GET_MODE (target)));
587 rtx lres = res;
588 if (tgtmode != mode)
590 rtx_code_label *done_label = gen_label_rtx ();
591 int uns = TYPE_UNSIGNED (TREE_TYPE (TREE_TYPE (lhs)));
592 lres = convert_modes (tgtmode, mode, res, uns);
593 gcc_assert (GET_MODE_PRECISION (tgtmode) < GET_MODE_PRECISION (mode));
594 do_compare_rtx_and_jump (res, convert_modes (mode, tgtmode, lres, uns),
595 EQ, true, mode, NULL_RTX, NULL, done_label,
596 profile_probability::very_likely ());
597 expand_arith_set_overflow (lhs, target);
598 emit_label (done_label);
600 int prec = TYPE_PRECISION (TREE_TYPE (TREE_TYPE (lhs)));
601 int tgtprec = GET_MODE_PRECISION (tgtmode);
602 if (prec < tgtprec)
604 rtx_code_label *done_label = gen_label_rtx ();
605 int uns = TYPE_UNSIGNED (TREE_TYPE (TREE_TYPE (lhs)));
606 res = lres;
607 if (uns)
609 rtx mask
610 = immed_wide_int_const (wi::shifted_mask (0, prec, false, tgtprec),
611 tgtmode);
612 lres = expand_simple_binop (tgtmode, AND, res, mask, NULL_RTX,
613 true, OPTAB_LIB_WIDEN);
615 else
617 lres = expand_shift (LSHIFT_EXPR, tgtmode, res, tgtprec - prec,
618 NULL_RTX, 1);
619 lres = expand_shift (RSHIFT_EXPR, tgtmode, lres, tgtprec - prec,
620 NULL_RTX, 0);
622 do_compare_rtx_and_jump (res, lres,
623 EQ, true, tgtmode, NULL_RTX, NULL, done_label,
624 profile_probability::very_likely ());
625 expand_arith_set_overflow (lhs, target);
626 emit_label (done_label);
628 write_complex_part (target, lres, false);
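/* A worked instance of the prec < tgtprec check above (assumed numbers):
   with a signed 8-bit lhs stored in a 32-bit mode, tgtprec - prec is 24, so
   RES is shifted left by 24 and arithmetically back right by 24; the
   round-trip changes the value exactly when RES does not fit in 8 signed
   bits, in which case the __imag__ overflow flag is set.  In the unsigned
   case the mask of the low 8 bits (0xff) plays the same role.  */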
631 /* Helper for expand_*_overflow. Store RES into TARGET. */
633 static void
634 expand_ubsan_result_store (rtx target, rtx res)
636 if (GET_CODE (target) == SUBREG && SUBREG_PROMOTED_VAR_P (target))
637 /* If this is a scalar in a register that is stored in a wider mode
638 than the declared mode, compute the result into its declared mode
639 and then convert to the wider mode. Our value is the computed
640 expression. */
641 convert_move (SUBREG_REG (target), res, SUBREG_PROMOTED_SIGN (target));
642 else
643 emit_move_insn (target, res);
646 /* Add sub/add overflow checking to the statement STMT.
647 CODE says whether the operation is + or -. */
649 static void
650 expand_addsub_overflow (location_t loc, tree_code code, tree lhs,
651 tree arg0, tree arg1, bool unsr_p, bool uns0_p,
652 bool uns1_p, bool is_ubsan, tree *datap)
654 rtx res, target = NULL_RTX;
655 tree fn;
656 rtx_code_label *done_label = gen_label_rtx ();
657 rtx_code_label *do_error = gen_label_rtx ();
658 do_pending_stack_adjust ();
659 rtx op0 = expand_normal (arg0);
660 rtx op1 = expand_normal (arg1);
661 scalar_int_mode mode = SCALAR_INT_TYPE_MODE (TREE_TYPE (arg0));
662 int prec = GET_MODE_PRECISION (mode);
663 rtx sgn = immed_wide_int_const (wi::min_value (prec, SIGNED), mode);
664 bool do_xor = false;
666 if (is_ubsan)
667 gcc_assert (!unsr_p && !uns0_p && !uns1_p);
669 if (lhs)
671 target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
672 if (!is_ubsan)
673 write_complex_part (target, const0_rtx, true);
676 /* We assume both operands and result have the same precision
677 here (GET_MODE_BITSIZE (mode)), S stands for signed type
678 with that precision, U for unsigned type with that precision,
679 sgn for unsigned most significant bit in that precision.
680 s1 is signed first operand, u1 is unsigned first operand,
681 s2 is signed second operand, u2 is unsigned second operand,
682 sr is signed result, ur is unsigned result and the following
683 rules say how to compute result (which is always result of
684 the operands as if both were unsigned, cast to the right
685 signedness) and how to compute whether operation overflowed.
687 s1 + s2 -> sr
688 res = (S) ((U) s1 + (U) s2)
689 ovf = s2 < 0 ? res > s1 : res < s1 (or jump on overflow)
690 s1 - s2 -> sr
691 res = (S) ((U) s1 - (U) s2)
692 ovf = s2 < 0 ? res < s1 : res > s1 (or jump on overflow)
693 u1 + u2 -> ur
694 res = u1 + u2
695 ovf = res < u1 (or jump on carry, but RTL opts will handle it)
696 u1 - u2 -> ur
697 res = u1 - u2
698 ovf = res > u1 (or jump on carry, but RTL opts will handle it)
699 s1 + u2 -> sr
700 res = (S) ((U) s1 + u2)
701 ovf = ((U) res ^ sgn) < u2
702 s1 + u2 -> ur
703 t1 = (S) (u2 ^ sgn)
704 t2 = s1 + t1
705 res = (U) t2 ^ sgn
706 ovf = t1 < 0 ? t2 > s1 : t2 < s1 (or jump on overflow)
707 s1 - u2 -> sr
708 res = (S) ((U) s1 - u2)
709 ovf = u2 > ((U) s1 ^ sgn)
710 s1 - u2 -> ur
711 res = (U) s1 - u2
712 ovf = s1 < 0 || u2 > (U) s1
713 u1 - s2 -> sr
714 res = u1 - (U) s2
715 ovf = u1 >= ((U) s2 ^ sgn)
716 u1 - s2 -> ur
717 t1 = u1 ^ sgn
718 t2 = t1 - (U) s2
719 res = t2 ^ sgn
720 ovf = s2 < 0 ? (S) t2 < (S) t1 : (S) t2 > (S) t1 (or jump on overflow)
721 s1 + s2 -> ur
722 res = (U) s1 + (U) s2
723 ovf = s2 < 0 ? ((s1 | (S) res) < 0) : ((s1 & (S) res) < 0)
724 u1 + u2 -> sr
725 res = (S) (u1 + u2)
726 ovf = (U) res < u2 || res < 0
727 u1 - u2 -> sr
728 res = (S) (u1 - u2)
729 ovf = u1 >= u2 ? res < 0 : res >= 0
730 s1 - s2 -> ur
731 res = (U) s1 - (U) s2
732 ovf = s2 >= 0 ? ((s1 | (S) res) < 0) : ((s1 & (S) res) < 0) */
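/* Two worked instances of the rules above, assuming 8-bit operands:
   s1 + s2 -> sr with s1 = 100, s2 = 50: res = (S) 150 = -106; since
   s2 >= 0 and res < s1, overflow is reported (150 > 127).  With s2 = -50
   instead, res = 50, which is not greater than s1, so no overflow.
   u1 - u2 -> ur with u1 = 5, u2 = 10: res wraps to 251 and res > u1
   signals the overflow.  */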
734 if (code == PLUS_EXPR && uns0_p && !uns1_p)
736 /* PLUS_EXPR is commutative, if operand signedness differs,
737 canonicalize to the first operand being signed and second
738 unsigned to simplify following code. */
739 std::swap (op0, op1);
740 std::swap (arg0, arg1);
741 uns0_p = false;
742 uns1_p = true;
745 /* u1 +- u2 -> ur */
746 if (uns0_p && uns1_p && unsr_p)
748 insn_code icode = optab_handler (code == PLUS_EXPR ? uaddv4_optab
749 : usubv4_optab, mode);
750 if (icode != CODE_FOR_nothing)
752 struct expand_operand ops[4];
753 rtx_insn *last = get_last_insn ();
755 res = gen_reg_rtx (mode);
756 create_output_operand (&ops[0], res, mode);
757 create_input_operand (&ops[1], op0, mode);
758 create_input_operand (&ops[2], op1, mode);
759 create_fixed_operand (&ops[3], do_error);
760 if (maybe_expand_insn (icode, 4, ops))
762 last = get_last_insn ();
763 if (profile_status_for_fn (cfun) != PROFILE_ABSENT
764 && JUMP_P (last)
765 && any_condjump_p (last)
766 && !find_reg_note (last, REG_BR_PROB, 0))
767 add_reg_br_prob_note (last,
768 profile_probability::very_unlikely ());
769 emit_jump (done_label);
770 goto do_error_label;
773 delete_insns_since (last);
776 /* Compute the operation. On RTL level, the addition is always
777 unsigned. */
778 res = expand_binop (mode, code == PLUS_EXPR ? add_optab : sub_optab,
779 op0, op1, NULL_RTX, false, OPTAB_LIB_WIDEN);
780 rtx tem = op0;
781 /* For PLUS_EXPR, the operation is commutative, so we can pick
782 operand to compare against. For prec <= BITS_PER_WORD, I think
783 preferring a REG operand over a CONST_INT is better, because
784 the CONST_INT might enlarge the instruction or CSE would need
785 to figure out we'd already loaded it into a register before.
786 For prec > BITS_PER_WORD, I think CONST_INT might be more beneficial,
787 as then the multi-word comparison can be perhaps simplified. */
788 if (code == PLUS_EXPR
789 && (prec <= BITS_PER_WORD
790 ? (CONST_SCALAR_INT_P (op0) && REG_P (op1))
791 : CONST_SCALAR_INT_P (op1)))
792 tem = op1;
793 do_compare_rtx_and_jump (res, tem, code == PLUS_EXPR ? GEU : LEU,
794 true, mode, NULL_RTX, NULL, done_label,
795 profile_probability::very_likely ());
796 goto do_error_label;
799 /* s1 +- u2 -> sr */
800 if (!uns0_p && uns1_p && !unsr_p)
802 /* Compute the operation. On RTL level, the addition is always
803 unsigned. */
804 res = expand_binop (mode, code == PLUS_EXPR ? add_optab : sub_optab,
805 op0, op1, NULL_RTX, false, OPTAB_LIB_WIDEN);
806 rtx tem = expand_binop (mode, add_optab,
807 code == PLUS_EXPR ? res : op0, sgn,
808 NULL_RTX, false, OPTAB_LIB_WIDEN);
809 do_compare_rtx_and_jump (tem, op1, GEU, true, mode, NULL_RTX, NULL,
810 done_label, profile_probability::very_likely ());
811 goto do_error_label;
814 /* s1 + u2 -> ur */
815 if (code == PLUS_EXPR && !uns0_p && uns1_p && unsr_p)
817 op1 = expand_binop (mode, add_optab, op1, sgn, NULL_RTX, false,
818 OPTAB_LIB_WIDEN);
819 /* As we've changed op1, we have to avoid using the value range
820 for the original argument. */
821 arg1 = error_mark_node;
822 do_xor = true;
823 goto do_signed;
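/* A small worked example of the biasing trick above, assuming 8-bit values
   and sgn = 0x80: for s1 = -10, u2 = 200, op1 becomes (S) (200 ^ 0x80) = 72,
   the signed addition -10 + 72 = 62 does not overflow, and the final
   res ^ sgn = 190 equals -10 + 200.  For s1 = -10, u2 = 5, op1 becomes
   (S) 133 = -123 and -10 + -123 overflows, matching the fact that -5 has no
   unsigned representation.  */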
826 /* u1 - s2 -> ur */
827 if (code == MINUS_EXPR && uns0_p && !uns1_p && unsr_p)
829 op0 = expand_binop (mode, add_optab, op0, sgn, NULL_RTX, false,
830 OPTAB_LIB_WIDEN);
831 /* As we've changed op0, we have to avoid using the value range
832 for the original argument. */
833 arg0 = error_mark_node;
834 do_xor = true;
835 goto do_signed;
838 /* s1 - u2 -> ur */
839 if (code == MINUS_EXPR && !uns0_p && uns1_p && unsr_p)
841 /* Compute the operation. On RTL level, the subtraction is always
842 unsigned. */
843 res = expand_binop (mode, sub_optab, op0, op1, NULL_RTX, false,
844 OPTAB_LIB_WIDEN);
845 int pos_neg = get_range_pos_neg (arg0);
846 if (pos_neg == 2)
847 /* If ARG0 is known to be always negative, this is always overflow. */
848 emit_jump (do_error);
849 else if (pos_neg == 3)
850 /* If ARG0 is not known to be always positive, check at runtime. */
851 do_compare_rtx_and_jump (op0, const0_rtx, LT, false, mode, NULL_RTX,
852 NULL, do_error, profile_probability::very_unlikely ());
853 do_compare_rtx_and_jump (op1, op0, LEU, true, mode, NULL_RTX, NULL,
854 done_label, profile_probability::very_likely ());
855 goto do_error_label;
858 /* u1 - s2 -> sr */
859 if (code == MINUS_EXPR && uns0_p && !uns1_p && !unsr_p)
861 /* Compute the operation. On RTL level, the subtraction is always
862 unsigned. */
863 res = expand_binop (mode, sub_optab, op0, op1, NULL_RTX, false,
864 OPTAB_LIB_WIDEN);
865 rtx tem = expand_binop (mode, add_optab, op1, sgn, NULL_RTX, false,
866 OPTAB_LIB_WIDEN);
867 do_compare_rtx_and_jump (op0, tem, LTU, true, mode, NULL_RTX, NULL,
868 done_label, profile_probability::very_likely ());
869 goto do_error_label;
872 /* u1 + u2 -> sr */
873 if (code == PLUS_EXPR && uns0_p && uns1_p && !unsr_p)
875 /* Compute the operation. On RTL level, the addition is always
876 unsigned. */
877 res = expand_binop (mode, add_optab, op0, op1, NULL_RTX, false,
878 OPTAB_LIB_WIDEN);
879 do_compare_rtx_and_jump (res, const0_rtx, LT, false, mode, NULL_RTX,
880 NULL, do_error, profile_probability::very_unlikely ());
881 rtx tem = op1;
882 /* The operation is commutative, so we can pick operand to compare
883 against. For prec <= BITS_PER_WORD, I think preferring a REG operand
884 over a CONST_INT is better, because the CONST_INT might enlarge the
885 instruction or CSE would need to figure out we'd already loaded it
886 into a register before. For prec > BITS_PER_WORD, I think CONST_INT
887 might be more beneficial, as then the multi-word comparison can be
888 perhaps simplified. */
889 if (prec <= BITS_PER_WORD
890 ? (CONST_SCALAR_INT_P (op1) && REG_P (op0))
891 : CONST_SCALAR_INT_P (op0))
892 tem = op0;
893 do_compare_rtx_and_jump (res, tem, GEU, true, mode, NULL_RTX, NULL,
894 done_label, profile_probability::very_likely ());
895 goto do_error_label;
898 /* s1 +- s2 -> ur */
899 if (!uns0_p && !uns1_p && unsr_p)
901 /* Compute the operation. On RTL level, the addition is always
902 unsigned. */
903 res = expand_binop (mode, code == PLUS_EXPR ? add_optab : sub_optab,
904 op0, op1, NULL_RTX, false, OPTAB_LIB_WIDEN);
905 int pos_neg = get_range_pos_neg (arg1);
906 if (code == PLUS_EXPR)
908 int pos_neg0 = get_range_pos_neg (arg0);
909 if (pos_neg0 != 3 && pos_neg == 3)
911 std::swap (op0, op1);
912 pos_neg = pos_neg0;
915 rtx tem;
916 if (pos_neg != 3)
918 tem = expand_binop (mode, ((pos_neg == 1) ^ (code == MINUS_EXPR))
919 ? and_optab : ior_optab,
920 op0, res, NULL_RTX, false, OPTAB_LIB_WIDEN);
921 do_compare_rtx_and_jump (tem, const0_rtx, GE, false, mode, NULL,
922 NULL, done_label, profile_probability::very_likely ());
924 else
926 rtx_code_label *do_ior_label = gen_label_rtx ();
927 do_compare_rtx_and_jump (op1, const0_rtx,
928 code == MINUS_EXPR ? GE : LT, false, mode,
929 NULL_RTX, NULL, do_ior_label,
930 profile_probability::even ());
931 tem = expand_binop (mode, and_optab, op0, res, NULL_RTX, false,
932 OPTAB_LIB_WIDEN);
933 do_compare_rtx_and_jump (tem, const0_rtx, GE, false, mode, NULL_RTX,
934 NULL, done_label, profile_probability::very_likely ());
935 emit_jump (do_error);
936 emit_label (do_ior_label);
937 tem = expand_binop (mode, ior_optab, op0, res, NULL_RTX, false,
938 OPTAB_LIB_WIDEN);
939 do_compare_rtx_and_jump (tem, const0_rtx, GE, false, mode, NULL_RTX,
940 NULL, done_label, profile_probability::very_likely ());
942 goto do_error_label;
945 /* u1 - u2 -> sr */
946 if (code == MINUS_EXPR && uns0_p && uns1_p && !unsr_p)
948 /* Compute the operation. On RTL level, the subtraction is always
949 unsigned. */
950 res = expand_binop (mode, sub_optab, op0, op1, NULL_RTX, false,
951 OPTAB_LIB_WIDEN);
952 rtx_code_label *op0_geu_op1 = gen_label_rtx ();
953 do_compare_rtx_and_jump (op0, op1, GEU, true, mode, NULL_RTX, NULL,
954 op0_geu_op1, profile_probability::even ());
955 do_compare_rtx_and_jump (res, const0_rtx, LT, false, mode, NULL_RTX,
956 NULL, done_label, profile_probability::very_likely ());
957 emit_jump (do_error);
958 emit_label (op0_geu_op1);
959 do_compare_rtx_and_jump (res, const0_rtx, GE, false, mode, NULL_RTX,
960 NULL, done_label, profile_probability::very_likely ());
961 goto do_error_label;
964 gcc_assert (!uns0_p && !uns1_p && !unsr_p);
966 /* s1 +- s2 -> sr */
967 do_signed:
969 insn_code icode = optab_handler (code == PLUS_EXPR ? addv4_optab
970 : subv4_optab, mode);
971 if (icode != CODE_FOR_nothing)
973 struct expand_operand ops[4];
974 rtx_insn *last = get_last_insn ();
976 res = gen_reg_rtx (mode);
977 create_output_operand (&ops[0], res, mode);
978 create_input_operand (&ops[1], op0, mode);
979 create_input_operand (&ops[2], op1, mode);
980 create_fixed_operand (&ops[3], do_error);
981 if (maybe_expand_insn (icode, 4, ops))
983 last = get_last_insn ();
984 if (profile_status_for_fn (cfun) != PROFILE_ABSENT
985 && JUMP_P (last)
986 && any_condjump_p (last)
987 && !find_reg_note (last, REG_BR_PROB, 0))
988 add_reg_br_prob_note (last,
989 profile_probability::very_unlikely ());
990 emit_jump (done_label);
991 goto do_error_label;
994 delete_insns_since (last);
997 /* Compute the operation. On RTL level, the addition is always
998 unsigned. */
999 res = expand_binop (mode, code == PLUS_EXPR ? add_optab : sub_optab,
1000 op0, op1, NULL_RTX, false, OPTAB_LIB_WIDEN);
1002 /* If we can prove that one of the arguments (for MINUS_EXPR only
1003 the second operand, as subtraction is not commutative) is always
1004 non-negative or always negative, we can do just one comparison
1005 and conditional jump. */
1006 int pos_neg = get_range_pos_neg (arg1);
1007 if (code == PLUS_EXPR)
1009 int pos_neg0 = get_range_pos_neg (arg0);
1010 if (pos_neg0 != 3 && pos_neg == 3)
1012 std::swap (op0, op1);
1013 pos_neg = pos_neg0;
1017 /* Addition overflows if and only if the two operands have the same sign,
1018 and the result has the opposite sign. Subtraction overflows if and
1019 only if the two operands have opposite sign, and the subtrahend has
1020 the same sign as the result. Here 0 is counted as positive. */
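/* Worked check of the sign rule above with assumed 8-bit values
   op0 = op1 = 100: res wraps to -56, so res ^ op1 has the sign bit set
   while op0 ^ op1 does not, (res ^ op1) & ~(op0 ^ op1) is negative, the
   branch to done_label below is not taken and the overflow path runs.  */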
1021 if (pos_neg == 3)
1023 /* Compute op0 ^ op1 (operands have opposite sign). */
1024 rtx op_xor = expand_binop (mode, xor_optab, op0, op1, NULL_RTX, false,
1025 OPTAB_LIB_WIDEN);
1027 /* Compute res ^ op1 (result and 2nd operand have opposite sign). */
1028 rtx res_xor = expand_binop (mode, xor_optab, res, op1, NULL_RTX, false,
1029 OPTAB_LIB_WIDEN);
1031 rtx tem;
1032 if (code == PLUS_EXPR)
1034 /* Compute (res ^ op1) & ~(op0 ^ op1). */
1035 tem = expand_unop (mode, one_cmpl_optab, op_xor, NULL_RTX, false);
1036 tem = expand_binop (mode, and_optab, res_xor, tem, NULL_RTX, false,
1037 OPTAB_LIB_WIDEN);
1039 else
1041 /* Compute (op0 ^ op1) & ~(res ^ op1). */
1042 tem = expand_unop (mode, one_cmpl_optab, res_xor, NULL_RTX, false);
1043 tem = expand_binop (mode, and_optab, op_xor, tem, NULL_RTX, false,
1044 OPTAB_LIB_WIDEN);
1047 /* No overflow if the result has bit sign cleared. */
1048 do_compare_rtx_and_jump (tem, const0_rtx, GE, false, mode, NULL_RTX,
1049 NULL, done_label, profile_probability::very_likely ());
1052 /* Compare the result of the operation with the first operand.
1053 No overflow for addition if second operand is positive and result
1054 is larger or second operand is negative and result is smaller.
1055 Likewise for subtraction with sign of second operand flipped. */
1056 else
1057 do_compare_rtx_and_jump (res, op0,
1058 (pos_neg == 1) ^ (code == MINUS_EXPR) ? GE : LE,
1059 false, mode, NULL_RTX, NULL, done_label,
1060 profile_probability::very_likely ());
1063 do_error_label:
1064 emit_label (do_error);
1065 if (is_ubsan)
1067 /* Expand the ubsan builtin call. */
1068 push_temp_slots ();
1069 fn = ubsan_build_overflow_builtin (code, loc, TREE_TYPE (arg0),
1070 arg0, arg1, datap);
1071 expand_normal (fn);
1072 pop_temp_slots ();
1073 do_pending_stack_adjust ();
1075 else if (lhs)
1076 expand_arith_set_overflow (lhs, target);
1078 /* We're done. */
1079 emit_label (done_label);
1081 if (lhs)
1083 if (is_ubsan)
1084 expand_ubsan_result_store (target, res);
1085 else
1087 if (do_xor)
1088 res = expand_binop (mode, add_optab, res, sgn, NULL_RTX, false,
1089 OPTAB_LIB_WIDEN);
1091 expand_arith_overflow_result_store (lhs, target, mode, res);
1096 /* Add negate overflow checking to the statement STMT. */
1098 static void
1099 expand_neg_overflow (location_t loc, tree lhs, tree arg1, bool is_ubsan,
1100 tree *datap)
1102 rtx res, op1;
1103 tree fn;
1104 rtx_code_label *done_label, *do_error;
1105 rtx target = NULL_RTX;
1107 done_label = gen_label_rtx ();
1108 do_error = gen_label_rtx ();
1110 do_pending_stack_adjust ();
1111 op1 = expand_normal (arg1);
1113 scalar_int_mode mode = SCALAR_INT_TYPE_MODE (TREE_TYPE (arg1));
1114 if (lhs)
1116 target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
1117 if (!is_ubsan)
1118 write_complex_part (target, const0_rtx, true);
1121 enum insn_code icode = optab_handler (negv3_optab, mode);
1122 if (icode != CODE_FOR_nothing)
1124 struct expand_operand ops[3];
1125 rtx_insn *last = get_last_insn ();
1127 res = gen_reg_rtx (mode);
1128 create_output_operand (&ops[0], res, mode);
1129 create_input_operand (&ops[1], op1, mode);
1130 create_fixed_operand (&ops[2], do_error);
1131 if (maybe_expand_insn (icode, 3, ops))
1133 last = get_last_insn ();
1134 if (profile_status_for_fn (cfun) != PROFILE_ABSENT
1135 && JUMP_P (last)
1136 && any_condjump_p (last)
1137 && !find_reg_note (last, REG_BR_PROB, 0))
1138 add_reg_br_prob_note (last,
1139 profile_probability::very_unlikely ());
1140 emit_jump (done_label);
1142 else
1144 delete_insns_since (last);
1145 icode = CODE_FOR_nothing;
1149 if (icode == CODE_FOR_nothing)
1151 /* Compute the operation. On RTL level, the negation is always
1152 unsigned. */
1153 res = expand_unop (mode, neg_optab, op1, NULL_RTX, false);
1155 /* Compare the operand with the most negative value. */
1156 rtx minv = expand_normal (TYPE_MIN_VALUE (TREE_TYPE (arg1)));
1157 do_compare_rtx_and_jump (op1, minv, NE, true, mode, NULL_RTX, NULL,
1158 done_label, profile_probability::very_likely ());
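/* For an assumed 8-bit signed operand only op1 == -128 overflows here:
   -(-128) is not representable, so the comparison against TYPE_MIN_VALUE
   falls through to the error path for that single value and jumps to
   done_label for every other one.  */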
1161 emit_label (do_error);
1162 if (is_ubsan)
1164 /* Expand the ubsan builtin call. */
1165 push_temp_slots ();
1166 fn = ubsan_build_overflow_builtin (NEGATE_EXPR, loc, TREE_TYPE (arg1),
1167 arg1, NULL_TREE, datap);
1168 expand_normal (fn);
1169 pop_temp_slots ();
1170 do_pending_stack_adjust ();
1172 else if (lhs)
1173 expand_arith_set_overflow (lhs, target);
1175 /* We're done. */
1176 emit_label (done_label);
1178 if (lhs)
1180 if (is_ubsan)
1181 expand_ubsan_result_store (target, res);
1182 else
1183 expand_arith_overflow_result_store (lhs, target, mode, res);
1187 /* Return true if UNS WIDEN_MULT_EXPR with result mode WMODE and operand
1188 mode MODE can be expanded without using a libcall. */
1190 static bool
1191 can_widen_mult_without_libcall (scalar_int_mode wmode, scalar_int_mode mode,
1192 rtx op0, rtx op1, bool uns)
1194 if (find_widening_optab_handler (umul_widen_optab, wmode, mode)
1195 != CODE_FOR_nothing)
1196 return true;
1198 if (find_widening_optab_handler (smul_widen_optab, wmode, mode)
1199 != CODE_FOR_nothing)
1200 return true;
1202 rtx_insn *last = get_last_insn ();
1203 if (CONSTANT_P (op0))
1204 op0 = convert_modes (wmode, mode, op0, uns);
1205 else
1206 op0 = gen_raw_REG (wmode, LAST_VIRTUAL_REGISTER + 1);
1207 if (CONSTANT_P (op1))
1208 op1 = convert_modes (wmode, mode, op1, uns);
1209 else
1210 op1 = gen_raw_REG (wmode, LAST_VIRTUAL_REGISTER + 2);
1211 rtx ret = expand_mult (wmode, op0, op1, NULL_RTX, uns, true);
1212 delete_insns_since (last);
1213 return ret != NULL_RTX;
1216 /* Add mul overflow checking to the statement STMT. */
1218 static void
1219 expand_mul_overflow (location_t loc, tree lhs, tree arg0, tree arg1,
1220 bool unsr_p, bool uns0_p, bool uns1_p, bool is_ubsan,
1221 tree *datap)
1223 rtx res, op0, op1;
1224 tree fn, type;
1225 rtx_code_label *done_label, *do_error;
1226 rtx target = NULL_RTX;
1227 signop sign;
1228 enum insn_code icode;
1230 done_label = gen_label_rtx ();
1231 do_error = gen_label_rtx ();
1233 do_pending_stack_adjust ();
1234 op0 = expand_normal (arg0);
1235 op1 = expand_normal (arg1);
1237 scalar_int_mode mode = SCALAR_INT_TYPE_MODE (TREE_TYPE (arg0));
1238 bool uns = unsr_p;
1239 if (lhs)
1241 target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
1242 if (!is_ubsan)
1243 write_complex_part (target, const0_rtx, true);
1246 if (is_ubsan)
1247 gcc_assert (!unsr_p && !uns0_p && !uns1_p);
1249 /* We assume both operands and result have the same precision
1250 here (GET_MODE_BITSIZE (mode)), S stands for signed type
1251 with that precision, U for unsigned type with that precision,
1252 sgn for unsigned most significant bit in that precision.
1253 s1 is signed first operand, u1 is unsigned first operand,
1254 s2 is signed second operand, u2 is unsigned second operand,
1255 sr is signed result, ur is unsigned result and the following
1256 rules say how to compute result (which is always result of
1257 the operands as if both were unsigned, cast to the right
1258 signedness) and how to compute whether operation overflowed.
1259 main_ovf (false) stands for jump on signed multiplication
1260 overflow or the main algorithm with uns == false.
1261 main_ovf (true) stands for jump on unsigned multiplication
1262 overflow or the main algorithm with uns == true.
1264 s1 * s2 -> sr
1265 res = (S) ((U) s1 * (U) s2)
1266 ovf = main_ovf (false)
1267 u1 * u2 -> ur
1268 res = u1 * u2
1269 ovf = main_ovf (true)
1270 s1 * u2 -> ur
1271 res = (U) s1 * u2
1272 ovf = (s1 < 0 && u2) || main_ovf (true)
1273 u1 * u2 -> sr
1274 res = (S) (u1 * u2)
1275 ovf = res < 0 || main_ovf (true)
1276 s1 * u2 -> sr
1277 res = (S) ((U) s1 * u2)
1278 ovf = (S) u2 >= 0 ? main_ovf (false)
1279 : (s1 != 0 && (s1 != -1 || u2 != (U) res))
1280 s1 * s2 -> ur
1281 t1 = (s1 & s2) < 0 ? (-(U) s1) : ((U) s1)
1282 t2 = (s1 & s2) < 0 ? (-(U) s2) : ((U) s2)
1283 res = t1 * t2
1284 ovf = (s1 ^ s2) < 0 ? (s1 && s2) : main_ovf (true) */
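/* A worked instance of the s1 * u2 -> ur rule, assuming 8-bit operands:
   s1 = -2, u2 = 3 overflows because s1 < 0 and u2 != 0 (the true product -6
   has no unsigned representation), whereas s1 = 5, u2 = 40 gives res = 200,
   which the unsigned main_ovf check accepts since it fits in 8 bits.  */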
1286 if (uns0_p && !uns1_p)
1288 /* Multiplication is commutative, if operand signedness differs,
1289 canonicalize to the first operand being signed and second
1290 unsigned to simplify following code. */
1291 std::swap (op0, op1);
1292 std::swap (arg0, arg1);
1293 uns0_p = false;
1294 uns1_p = true;
1297 int pos_neg0 = get_range_pos_neg (arg0);
1298 int pos_neg1 = get_range_pos_neg (arg1);
1300 /* s1 * u2 -> ur */
1301 if (!uns0_p && uns1_p && unsr_p)
1303 switch (pos_neg0)
1305 case 1:
1306 /* If s1 is non-negative, just perform normal u1 * u2 -> ur. */
1307 goto do_main;
1308 case 2:
1309 /* If s1 is negative, avoid the main code, just multiply and
1310 signal overflow if op1 is not 0. */
1311 struct separate_ops ops;
1312 ops.code = MULT_EXPR;
1313 ops.type = TREE_TYPE (arg1);
1314 ops.op0 = make_tree (ops.type, op0);
1315 ops.op1 = make_tree (ops.type, op1);
1316 ops.op2 = NULL_TREE;
1317 ops.location = loc;
1318 res = expand_expr_real_2 (&ops, NULL_RTX, mode, EXPAND_NORMAL);
1319 do_compare_rtx_and_jump (op1, const0_rtx, EQ, true, mode, NULL_RTX,
1320 NULL, done_label, profile_probability::very_likely ());
1321 goto do_error_label;
1322 case 3:
1323 rtx_code_label *do_main_label;
1324 do_main_label = gen_label_rtx ();
1325 do_compare_rtx_and_jump (op0, const0_rtx, GE, false, mode, NULL_RTX,
1326 NULL, do_main_label, profile_probability::very_likely ());
1327 do_compare_rtx_and_jump (op1, const0_rtx, EQ, true, mode, NULL_RTX,
1328 NULL, do_main_label, profile_probability::very_likely ());
1329 expand_arith_set_overflow (lhs, target);
1330 emit_label (do_main_label);
1331 goto do_main;
1332 default:
1333 gcc_unreachable ();
1337 /* u1 * u2 -> sr */
1338 if (uns0_p && uns1_p && !unsr_p)
1340 uns = true;
1341 /* Rest of handling of this case after res is computed. */
1342 goto do_main;
1345 /* s1 * u2 -> sr */
1346 if (!uns0_p && uns1_p && !unsr_p)
1348 switch (pos_neg1)
1350 case 1:
1351 goto do_main;
1352 case 2:
1353 /* If (S) u2 is negative (i.e. u2 is larger than the maximum of S),
1354 avoid the main code, just multiply and signal overflow
1355 unless 0 * u2 or -1 * ((U) Smin). */
1356 struct separate_ops ops;
1357 ops.code = MULT_EXPR;
1358 ops.type = TREE_TYPE (arg1);
1359 ops.op0 = make_tree (ops.type, op0);
1360 ops.op1 = make_tree (ops.type, op1);
1361 ops.op2 = NULL_TREE;
1362 ops.location = loc;
1363 res = expand_expr_real_2 (&ops, NULL_RTX, mode, EXPAND_NORMAL);
1364 do_compare_rtx_and_jump (op0, const0_rtx, EQ, true, mode, NULL_RTX,
1365 NULL, done_label, profile_probability::very_likely ());
1366 do_compare_rtx_and_jump (op0, constm1_rtx, NE, true, mode, NULL_RTX,
1367 NULL, do_error, profile_probability::very_unlikely ());
1368 int prec;
1369 prec = GET_MODE_PRECISION (mode);
1370 rtx sgn;
1371 sgn = immed_wide_int_const (wi::min_value (prec, SIGNED), mode);
1372 do_compare_rtx_and_jump (op1, sgn, EQ, true, mode, NULL_RTX,
1373 NULL, done_label, profile_probability::very_likely ());
1374 goto do_error_label;
1375 case 3:
1376 /* Rest of handling of this case after res is computed. */
1377 goto do_main;
1378 default:
1379 gcc_unreachable ();
1383 /* s1 * s2 -> ur */
1384 if (!uns0_p && !uns1_p && unsr_p)
1386 rtx tem, tem2;
1387 switch (pos_neg0 | pos_neg1)
1389 case 1: /* Both operands known to be non-negative. */
1390 goto do_main;
1391 case 2: /* Both operands known to be negative. */
1392 op0 = expand_unop (mode, neg_optab, op0, NULL_RTX, false);
1393 op1 = expand_unop (mode, neg_optab, op1, NULL_RTX, false);
1394 /* Avoid looking at arg0/arg1 ranges, as we've changed
1395 the arguments. */
1396 arg0 = error_mark_node;
1397 arg1 = error_mark_node;
1398 goto do_main;
1399 case 3:
1400 if ((pos_neg0 ^ pos_neg1) == 3)
1402 /* If one operand is known to be negative and the other
1403 non-negative, this overflows always, unless the non-negative
1404 one is 0. Just do normal multiply and set overflow
1405 unless one of the operands is 0. */
1406 struct separate_ops ops;
1407 ops.code = MULT_EXPR;
1408 ops.type
1409 = build_nonstandard_integer_type (GET_MODE_PRECISION (mode),
1411 ops.op0 = make_tree (ops.type, op0);
1412 ops.op1 = make_tree (ops.type, op1);
1413 ops.op2 = NULL_TREE;
1414 ops.location = loc;
1415 res = expand_expr_real_2 (&ops, NULL_RTX, mode, EXPAND_NORMAL);
1416 tem = expand_binop (mode, and_optab, op0, op1, NULL_RTX, false,
1417 OPTAB_LIB_WIDEN);
1418 do_compare_rtx_and_jump (tem, const0_rtx, EQ, true, mode,
1419 NULL_RTX, NULL, done_label,
1420 profile_probability::very_likely ());
1421 goto do_error_label;
1423 /* The general case, do all the needed comparisons at runtime. */
1424 rtx_code_label *do_main_label, *after_negate_label;
1425 rtx rop0, rop1;
1426 rop0 = gen_reg_rtx (mode);
1427 rop1 = gen_reg_rtx (mode);
1428 emit_move_insn (rop0, op0);
1429 emit_move_insn (rop1, op1);
1430 op0 = rop0;
1431 op1 = rop1;
1432 do_main_label = gen_label_rtx ();
1433 after_negate_label = gen_label_rtx ();
1434 tem = expand_binop (mode, and_optab, op0, op1, NULL_RTX, false,
1435 OPTAB_LIB_WIDEN);
1436 do_compare_rtx_and_jump (tem, const0_rtx, GE, false, mode, NULL_RTX,
1437 NULL, after_negate_label, profile_probability::very_likely ());
1438 /* Both arguments negative here, negate them and continue with
1439 normal unsigned overflow checking multiplication. */
1440 emit_move_insn (op0, expand_unop (mode, neg_optab, op0,
1441 NULL_RTX, false));
1442 emit_move_insn (op1, expand_unop (mode, neg_optab, op1,
1443 NULL_RTX, false));
1444 /* Avoid looking at arg0/arg1 ranges, as we might have changed
1445 the arguments. */
1446 arg0 = error_mark_node;
1447 arg1 = error_mark_node;
1448 emit_jump (do_main_label);
1449 emit_label (after_negate_label);
1450 tem2 = expand_binop (mode, xor_optab, op0, op1, NULL_RTX, false,
1451 OPTAB_LIB_WIDEN);
1452 do_compare_rtx_and_jump (tem2, const0_rtx, GE, false, mode, NULL_RTX,
1453 NULL, do_main_label, profile_probability::very_likely ());
1454 /* One argument is negative here, the other positive. This
1455 overflows always, unless one of the arguments is 0. But
1456 if e.g. s2 is 0, (U) s1 * 0 doesn't overflow, whatever s1
1457 is, thus we can keep do_main code oring in overflow as is. */
1458 do_compare_rtx_and_jump (tem, const0_rtx, EQ, true, mode, NULL_RTX,
1459 NULL, do_main_label, profile_probability::very_likely ());
1460 expand_arith_set_overflow (lhs, target);
1461 emit_label (do_main_label);
1462 goto do_main;
1463 default:
1464 gcc_unreachable ();
1468 do_main:
1469 type = build_nonstandard_integer_type (GET_MODE_PRECISION (mode), uns);
1470 sign = uns ? UNSIGNED : SIGNED;
1471 icode = optab_handler (uns ? umulv4_optab : mulv4_optab, mode);
1472 if (uns
1473 && (integer_pow2p (arg0) || integer_pow2p (arg1))
1474 && (optimize_insn_for_speed_p () || icode == CODE_FOR_nothing))
1476 /* Optimize unsigned multiplication by power of 2 constant
1477 using 2 shifts, one for result, one to extract the shifted
1478 out bits to see if they are all zero.
1479 Don't do this if optimizing for size and we have umulv4_optab,
1480 in that case assume multiplication will be shorter.
1481 This is heuristics based on the single target that provides
1482 umulv4 right now (i?86/x86_64), if further targets add it, this
1483 might need to be revisited.
1484 Cases where both operands are constant should be folded already
1485 during GIMPLE, and cases where one operand is constant but not
1486 power of 2 are questionable, either the WIDEN_MULT_EXPR case
1487 below can be done without multiplication, just by shifts and adds,
1488 or we'd need to divide the result (and hope it actually doesn't
1489 really divide nor multiply) and compare the result of the division
1490 with the original operand. */
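/* A worked instance of the two-shift check below, assuming 8-bit unsigned
   values: multiplying x = 0x35 by 8 (cnt = 3) gives res = x << 3 = 0xa8 and
   upper = x >> 5 = 1; a non-zero upper means bits were shifted out
   (0x35 * 8 = 424 does not fit), so the code branches to do_error.  For
   x = 0x15, upper is 0 and the product 168 fits.  */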
1491 rtx opn0 = op0;
1492 rtx opn1 = op1;
1493 tree argn0 = arg0;
1494 tree argn1 = arg1;
1495 if (integer_pow2p (arg0))
1497 std::swap (opn0, opn1);
1498 std::swap (argn0, argn1);
1500 int cnt = tree_log2 (argn1);
1501 if (cnt >= 0 && cnt < GET_MODE_PRECISION (mode))
1503 rtx upper = const0_rtx;
1504 res = expand_shift (LSHIFT_EXPR, mode, opn0, cnt, NULL_RTX, uns);
1505 if (cnt != 0)
1506 upper = expand_shift (RSHIFT_EXPR, mode, opn0,
1507 GET_MODE_PRECISION (mode) - cnt,
1508 NULL_RTX, uns);
1509 do_compare_rtx_and_jump (upper, const0_rtx, EQ, true, mode,
1510 NULL_RTX, NULL, done_label,
1511 profile_probability::very_likely ());
1512 goto do_error_label;
1515 if (icode != CODE_FOR_nothing)
1517 struct expand_operand ops[4];
1518 rtx_insn *last = get_last_insn ();
1520 res = gen_reg_rtx (mode);
1521 create_output_operand (&ops[0], res, mode);
1522 create_input_operand (&ops[1], op0, mode);
1523 create_input_operand (&ops[2], op1, mode);
1524 create_fixed_operand (&ops[3], do_error);
1525 if (maybe_expand_insn (icode, 4, ops))
1527 last = get_last_insn ();
1528 if (profile_status_for_fn (cfun) != PROFILE_ABSENT
1529 && JUMP_P (last)
1530 && any_condjump_p (last)
1531 && !find_reg_note (last, REG_BR_PROB, 0))
1532 add_reg_br_prob_note (last,
1533 profile_probability::very_unlikely ());
1534 emit_jump (done_label);
1536 else
1538 delete_insns_since (last);
1539 icode = CODE_FOR_nothing;
1543 if (icode == CODE_FOR_nothing)
1545 struct separate_ops ops;
1546 int prec = GET_MODE_PRECISION (mode);
1547 scalar_int_mode hmode, wmode;
1548 ops.op0 = make_tree (type, op0);
1549 ops.op1 = make_tree (type, op1);
1550 ops.op2 = NULL_TREE;
1551 ops.location = loc;
1553 /* Optimize unsigned overflow check where we don't use the
1554 multiplication result, just whether overflow happened.
1555 If we can do MULT_HIGHPART_EXPR, that followed by
1556 comparison of the result against zero is cheapest.
1557 We'll still compute res, but it should be DCEd later. */
1558 use_operand_p use;
1559 gimple *use_stmt;
1560 if (!is_ubsan
1561 && lhs
1562 && uns
1563 && !(uns0_p && uns1_p && !unsr_p)
1564 && can_mult_highpart_p (mode, uns) == 1
1565 && single_imm_use (lhs, &use, &use_stmt)
1566 && is_gimple_assign (use_stmt)
1567 && gimple_assign_rhs_code (use_stmt) == IMAGPART_EXPR)
1568 goto highpart;
1570 if (GET_MODE_2XWIDER_MODE (mode).exists (&wmode)
1571 && targetm.scalar_mode_supported_p (wmode)
1572 && can_widen_mult_without_libcall (wmode, mode, op0, op1, uns))
1574 twoxwider:
1575 ops.code = WIDEN_MULT_EXPR;
1576 ops.type
1577 = build_nonstandard_integer_type (GET_MODE_PRECISION (wmode), uns);
1579 res = expand_expr_real_2 (&ops, NULL_RTX, wmode, EXPAND_NORMAL);
1580 rtx hipart = expand_shift (RSHIFT_EXPR, wmode, res, prec,
1581 NULL_RTX, uns);
1582 hipart = convert_modes (mode, wmode, hipart, uns);
1583 res = convert_modes (mode, wmode, res, uns);
1584 if (uns)
1585 /* For the unsigned multiplication, there was overflow if
1586 HIPART is non-zero. */
1587 do_compare_rtx_and_jump (hipart, const0_rtx, EQ, true, mode,
1588 NULL_RTX, NULL, done_label,
1589 profile_probability::very_likely ());
1590 else
1592 rtx signbit = expand_shift (RSHIFT_EXPR, mode, res, prec - 1,
1593 NULL_RTX, 0);
1594 /* RES is low half of the double width result, HIPART
1595 the high half. There was overflow if
1596 HIPART is different from RES < 0 ? -1 : 0. */
1597 do_compare_rtx_and_jump (signbit, hipart, EQ, true, mode,
1598 NULL_RTX, NULL, done_label,
1599 profile_probability::very_likely ());
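/* Worked signed example with assumed 8-bit operands widened to 16 bits:
   100 * 100 = 0x2710, so HIPART is 0x27 while RES = 0x10 is non-negative
   and would require HIPART == 0, hence overflow.  For -3 * 5 = -15, HIPART
   is all ones and RES < 0, the two match and no overflow is reported.  */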
1602 else if (can_mult_highpart_p (mode, uns) == 1)
1604 highpart:
1605 ops.code = MULT_HIGHPART_EXPR;
1606 ops.type = type;
1608 rtx hipart = expand_expr_real_2 (&ops, NULL_RTX, mode,
1609 EXPAND_NORMAL);
1610 ops.code = MULT_EXPR;
1611 res = expand_expr_real_2 (&ops, NULL_RTX, mode, EXPAND_NORMAL);
1612 if (uns)
1613 /* For the unsigned multiplication, there was overflow if
1614 HIPART is non-zero. */
1615 do_compare_rtx_and_jump (hipart, const0_rtx, EQ, true, mode,
1616 NULL_RTX, NULL, done_label,
1617 profile_probability::very_likely ());
1618 else
1620 rtx signbit = expand_shift (RSHIFT_EXPR, mode, res, prec - 1,
1621 NULL_RTX, 0);
1622 /* RES is low half of the double width result, HIPART
1623 the high half. There was overflow if
1624 HIPART is different from RES < 0 ? -1 : 0. */
1625 do_compare_rtx_and_jump (signbit, hipart, EQ, true, mode,
1626 NULL_RTX, NULL, done_label,
1627 profile_probability::very_likely ());
1631 else if (int_mode_for_size (prec / 2, 1).exists (&hmode)
1632 && 2 * GET_MODE_PRECISION (hmode) == prec)
1634 rtx_code_label *large_op0 = gen_label_rtx ();
1635 rtx_code_label *small_op0_large_op1 = gen_label_rtx ();
1636 rtx_code_label *one_small_one_large = gen_label_rtx ();
1637 rtx_code_label *both_ops_large = gen_label_rtx ();
1638 rtx_code_label *after_hipart_neg = uns ? NULL : gen_label_rtx ();
1639 rtx_code_label *after_lopart_neg = uns ? NULL : gen_label_rtx ();
1640 rtx_code_label *do_overflow = gen_label_rtx ();
1641 rtx_code_label *hipart_different = uns ? NULL : gen_label_rtx ();
1643 unsigned int hprec = GET_MODE_PRECISION (hmode);
1644 rtx hipart0 = expand_shift (RSHIFT_EXPR, mode, op0, hprec,
1645 NULL_RTX, uns);
1646 hipart0 = convert_modes (hmode, mode, hipart0, uns);
1647 rtx lopart0 = convert_modes (hmode, mode, op0, uns);
1648 rtx signbit0 = const0_rtx;
1649 if (!uns)
1650 signbit0 = expand_shift (RSHIFT_EXPR, hmode, lopart0, hprec - 1,
1651 NULL_RTX, 0);
1652 rtx hipart1 = expand_shift (RSHIFT_EXPR, mode, op1, hprec,
1653 NULL_RTX, uns);
1654 hipart1 = convert_modes (hmode, mode, hipart1, uns);
1655 rtx lopart1 = convert_modes (hmode, mode, op1, uns);
1656 rtx signbit1 = const0_rtx;
1657 if (!uns)
1658 signbit1 = expand_shift (RSHIFT_EXPR, hmode, lopart1, hprec - 1,
1659 NULL_RTX, 0);
1661 res = gen_reg_rtx (mode);
1663 /* True if op0 resp. op1 are known to be in the range of
1664 halfstype. */
1665 bool op0_small_p = false;
1666 bool op1_small_p = false;
1667 /* True if op0 resp. op1 are known to have all zeros or all ones
1668 in the upper half of bits, but are not known to be
1669 op{0,1}_small_p. */
1670 bool op0_medium_p = false;
1671 bool op1_medium_p = false;
1672 /* -1 if op{0,1} is known to be negative, 0 if it is known to be
1673 nonnegative, 1 if unknown. */
1674 int op0_sign = 1;
1675 int op1_sign = 1;
1677 if (pos_neg0 == 1)
1678 op0_sign = 0;
1679 else if (pos_neg0 == 2)
1680 op0_sign = -1;
1681 if (pos_neg1 == 1)
1682 op1_sign = 0;
1683 else if (pos_neg1 == 2)
1684 op1_sign = -1;
1686 unsigned int mprec0 = prec;
1687 if (arg0 != error_mark_node)
1688 mprec0 = get_min_precision (arg0, sign);
1689 if (mprec0 <= hprec)
1690 op0_small_p = true;
1691 else if (!uns && mprec0 <= hprec + 1)
1692 op0_medium_p = true;
1693 unsigned int mprec1 = prec;
1694 if (arg1 != error_mark_node)
1695 mprec1 = get_min_precision (arg1, sign);
1696 if (mprec1 <= hprec)
1697 op1_small_p = true;
1698 else if (!uns && mprec1 <= hprec + 1)
1699 op1_medium_p = true;
1701 int smaller_sign = 1;
1702 int larger_sign = 1;
1703 if (op0_small_p)
1705 smaller_sign = op0_sign;
1706 larger_sign = op1_sign;
1708 else if (op1_small_p)
1710 smaller_sign = op1_sign;
1711 larger_sign = op0_sign;
1713 else if (op0_sign == op1_sign)
1715 smaller_sign = op0_sign;
1716 larger_sign = op0_sign;
1719 if (!op0_small_p)
1720 do_compare_rtx_and_jump (signbit0, hipart0, NE, true, hmode,
1721 NULL_RTX, NULL, large_op0,
1722 profile_probability::unlikely ());
1724 if (!op1_small_p)
1725 do_compare_rtx_and_jump (signbit1, hipart1, NE, true, hmode,
1726 NULL_RTX, NULL, small_op0_large_op1,
1727 profile_probability::unlikely ());
1729 /* If both op0 and op1 are sign (!uns) or zero (uns) extended from
1730 hmode to mode, the multiplication will never overflow. We can
1731 do just one hmode x hmode => mode widening multiplication. */
1732 rtx lopart0s = lopart0, lopart1s = lopart1;
1733 if (GET_CODE (lopart0) == SUBREG)
1735 lopart0s = shallow_copy_rtx (lopart0);
1736 SUBREG_PROMOTED_VAR_P (lopart0s) = 1;
1737 SUBREG_PROMOTED_SET (lopart0s, uns ? SRP_UNSIGNED : SRP_SIGNED);
1739 if (GET_CODE (lopart1) == SUBREG)
1741 lopart1s = shallow_copy_rtx (lopart1);
1742 SUBREG_PROMOTED_VAR_P (lopart1s) = 1;
1743 SUBREG_PROMOTED_SET (lopart1s, uns ? SRP_UNSIGNED : SRP_SIGNED);
1745 tree halfstype = build_nonstandard_integer_type (hprec, uns);
1746 ops.op0 = make_tree (halfstype, lopart0s);
1747 ops.op1 = make_tree (halfstype, lopart1s);
1748 ops.code = WIDEN_MULT_EXPR;
1749 ops.type = type;
1750 rtx thisres
1751 = expand_expr_real_2 (&ops, NULL_RTX, mode, EXPAND_NORMAL);
1752 emit_move_insn (res, thisres);
1753 emit_jump (done_label);
1755 emit_label (small_op0_large_op1);
1757 /* If op0 is sign (!uns) or zero (uns) extended from hmode to mode,
1758 but op1 is not, just swap the arguments and handle it as op1
1759 sign/zero extended, op0 not. */
1760 rtx larger = gen_reg_rtx (mode);
1761 rtx hipart = gen_reg_rtx (hmode);
1762 rtx lopart = gen_reg_rtx (hmode);
1763 emit_move_insn (larger, op1);
1764 emit_move_insn (hipart, hipart1);
1765 emit_move_insn (lopart, lopart0);
1766 emit_jump (one_small_one_large);
1768 emit_label (large_op0);
1770 if (!op1_small_p)
1771 do_compare_rtx_and_jump (signbit1, hipart1, NE, true, hmode,
1772 NULL_RTX, NULL, both_ops_large,
1773 profile_probability::unlikely ());
1775 /* If op1 is sign (!uns) or zero (uns) extended from hmode to mode,
1776 but op0 is not, prepare larger, hipart and lopart pseudos and
1777 handle it together with small_op0_large_op1. */
1778 emit_move_insn (larger, op0);
1779 emit_move_insn (hipart, hipart0);
1780 emit_move_insn (lopart, lopart1);
1782 emit_label (one_small_one_large);
1784 /* lopart is the low part of the operand that is sign (!uns) or
1785 zero (uns) extended to mode, larger is the other operand,
1786 hipart is the high part of larger, and lopart0 and lopart1 are
1787 the low parts of both operands.
1788 We perform lopart0 * lopart1 and lopart * hipart widening
1789 multiplications. */
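/* Rough sketch of the arithmetic on this path (illustration only, glossing
   over the sign fixups emitted below): with h = bitsize / 2, the value of
   larger decomposes as hipart * 2^h plus its unsigned low half, so the
   product splits into a low-half product (lo0xlo1) and a high-half
   contribution (lopart * hipart, accumulated in loxhi); the two widening
   hmode x hmode multiplications plus the shifts and adds below reconstruct
   the full result and feed the overflow check.  */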
1790 tree halfutype = build_nonstandard_integer_type (hprec, 1);
1791 ops.op0 = make_tree (halfutype, lopart0);
1792 ops.op1 = make_tree (halfutype, lopart1);
1793 rtx lo0xlo1
1794 = expand_expr_real_2 (&ops, NULL_RTX, mode, EXPAND_NORMAL);
1796 ops.op0 = make_tree (halfutype, lopart);
1797 ops.op1 = make_tree (halfutype, hipart);
1798 rtx loxhi = gen_reg_rtx (mode);
1799 rtx tem = expand_expr_real_2 (&ops, NULL_RTX, mode, EXPAND_NORMAL);
1800 emit_move_insn (loxhi, tem);
1802 if (!uns)
1804 /* if (hipart < 0) loxhi -= lopart << (bitsize / 2); */
1805 if (larger_sign == 0)
1806 emit_jump (after_hipart_neg);
1807 else if (larger_sign != -1)
1808 do_compare_rtx_and_jump (hipart, const0_rtx, GE, false, hmode,
1809 NULL_RTX, NULL, after_hipart_neg,
1810 profile_probability::even ());
1812 tem = convert_modes (mode, hmode, lopart, 1);
1813 tem = expand_shift (LSHIFT_EXPR, mode, tem, hprec, NULL_RTX, 1);
1814 tem = expand_simple_binop (mode, MINUS, loxhi, tem, NULL_RTX,
1815 1, OPTAB_WIDEN);
1816 emit_move_insn (loxhi, tem);
1818 emit_label (after_hipart_neg);
1820 /* if (lopart < 0) loxhi -= larger; */
1821 if (smaller_sign == 0)
1822 emit_jump (after_lopart_neg);
1823 else if (smaller_sign != -1)
1824 do_compare_rtx_and_jump (lopart, const0_rtx, GE, false, hmode,
1825 NULL_RTX, NULL, after_lopart_neg,
1826 profile_probability::even ());
1828 tem = expand_simple_binop (mode, MINUS, loxhi, larger, NULL_RTX,
1829 1, OPTAB_WIDEN);
1830 emit_move_insn (loxhi, tem);
1832 emit_label (after_lopart_neg);
1835 /* loxhi += (uns) lo0xlo1 >> (bitsize / 2); */
1836 tem = expand_shift (RSHIFT_EXPR, mode, lo0xlo1, hprec, NULL_RTX, 1);
1837 tem = expand_simple_binop (mode, PLUS, loxhi, tem, NULL_RTX,
1838 1, OPTAB_WIDEN);
1839 emit_move_insn (loxhi, tem);
1841 /* if (loxhi >> (bitsize / 2)
1842 == (hmode) loxhi >> (bitsize / 2 - 1)) (if !uns)
1843 if (loxhi >> (bitsize / 2) == 0) (if uns). */
1844 rtx hipartloxhi = expand_shift (RSHIFT_EXPR, mode, loxhi, hprec,
1845 NULL_RTX, 0);
1846 hipartloxhi = convert_modes (hmode, mode, hipartloxhi, 0);
1847 rtx signbitloxhi = const0_rtx;
1848 if (!uns)
1849 signbitloxhi = expand_shift (RSHIFT_EXPR, hmode,
1850 convert_modes (hmode, mode,
1851 loxhi, 0),
1852 hprec - 1, NULL_RTX, 0);
1854 do_compare_rtx_and_jump (signbitloxhi, hipartloxhi, NE, true, hmode,
1855 NULL_RTX, NULL, do_overflow,
1856 profile_probability::very_unlikely ());
1858 /* res = (loxhi << (bitsize / 2)) | (hmode) lo0xlo1; */
1859 rtx loxhishifted = expand_shift (LSHIFT_EXPR, mode, loxhi, hprec,
1860 NULL_RTX, 1);
1861 tem = convert_modes (mode, hmode,
1862 convert_modes (hmode, mode, lo0xlo1, 1), 1);
1864 tem = expand_simple_binop (mode, IOR, loxhishifted, tem, res,
1865 1, OPTAB_WIDEN);
1866 if (tem != res)
1867 emit_move_insn (res, tem);
1868 emit_jump (done_label);
1870 emit_label (both_ops_large);
1872 /* If both operands are large (not sign (!uns) or zero (uns)
1873 extended from hmode), then perform the full multiplication
1874 which will be the result of the operation.
1875 The only cases which don't overflow are, for signed multiplication,
1876 some cases where both hipart0 and hipart1 are 0 or -1.
1877 For unsigned multiplication, when the high parts are both non-zero,
1878 this always overflows. */
1879 ops.code = MULT_EXPR;
1880 ops.op0 = make_tree (type, op0);
1881 ops.op1 = make_tree (type, op1);
1882 tem = expand_expr_real_2 (&ops, NULL_RTX, mode, EXPAND_NORMAL);
1883 emit_move_insn (res, tem);
1885 if (!uns)
1887 if (!op0_medium_p)
1889 tem = expand_simple_binop (hmode, PLUS, hipart0, const1_rtx,
1890 NULL_RTX, 1, OPTAB_WIDEN);
1891 do_compare_rtx_and_jump (tem, const1_rtx, GTU, true, hmode,
1892 NULL_RTX, NULL, do_error,
1893 profile_probability::very_unlikely ());
1896 if (!op1_medium_p)
1898 tem = expand_simple_binop (hmode, PLUS, hipart1, const1_rtx,
1899 NULL_RTX, 1, OPTAB_WIDEN);
1900 do_compare_rtx_and_jump (tem, const1_rtx, GTU, true, hmode,
1901 NULL_RTX, NULL, do_error,
1902 profile_probability::very_unlikely ());
1905 /* At this point hipart{0,1} are both in [-1, 0]. If they are
1906 the same, overflow happened if res is non-positive; if they
1907 are different, overflow happened if res is positive. */
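/* Worked example (illustration only, assuming a 32-bit mode with
   hprec == 16): op0 == op1 == -65536 gives hipart0 == hipart1 == -1;
   the true product 2^32 truncates to res == 0, which is non-positive,
   so the equal-hipart case below correctly reports overflow.  With
   op0 == 32768 and op1 == -32769 the hiparts differ (0 vs. -1) and
   res == -1073774592 is negative, so no overflow is reported, matching
   the fact that the product fits in 32 bits.  */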
1908 if (op0_sign != 1 && op1_sign != 1 && op0_sign != op1_sign)
1909 emit_jump (hipart_different);
1910 else if (op0_sign == 1 || op1_sign == 1)
1911 do_compare_rtx_and_jump (hipart0, hipart1, NE, true, hmode,
1912 NULL_RTX, NULL, hipart_different,
1913 profile_probability::even ());
1915 do_compare_rtx_and_jump (res, const0_rtx, LE, false, mode,
1916 NULL_RTX, NULL, do_error,
1917 profile_probability::very_unlikely ());
1918 emit_jump (done_label);
1920 emit_label (hipart_different);
1922 do_compare_rtx_and_jump (res, const0_rtx, GE, false, mode,
1923 NULL_RTX, NULL, do_error,
1924 profile_probability::very_unlikely ());
1925 emit_jump (done_label);
1928 emit_label (do_overflow);
1930 /* Overflow, do full multiplication and fallthru into do_error. */
1931 ops.op0 = make_tree (type, op0);
1932 ops.op1 = make_tree (type, op1);
1933 tem = expand_expr_real_2 (&ops, NULL_RTX, mode, EXPAND_NORMAL);
1934 emit_move_insn (res, tem);
1936 else if (GET_MODE_2XWIDER_MODE (mode).exists (&wmode)
1937 && targetm.scalar_mode_supported_p (wmode))
1938 /* Even emitting a libcall is better than not detecting overflow
1939 at all. */
1940 goto twoxwider;
1941 else
1943 gcc_assert (!is_ubsan);
1944 ops.code = MULT_EXPR;
1945 ops.type = type;
1946 res = expand_expr_real_2 (&ops, NULL_RTX, mode, EXPAND_NORMAL);
1947 emit_jump (done_label);
1951 do_error_label:
1952 emit_label (do_error);
1953 if (is_ubsan)
1955 /* Expand the ubsan builtin call. */
1956 push_temp_slots ();
1957 fn = ubsan_build_overflow_builtin (MULT_EXPR, loc, TREE_TYPE (arg0),
1958 arg0, arg1, datap);
1959 expand_normal (fn);
1960 pop_temp_slots ();
1961 do_pending_stack_adjust ();
1963 else if (lhs)
1964 expand_arith_set_overflow (lhs, target);
1966 /* We're done. */
1967 emit_label (done_label);
1969 /* u1 * u2 -> sr */
1970 if (uns0_p && uns1_p && !unsr_p)
1972 rtx_code_label *all_done_label = gen_label_rtx ();
1973 do_compare_rtx_and_jump (res, const0_rtx, GE, false, mode, NULL_RTX,
1974 NULL, all_done_label, profile_probability::very_likely ());
1975 expand_arith_set_overflow (lhs, target);
1976 emit_label (all_done_label);
1979 /* s1 * u2 -> sr */
1980 if (!uns0_p && uns1_p && !unsr_p && pos_neg1 == 3)
1982 rtx_code_label *all_done_label = gen_label_rtx ();
1983 rtx_code_label *set_noovf = gen_label_rtx ();
1984 do_compare_rtx_and_jump (op1, const0_rtx, GE, false, mode, NULL_RTX,
1985 NULL, all_done_label, profile_probability::very_likely ());
1986 expand_arith_set_overflow (lhs, target);
1987 do_compare_rtx_and_jump (op0, const0_rtx, EQ, true, mode, NULL_RTX,
1988 NULL, set_noovf, profile_probability::very_likely ());
1989 do_compare_rtx_and_jump (op0, constm1_rtx, NE, true, mode, NULL_RTX,
1990 NULL, all_done_label, profile_probability::very_unlikely ());
1991 do_compare_rtx_and_jump (op1, res, NE, true, mode, NULL_RTX, NULL,
1992 all_done_label, profile_probability::very_unlikely ());
1993 emit_label (set_noovf);
1994 write_complex_part (target, const0_rtx, true);
1995 emit_label (all_done_label);
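/* Worked example for the s1 * u2 -> sr corner case above (illustration
   only, assuming 32-bit operands): if op1 has its sign bit set the
   product normally overflows, except when op0 == 0, or when op0 == -1
   and op1 == 0x80000000, in which case the mathematical result -2^31
   is still representable and indeed equals res == op1 bit-for-bit.  */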
1998 if (lhs)
2000 if (is_ubsan)
2001 expand_ubsan_result_store (target, res);
2002 else
2003 expand_arith_overflow_result_store (lhs, target, mode, res);
2007 /* Expand UBSAN_CHECK_* internal function if it has vector operands. */
2009 static void
2010 expand_vector_ubsan_overflow (location_t loc, enum tree_code code, tree lhs,
2011 tree arg0, tree arg1)
2013 poly_uint64 cnt = TYPE_VECTOR_SUBPARTS (TREE_TYPE (arg0));
2014 rtx_code_label *loop_lab = NULL;
2015 rtx cntvar = NULL_RTX;
2016 tree cntv = NULL_TREE;
2017 tree eltype = TREE_TYPE (TREE_TYPE (arg0));
2018 tree sz = TYPE_SIZE (eltype);
2019 tree data = NULL_TREE;
2020 tree resv = NULL_TREE;
2021 rtx lhsr = NULL_RTX;
2022 rtx resvr = NULL_RTX;
2023 unsigned HOST_WIDE_INT const_cnt = 0;
2024 bool use_loop_p = (!cnt.is_constant (&const_cnt) || const_cnt > 4);
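/* In other words (restating the condition above): the elements are
   expanded inline for constant-length vectors of at most four elements,
   and a runtime loop over the elements is emitted for longer or
   variable-length vectors.  */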
2026 if (lhs)
2028 optab op;
2029 lhsr = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
2030 if (!VECTOR_MODE_P (GET_MODE (lhsr))
2031 || (op = optab_for_tree_code (code, TREE_TYPE (arg0),
2032 optab_default)) == unknown_optab
2033 || (optab_handler (op, TYPE_MODE (TREE_TYPE (arg0)))
2034 == CODE_FOR_nothing))
2036 if (MEM_P (lhsr))
2037 resv = make_tree (TREE_TYPE (lhs), lhsr);
2038 else
2040 resvr = assign_temp (TREE_TYPE (lhs), 1, 1);
2041 resv = make_tree (TREE_TYPE (lhs), resvr);
2045 if (use_loop_p)
2047 do_pending_stack_adjust ();
2048 loop_lab = gen_label_rtx ();
2049 cntvar = gen_reg_rtx (TYPE_MODE (sizetype));
2050 cntv = make_tree (sizetype, cntvar);
2051 emit_move_insn (cntvar, const0_rtx);
2052 emit_label (loop_lab);
2054 if (TREE_CODE (arg0) != VECTOR_CST)
2056 rtx arg0r = expand_normal (arg0);
2057 arg0 = make_tree (TREE_TYPE (arg0), arg0r);
2059 if (TREE_CODE (arg1) != VECTOR_CST)
2061 rtx arg1r = expand_normal (arg1);
2062 arg1 = make_tree (TREE_TYPE (arg1), arg1r);
2064 for (unsigned int i = 0; i < (use_loop_p ? 1 : const_cnt); i++)
2066 tree op0, op1, res = NULL_TREE;
2067 if (use_loop_p)
2069 tree atype = build_array_type_nelts (eltype, cnt);
2070 op0 = uniform_vector_p (arg0);
2071 if (op0 == NULL_TREE)
2073 op0 = fold_build1_loc (loc, VIEW_CONVERT_EXPR, atype, arg0);
2074 op0 = build4_loc (loc, ARRAY_REF, eltype, op0, cntv,
2075 NULL_TREE, NULL_TREE);
2077 op1 = uniform_vector_p (arg1);
2078 if (op1 == NULL_TREE)
2080 op1 = fold_build1_loc (loc, VIEW_CONVERT_EXPR, atype, arg1);
2081 op1 = build4_loc (loc, ARRAY_REF, eltype, op1, cntv,
2082 NULL_TREE, NULL_TREE);
2084 if (resv)
2086 res = fold_build1_loc (loc, VIEW_CONVERT_EXPR, atype, resv);
2087 res = build4_loc (loc, ARRAY_REF, eltype, res, cntv,
2088 NULL_TREE, NULL_TREE);
2091 else
2093 tree bitpos = bitsize_int (tree_to_uhwi (sz) * i);
2094 op0 = fold_build3_loc (loc, BIT_FIELD_REF, eltype, arg0, sz, bitpos);
2095 op1 = fold_build3_loc (loc, BIT_FIELD_REF, eltype, arg1, sz, bitpos);
2096 if (resv)
2097 res = fold_build3_loc (loc, BIT_FIELD_REF, eltype, resv, sz,
2098 bitpos);
2100 switch (code)
2102 case PLUS_EXPR:
2103 expand_addsub_overflow (loc, PLUS_EXPR, res, op0, op1,
2104 false, false, false, true, &data);
2105 break;
2106 case MINUS_EXPR:
2107 if (use_loop_p ? integer_zerop (arg0) : integer_zerop (op0))
2108 expand_neg_overflow (loc, res, op1, true, &data);
2109 else
2110 expand_addsub_overflow (loc, MINUS_EXPR, res, op0, op1,
2111 false, false, false, true, &data);
2112 break;
2113 case MULT_EXPR:
2114 expand_mul_overflow (loc, res, op0, op1, false, false, false,
2115 true, &data);
2116 break;
2117 default:
2118 gcc_unreachable ();
2121 if (use_loop_p)
2123 struct separate_ops ops;
2124 ops.code = PLUS_EXPR;
2125 ops.type = TREE_TYPE (cntv);
2126 ops.op0 = cntv;
2127 ops.op1 = build_int_cst (TREE_TYPE (cntv), 1);
2128 ops.op2 = NULL_TREE;
2129 ops.location = loc;
2130 rtx ret = expand_expr_real_2 (&ops, cntvar, TYPE_MODE (sizetype),
2131 EXPAND_NORMAL);
2132 if (ret != cntvar)
2133 emit_move_insn (cntvar, ret);
2134 rtx cntrtx = gen_int_mode (cnt, TYPE_MODE (sizetype));
2135 do_compare_rtx_and_jump (cntvar, cntrtx, NE, false,
2136 TYPE_MODE (sizetype), NULL_RTX, NULL, loop_lab,
2137 profile_probability::very_likely ());
2139 if (lhs && resv == NULL_TREE)
2141 struct separate_ops ops;
2142 ops.code = code;
2143 ops.type = TREE_TYPE (arg0);
2144 ops.op0 = arg0;
2145 ops.op1 = arg1;
2146 ops.op2 = NULL_TREE;
2147 ops.location = loc;
2148 rtx ret = expand_expr_real_2 (&ops, lhsr, TYPE_MODE (TREE_TYPE (arg0)),
2149 EXPAND_NORMAL);
2150 if (ret != lhsr)
2151 emit_move_insn (lhsr, ret);
2153 else if (resvr)
2154 emit_move_insn (lhsr, resvr);
2157 /* Expand UBSAN_CHECK_ADD call STMT. */
2159 static void
2160 expand_UBSAN_CHECK_ADD (internal_fn, gcall *stmt)
2162 location_t loc = gimple_location (stmt);
2163 tree lhs = gimple_call_lhs (stmt);
2164 tree arg0 = gimple_call_arg (stmt, 0);
2165 tree arg1 = gimple_call_arg (stmt, 1);
2166 if (VECTOR_TYPE_P (TREE_TYPE (arg0)))
2167 expand_vector_ubsan_overflow (loc, PLUS_EXPR, lhs, arg0, arg1);
2168 else
2169 expand_addsub_overflow (loc, PLUS_EXPR, lhs, arg0, arg1,
2170 false, false, false, true, NULL);
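/* For illustration (assumed GIMPLE shape, not taken from this file):
   with -fsanitize=signed-integer-overflow a signed addition such as
   "c = a + b;" is instrumented as something like

     c_3 = UBSAN_CHECK_ADD (a_1, b_2);

   and the expander above emits the overflow check plus the runtime
   diagnostic call on the failure path.  */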
2173 /* Expand UBSAN_CHECK_SUB call STMT. */
2175 static void
2176 expand_UBSAN_CHECK_SUB (internal_fn, gcall *stmt)
2178 location_t loc = gimple_location (stmt);
2179 tree lhs = gimple_call_lhs (stmt);
2180 tree arg0 = gimple_call_arg (stmt, 0);
2181 tree arg1 = gimple_call_arg (stmt, 1);
2182 if (VECTOR_TYPE_P (TREE_TYPE (arg0)))
2183 expand_vector_ubsan_overflow (loc, MINUS_EXPR, lhs, arg0, arg1);
2184 else if (integer_zerop (arg0))
2185 expand_neg_overflow (loc, lhs, arg1, true, NULL);
2186 else
2187 expand_addsub_overflow (loc, MINUS_EXPR, lhs, arg0, arg1,
2188 false, false, false, true, NULL);
2191 /* Expand UBSAN_CHECK_MUL call STMT. */
2193 static void
2194 expand_UBSAN_CHECK_MUL (internal_fn, gcall *stmt)
2196 location_t loc = gimple_location (stmt);
2197 tree lhs = gimple_call_lhs (stmt);
2198 tree arg0 = gimple_call_arg (stmt, 0);
2199 tree arg1 = gimple_call_arg (stmt, 1);
2200 if (VECTOR_TYPE_P (TREE_TYPE (arg0)))
2201 expand_vector_ubsan_overflow (loc, MULT_EXPR, lhs, arg0, arg1);
2202 else
2203 expand_mul_overflow (loc, lhs, arg0, arg1, false, false, false, true,
2204 NULL);
2207 /* Helper function for {ADD,SUB,MUL}_OVERFLOW call stmt expansion. */
2209 static void
2210 expand_arith_overflow (enum tree_code code, gimple *stmt)
2212 tree lhs = gimple_call_lhs (stmt);
2213 if (lhs == NULL_TREE)
2214 return;
2215 tree arg0 = gimple_call_arg (stmt, 0);
2216 tree arg1 = gimple_call_arg (stmt, 1);
2217 tree type = TREE_TYPE (TREE_TYPE (lhs));
2218 int uns0_p = TYPE_UNSIGNED (TREE_TYPE (arg0));
2219 int uns1_p = TYPE_UNSIGNED (TREE_TYPE (arg1));
2220 int unsr_p = TYPE_UNSIGNED (type);
2221 int prec0 = TYPE_PRECISION (TREE_TYPE (arg0));
2222 int prec1 = TYPE_PRECISION (TREE_TYPE (arg1));
2223 int precres = TYPE_PRECISION (type);
2224 location_t loc = gimple_location (stmt);
2225 if (!uns0_p && get_range_pos_neg (arg0) == 1)
2226 uns0_p = true;
2227 if (!uns1_p && get_range_pos_neg (arg1) == 1)
2228 uns1_p = true;
2229 int pr = get_min_precision (arg0, uns0_p ? UNSIGNED : SIGNED);
2230 prec0 = MIN (prec0, pr);
2231 pr = get_min_precision (arg1, uns1_p ? UNSIGNED : SIGNED);
2232 prec1 = MIN (prec1, pr);
2234 /* If uns0_p && uns1_p, precop is the minimum precision of an
2235 unsigned type needed to hold the exact result; otherwise it is
2236 the minimum precision of a signed type needed to hold the
2237 exact result. */
2238 int precop;
2239 if (code == MULT_EXPR)
2240 precop = prec0 + prec1 + (uns0_p != uns1_p);
2241 else
2243 if (uns0_p == uns1_p)
2244 precop = MAX (prec0, prec1) + 1;
2245 else if (uns0_p)
2246 precop = MAX (prec0 + 1, prec1) + 1;
2247 else
2248 precop = MAX (prec0, prec1 + 1) + 1;
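/* Illustrative numbers (assumed, not from the source): for
   __builtin_add_overflow with two 32-bit signed operands of unknown
   range and a 32-bit signed result, prec0 == prec1 == 32 and
   precop == 33, which exceeds precres == 32, so the shortcut below
   cannot be used; with a 64-bit result precop == 33 <= precres == 64
   and the operation is simply performed in the result type.  */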
2250 int orig_precres = precres;
2254 if ((uns0_p && uns1_p)
2255 ? ((precop + !unsr_p) <= precres
2256 /* u1 - u2 -> ur can overflow, no matter what precision
2257 the result has. */
2258 && (code != MINUS_EXPR || !unsr_p))
2259 : (!unsr_p && precop <= precres))
2261 /* The infinite precision result will always fit into the result. */
2262 rtx target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
2263 write_complex_part (target, const0_rtx, true);
2264 scalar_int_mode mode = SCALAR_INT_TYPE_MODE (type);
2265 struct separate_ops ops;
2266 ops.code = code;
2267 ops.type = type;
2268 ops.op0 = fold_convert_loc (loc, type, arg0);
2269 ops.op1 = fold_convert_loc (loc, type, arg1);
2270 ops.op2 = NULL_TREE;
2271 ops.location = loc;
2272 rtx tem = expand_expr_real_2 (&ops, NULL_RTX, mode, EXPAND_NORMAL);
2273 expand_arith_overflow_result_store (lhs, target, mode, tem);
2274 return;
2277 /* For operations with low precision, if the target doesn't support
2278 them, start with precres widening right away; otherwise do it only
2279 if the simplest cases can't be used. */
2280 const int min_precision = targetm.min_arithmetic_precision ();
2281 if (orig_precres == precres && precres < min_precision)
2283 else if ((uns0_p && uns1_p && unsr_p && prec0 <= precres
2284 && prec1 <= precres)
2285 || ((!uns0_p || !uns1_p) && !unsr_p
2286 && prec0 + uns0_p <= precres
2287 && prec1 + uns1_p <= precres))
2289 arg0 = fold_convert_loc (loc, type, arg0);
2290 arg1 = fold_convert_loc (loc, type, arg1);
2291 switch (code)
2293 case MINUS_EXPR:
2294 if (integer_zerop (arg0) && !unsr_p)
2296 expand_neg_overflow (loc, lhs, arg1, false, NULL);
2297 return;
2299 /* FALLTHRU */
2300 case PLUS_EXPR:
2301 expand_addsub_overflow (loc, code, lhs, arg0, arg1, unsr_p,
2302 unsr_p, unsr_p, false, NULL);
2303 return;
2304 case MULT_EXPR:
2305 expand_mul_overflow (loc, lhs, arg0, arg1, unsr_p,
2306 unsr_p, unsr_p, false, NULL);
2307 return;
2308 default:
2309 gcc_unreachable ();
2313 /* For sub-word operations, retry with a wider type first. */
2314 if (orig_precres == precres && precop <= BITS_PER_WORD)
2316 int p = MAX (min_precision, precop);
2317 scalar_int_mode m = smallest_int_mode_for_size (p);
2318 tree optype = build_nonstandard_integer_type (GET_MODE_PRECISION (m),
2319 uns0_p && uns1_p
2320 && unsr_p);
2321 p = TYPE_PRECISION (optype);
2322 if (p > precres)
2324 precres = p;
2325 unsr_p = TYPE_UNSIGNED (optype);
2326 type = optype;
2327 continue;
2331 if (prec0 <= precres && prec1 <= precres)
2333 tree types[2];
2334 if (unsr_p)
2336 types[0] = build_nonstandard_integer_type (precres, 0);
2337 types[1] = type;
2339 else
2341 types[0] = type;
2342 types[1] = build_nonstandard_integer_type (precres, 1);
2344 arg0 = fold_convert_loc (loc, types[uns0_p], arg0);
2345 arg1 = fold_convert_loc (loc, types[uns1_p], arg1);
2346 if (code != MULT_EXPR)
2347 expand_addsub_overflow (loc, code, lhs, arg0, arg1, unsr_p,
2348 uns0_p, uns1_p, false, NULL);
2349 else
2350 expand_mul_overflow (loc, lhs, arg0, arg1, unsr_p,
2351 uns0_p, uns1_p, false, NULL);
2352 return;
2355 /* Retry with a wider type. */
2356 if (orig_precres == precres)
2358 int p = MAX (prec0, prec1);
2359 scalar_int_mode m = smallest_int_mode_for_size (p);
2360 tree optype = build_nonstandard_integer_type (GET_MODE_PRECISION (m),
2361 uns0_p && uns1_p
2362 && unsr_p);
2363 p = TYPE_PRECISION (optype);
2364 if (p > precres)
2366 precres = p;
2367 unsr_p = TYPE_UNSIGNED (optype);
2368 type = optype;
2369 continue;
2373 gcc_unreachable ();
2375 while (1);
2378 /* Expand ADD_OVERFLOW STMT. */
2380 static void
2381 expand_ADD_OVERFLOW (internal_fn, gcall *stmt)
2383 expand_arith_overflow (PLUS_EXPR, stmt);
2386 /* Expand SUB_OVERFLOW STMT. */
2388 static void
2389 expand_SUB_OVERFLOW (internal_fn, gcall *stmt)
2391 expand_arith_overflow (MINUS_EXPR, stmt);
2394 /* Expand MUL_OVERFLOW STMT. */
2396 static void
2397 expand_MUL_OVERFLOW (internal_fn, gcall *stmt)
2399 expand_arith_overflow (MULT_EXPR, stmt);
2402 /* This should get folded in tree-vectorizer.c. */
2404 static void
2405 expand_LOOP_VECTORIZED (internal_fn, gcall *)
2407 gcc_unreachable ();
2410 /* This should get folded in tree-vectorizer.c. */
2412 static void
2413 expand_LOOP_DIST_ALIAS (internal_fn, gcall *)
2415 gcc_unreachable ();
2418 /* Return a memory reference of type TYPE for argument INDEX of STMT.
2419 Use argument INDEX + 1 to derive the second (TBAA) operand. */
2421 static tree
2422 expand_call_mem_ref (tree type, gcall *stmt, int index)
2424 tree addr = gimple_call_arg (stmt, index);
2425 tree alias_ptr_type = TREE_TYPE (gimple_call_arg (stmt, index + 1));
2426 unsigned int align = tree_to_shwi (gimple_call_arg (stmt, index + 1));
2427 if (TYPE_ALIGN (type) != align)
2428 type = build_aligned_type (type, align);
2430 tree tmp = addr;
2431 if (TREE_CODE (tmp) == SSA_NAME)
2433 gimple *def = SSA_NAME_DEF_STMT (tmp);
2434 if (gimple_assign_single_p (def))
2435 tmp = gimple_assign_rhs1 (def);
2438 if (TREE_CODE (tmp) == ADDR_EXPR)
2440 tree mem = TREE_OPERAND (tmp, 0);
2441 if (TREE_CODE (mem) == TARGET_MEM_REF
2442 && types_compatible_p (TREE_TYPE (mem), type))
2444 tree offset = TMR_OFFSET (mem);
2445 if (alias_ptr_type != TREE_TYPE (offset) || !integer_zerop (offset))
2447 mem = copy_node (mem);
2448 TMR_OFFSET (mem) = wide_int_to_tree (alias_ptr_type,
2449 wi::to_poly_wide (offset));
2451 return mem;
2455 return fold_build2 (MEM_REF, type, addr, build_int_cst (alias_ptr_type, 0));
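/* For reference (shape inferred from the callers below): a masked
   load or store call passes the base pointer as argument INDEX and,
   as argument INDEX + 1, an integer constant whose value is the
   alignment and whose pointer type carries the TBAA information,
   which is why both expanders below call this with INDEX == 0.  */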
2458 /* Expand MASK_LOAD{,_LANES} call STMT using optab OPTAB. */
2460 static void
2461 expand_mask_load_optab_fn (internal_fn, gcall *stmt, convert_optab optab)
2463 struct expand_operand ops[3];
2464 tree type, lhs, rhs, maskt;
2465 rtx mem, target, mask;
2466 insn_code icode;
2468 maskt = gimple_call_arg (stmt, 2);
2469 lhs = gimple_call_lhs (stmt);
2470 if (lhs == NULL_TREE)
2471 return;
2472 type = TREE_TYPE (lhs);
2473 rhs = expand_call_mem_ref (type, stmt, 0);
2475 if (optab == vec_mask_load_lanes_optab)
2476 icode = get_multi_vector_move (type, optab);
2477 else
2478 icode = convert_optab_handler (optab, TYPE_MODE (type),
2479 TYPE_MODE (TREE_TYPE (maskt)));
2481 mem = expand_expr (rhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
2482 gcc_assert (MEM_P (mem));
2483 mask = expand_normal (maskt);
2484 target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
2485 create_output_operand (&ops[0], target, TYPE_MODE (type));
2486 create_fixed_operand (&ops[1], mem);
2487 create_input_operand (&ops[2], mask, TYPE_MODE (TREE_TYPE (maskt)));
2488 expand_insn (icode, 3, ops);
2491 #define expand_mask_load_lanes_optab_fn expand_mask_load_optab_fn
2493 /* Expand MASK_STORE{,_LANES} call STMT using optab OPTAB. */
2495 static void
2496 expand_mask_store_optab_fn (internal_fn, gcall *stmt, convert_optab optab)
2498 struct expand_operand ops[3];
2499 tree type, lhs, rhs, maskt;
2500 rtx mem, reg, mask;
2501 insn_code icode;
2503 maskt = gimple_call_arg (stmt, 2);
2504 rhs = gimple_call_arg (stmt, 3);
2505 type = TREE_TYPE (rhs);
2506 lhs = expand_call_mem_ref (type, stmt, 0);
2508 if (optab == vec_mask_store_lanes_optab)
2509 icode = get_multi_vector_move (type, optab);
2510 else
2511 icode = convert_optab_handler (optab, TYPE_MODE (type),
2512 TYPE_MODE (TREE_TYPE (maskt)));
2514 mem = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
2515 gcc_assert (MEM_P (mem));
2516 mask = expand_normal (maskt);
2517 reg = expand_normal (rhs);
2518 create_fixed_operand (&ops[0], mem);
2519 create_input_operand (&ops[1], reg, TYPE_MODE (type));
2520 create_input_operand (&ops[2], mask, TYPE_MODE (TREE_TYPE (maskt)));
2521 expand_insn (icode, 3, ops);
2524 #define expand_mask_store_lanes_optab_fn expand_mask_store_optab_fn
2526 static void
2527 expand_ABNORMAL_DISPATCHER (internal_fn, gcall *)
2531 static void
2532 expand_BUILTIN_EXPECT (internal_fn, gcall *stmt)
2534 /* When guessing was done, the hints should already have been stripped away. */
2535 gcc_assert (!flag_guess_branch_prob || optimize == 0 || seen_error ());
2537 rtx target;
2538 tree lhs = gimple_call_lhs (stmt);
2539 if (lhs)
2540 target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
2541 else
2542 target = const0_rtx;
2543 rtx val = expand_expr (gimple_call_arg (stmt, 0), target, VOIDmode, EXPAND_NORMAL);
2544 if (lhs && val != target)
2545 emit_move_insn (target, val);
2548 /* IFN_VA_ARG is supposed to be expanded at pass_stdarg. So this dummy function
2549 should never be called. */
2551 static void
2552 expand_VA_ARG (internal_fn, gcall *)
2554 gcc_unreachable ();
2557 /* Expand the IFN_UNIQUE function according to its first argument. */
2559 static void
2560 expand_UNIQUE (internal_fn, gcall *stmt)
2562 rtx pattern = NULL_RTX;
2563 enum ifn_unique_kind kind
2564 = (enum ifn_unique_kind) TREE_INT_CST_LOW (gimple_call_arg (stmt, 0));
2566 switch (kind)
2568 default:
2569 gcc_unreachable ();
2571 case IFN_UNIQUE_UNSPEC:
2572 if (targetm.have_unique ())
2573 pattern = targetm.gen_unique ();
2574 break;
2576 case IFN_UNIQUE_OACC_FORK:
2577 case IFN_UNIQUE_OACC_JOIN:
2578 if (targetm.have_oacc_fork () && targetm.have_oacc_join ())
2580 tree lhs = gimple_call_lhs (stmt);
2581 rtx target = const0_rtx;
2583 if (lhs)
2584 target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
2586 rtx data_dep = expand_normal (gimple_call_arg (stmt, 1));
2587 rtx axis = expand_normal (gimple_call_arg (stmt, 2));
2589 if (kind == IFN_UNIQUE_OACC_FORK)
2590 pattern = targetm.gen_oacc_fork (target, data_dep, axis);
2591 else
2592 pattern = targetm.gen_oacc_join (target, data_dep, axis);
2594 else
2595 gcc_unreachable ();
2596 break;
2599 if (pattern)
2600 emit_insn (pattern);
2603 /* The size of an OpenACC compute dimension. */
2605 static void
2606 expand_GOACC_DIM_SIZE (internal_fn, gcall *stmt)
2608 tree lhs = gimple_call_lhs (stmt);
2610 if (!lhs)
2611 return;
2613 rtx target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
2614 if (targetm.have_oacc_dim_size ())
2616 rtx dim = expand_expr (gimple_call_arg (stmt, 0), NULL_RTX,
2617 VOIDmode, EXPAND_NORMAL);
2618 emit_insn (targetm.gen_oacc_dim_size (target, dim));
2620 else
2621 emit_move_insn (target, GEN_INT (1));
2624 /* The position of an OpenACC execution engine along one compute axis. */
2626 static void
2627 expand_GOACC_DIM_POS (internal_fn, gcall *stmt)
2629 tree lhs = gimple_call_lhs (stmt);
2631 if (!lhs)
2632 return;
2634 rtx target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
2635 if (targetm.have_oacc_dim_pos ())
2637 rtx dim = expand_expr (gimple_call_arg (stmt, 0), NULL_RTX,
2638 VOIDmode, EXPAND_NORMAL);
2639 emit_insn (targetm.gen_oacc_dim_pos (target, dim));
2641 else
2642 emit_move_insn (target, const0_rtx);
2645 /* This is expanded by oacc_device_lower pass. */
2647 static void
2648 expand_GOACC_LOOP (internal_fn, gcall *)
2650 gcc_unreachable ();
2653 /* This is expanded by oacc_device_lower pass. */
2655 static void
2656 expand_GOACC_REDUCTION (internal_fn, gcall *)
2658 gcc_unreachable ();
2661 /* This is expanded by oacc_device_lower pass. */
2663 static void
2664 expand_GOACC_TILE (internal_fn, gcall *)
2666 gcc_unreachable ();
2669 /* Set errno to EDOM. */
2671 static void
2672 expand_SET_EDOM (internal_fn, gcall *)
2674 #ifdef TARGET_EDOM
2675 #ifdef GEN_ERRNO_RTX
2676 rtx errno_rtx = GEN_ERRNO_RTX;
2677 #else
2678 rtx errno_rtx = gen_rtx_MEM (word_mode, gen_rtx_SYMBOL_REF (Pmode, "errno"));
2679 #endif
2680 emit_move_insn (errno_rtx,
2681 gen_int_mode (TARGET_EDOM, GET_MODE (errno_rtx)));
2682 #else
2683 gcc_unreachable ();
2684 #endif
2687 /* Expand atomic bit test and set. */
2689 static void
2690 expand_ATOMIC_BIT_TEST_AND_SET (internal_fn, gcall *call)
2692 expand_ifn_atomic_bit_test_and (call);
2695 /* Expand atomic bit test and complement. */
2697 static void
2698 expand_ATOMIC_BIT_TEST_AND_COMPLEMENT (internal_fn, gcall *call)
2700 expand_ifn_atomic_bit_test_and (call);
2703 /* Expand atomic bit test and reset. */
2705 static void
2706 expand_ATOMIC_BIT_TEST_AND_RESET (internal_fn, gcall *call)
2708 expand_ifn_atomic_bit_test_and (call);
2711 /* Expand atomic compare and exchange. */
2713 static void
2714 expand_ATOMIC_COMPARE_EXCHANGE (internal_fn, gcall *call)
2716 expand_ifn_atomic_compare_exchange (call);
2719 /* Expand LAUNDER to assignment, lhs = arg0. */
2721 static void
2722 expand_LAUNDER (internal_fn, gcall *call)
2724 tree lhs = gimple_call_lhs (call);
2726 if (!lhs)
2727 return;
2729 expand_assignment (lhs, gimple_call_arg (call, 0), false);
2732 /* Expand DIVMOD () using:
2733 a) the optab handler for udivmod/sdivmod if it is available.
2734 b) If the optab handler doesn't exist, generate a call to the
2735 target-specific divmod libfunc. */
2737 static void
2738 expand_DIVMOD (internal_fn, gcall *call_stmt)
2740 tree lhs = gimple_call_lhs (call_stmt);
2741 tree arg0 = gimple_call_arg (call_stmt, 0);
2742 tree arg1 = gimple_call_arg (call_stmt, 1);
2744 gcc_assert (TREE_CODE (TREE_TYPE (lhs)) == COMPLEX_TYPE);
2745 tree type = TREE_TYPE (TREE_TYPE (lhs));
2746 machine_mode mode = TYPE_MODE (type);
2747 bool unsignedp = TYPE_UNSIGNED (type);
2748 optab tab = (unsignedp) ? udivmod_optab : sdivmod_optab;
2750 rtx op0 = expand_normal (arg0);
2751 rtx op1 = expand_normal (arg1);
2752 rtx target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
2754 rtx quotient, remainder, libfunc;
2756 /* Check if optab_handler exists for divmod_optab for given mode. */
2757 if (optab_handler (tab, mode) != CODE_FOR_nothing)
2759 quotient = gen_reg_rtx (mode);
2760 remainder = gen_reg_rtx (mode);
2761 expand_twoval_binop (tab, op0, op1, quotient, remainder, unsignedp);
2764 /* Generate call to divmod libfunc if it exists. */
2765 else if ((libfunc = optab_libfunc (tab, mode)) != NULL_RTX)
2766 targetm.expand_divmod_libfunc (libfunc, mode, op0, op1,
2767 &quotient, &remainder);
2769 else
2770 gcc_unreachable ();
2772 /* Wrap the return value (quotient, remainder) within COMPLEX_EXPR. */
2773 expand_expr (build2 (COMPLEX_EXPR, TREE_TYPE (lhs),
2774 make_tree (TREE_TYPE (arg0), quotient),
2775 make_tree (TREE_TYPE (arg1), remainder)),
2776 target, VOIDmode, EXPAND_NORMAL);
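/* For illustration (assumed GIMPLE shape): when both x / y and x % y
   of the same operands are wanted, an earlier pass may combine them
   into something like

     _1 = DIVMOD (x_2, y_3);
     q_4 = REALPART_EXPR <_1>;
     r_5 = IMAGPART_EXPR <_1>;

   which is why the expander above packs quotient and remainder into
   a COMPLEX_EXPR of the lhs type.  */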
2779 /* Expand a NOP. */
2781 static void
2782 expand_NOP (internal_fn, gcall *)
2784 /* Nothing. But it shouldn't really prevail. */
2787 /* Expand a call to FN using the operands in STMT. FN has a single
2788 output operand and NARGS input operands. */
2790 static void
2791 expand_direct_optab_fn (internal_fn fn, gcall *stmt, direct_optab optab,
2792 unsigned int nargs)
2794 expand_operand *ops = XALLOCAVEC (expand_operand, nargs + 1);
2796 tree_pair types = direct_internal_fn_types (fn, stmt);
2797 insn_code icode = direct_optab_handler (optab, TYPE_MODE (types.first));
2799 tree lhs = gimple_call_lhs (stmt);
2800 tree lhs_type = TREE_TYPE (lhs);
2801 rtx lhs_rtx = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
2803 /* Do not assign directly to a promoted subreg, since there is no
2804 guarantee that the instruction will leave the upper bits of the
2805 register in the state required by SUBREG_PROMOTED_SIGN. */
2806 rtx dest = lhs_rtx;
2807 if (GET_CODE (dest) == SUBREG && SUBREG_PROMOTED_VAR_P (dest))
2808 dest = NULL_RTX;
2810 create_output_operand (&ops[0], dest, insn_data[icode].operand[0].mode);
2812 for (unsigned int i = 0; i < nargs; ++i)
2814 tree rhs = gimple_call_arg (stmt, i);
2815 tree rhs_type = TREE_TYPE (rhs);
2816 rtx rhs_rtx = expand_normal (rhs);
2817 if (INTEGRAL_TYPE_P (rhs_type))
2818 create_convert_operand_from (&ops[i + 1], rhs_rtx,
2819 TYPE_MODE (rhs_type),
2820 TYPE_UNSIGNED (rhs_type));
2821 else
2822 create_input_operand (&ops[i + 1], rhs_rtx, TYPE_MODE (rhs_type));
2825 expand_insn (icode, nargs + 1, ops);
2826 if (!rtx_equal_p (lhs_rtx, ops[0].value))
2828 /* If the return value has an integral type, convert the instruction
2829 result to that type. This is useful for things that return an
2830 int regardless of the size of the input. If the instruction result
2831 is smaller than required, assume that it is signed.
2833 If the return value has a nonintegral type, its mode must match
2834 the instruction result. */
2835 if (GET_CODE (lhs_rtx) == SUBREG && SUBREG_PROMOTED_VAR_P (lhs_rtx))
2837 /* If this is a scalar in a register that is stored in a wider
2838 mode than the declared mode, compute the result into its
2839 declared mode and then convert to the wider mode. */
2840 gcc_checking_assert (INTEGRAL_TYPE_P (lhs_type));
2841 rtx tmp = convert_to_mode (GET_MODE (lhs_rtx), ops[0].value, 0);
2842 convert_move (SUBREG_REG (lhs_rtx), tmp,
2843 SUBREG_PROMOTED_SIGN (lhs_rtx));
2845 else if (GET_MODE (lhs_rtx) == GET_MODE (ops[0].value))
2846 emit_move_insn (lhs_rtx, ops[0].value);
2847 else
2849 gcc_checking_assert (INTEGRAL_TYPE_P (lhs_type));
2850 convert_move (lhs_rtx, ops[0].value, 0);
2855 /* Expand WHILE_ULT call STMT using optab OPTAB. */
2857 static void
2858 expand_while_optab_fn (internal_fn, gcall *stmt, convert_optab optab)
2860 expand_operand ops[3];
2861 tree rhs_type[2];
2863 tree lhs = gimple_call_lhs (stmt);
2864 tree lhs_type = TREE_TYPE (lhs);
2865 rtx lhs_rtx = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
2866 create_output_operand (&ops[0], lhs_rtx, TYPE_MODE (lhs_type));
2868 for (unsigned int i = 0; i < 2; ++i)
2870 tree rhs = gimple_call_arg (stmt, i);
2871 rhs_type[i] = TREE_TYPE (rhs);
2872 rtx rhs_rtx = expand_normal (rhs);
2873 create_input_operand (&ops[i + 1], rhs_rtx, TYPE_MODE (rhs_type[i]));
2876 insn_code icode = convert_optab_handler (optab, TYPE_MODE (rhs_type[0]),
2877 TYPE_MODE (lhs_type));
2879 expand_insn (icode, 3, ops);
2880 if (!rtx_equal_p (lhs_rtx, ops[0].value))
2881 emit_move_insn (lhs_rtx, ops[0].value);
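/* As a reminder of the semantics being expanded (hedged summary; see
   internal-fn.def for the authoritative description): WHILE_ULT (A, B)
   produces a mask whose element I is set iff A + I < B, which is how
   fully-masked loops compute the control mask for each iteration.  */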
2884 /* Expanders for optabs that can use expand_direct_optab_fn. */
2886 #define expand_unary_optab_fn(FN, STMT, OPTAB) \
2887 expand_direct_optab_fn (FN, STMT, OPTAB, 1)
2889 #define expand_binary_optab_fn(FN, STMT, OPTAB) \
2890 expand_direct_optab_fn (FN, STMT, OPTAB, 2)
2892 #define expand_cond_unary_optab_fn(FN, STMT, OPTAB) \
2893 expand_direct_optab_fn (FN, STMT, OPTAB, 2)
2895 #define expand_cond_binary_optab_fn(FN, STMT, OPTAB) \
2896 expand_direct_optab_fn (FN, STMT, OPTAB, 3)
2898 #define expand_fold_extract_optab_fn(FN, STMT, OPTAB) \
2899 expand_direct_optab_fn (FN, STMT, OPTAB, 3)
2901 #define expand_fold_left_optab_fn(FN, STMT, OPTAB) \
2902 expand_direct_optab_fn (FN, STMT, OPTAB, 2)
2904 /* RETURN_TYPE and ARGS are a return type and argument list that are
2905 in principle compatible with FN (which satisfies direct_internal_fn_p).
2906 Return the types that should be used to determine whether the
2907 target supports FN. */
2909 tree_pair
2910 direct_internal_fn_types (internal_fn fn, tree return_type, tree *args)
2912 const direct_internal_fn_info &info = direct_internal_fn (fn);
2913 tree type0 = (info.type0 < 0 ? return_type : TREE_TYPE (args[info.type0]));
2914 tree type1 = (info.type1 < 0 ? return_type : TREE_TYPE (args[info.type1]));
2915 return tree_pair (type0, type1);
2918 /* CALL is a call whose return type and arguments are in principle
2919 compatible with FN (which satisfies direct_internal_fn_p). Return the
2920 types that should be used to determine whether the target supports FN. */
2922 tree_pair
2923 direct_internal_fn_types (internal_fn fn, gcall *call)
2925 const direct_internal_fn_info &info = direct_internal_fn (fn);
2926 tree op0 = (info.type0 < 0
2927 ? gimple_call_lhs (call)
2928 : gimple_call_arg (call, info.type0));
2929 tree op1 = (info.type1 < 0
2930 ? gimple_call_lhs (call)
2931 : gimple_call_arg (call, info.type1));
2932 return tree_pair (TREE_TYPE (op0), TREE_TYPE (op1));
2935 /* Return true if OPTAB is supported for TYPES (whose modes should be
2936 the same) when the optimization type is OPT_TYPE. Used for simple
2937 direct optabs. */
2939 static bool
2940 direct_optab_supported_p (direct_optab optab, tree_pair types,
2941 optimization_type opt_type)
2943 machine_mode mode = TYPE_MODE (types.first);
2944 gcc_checking_assert (mode == TYPE_MODE (types.second));
2945 return direct_optab_handler (optab, mode, opt_type) != CODE_FOR_nothing;
2948 /* Return true if OPTAB is supported for TYPES, where the first type
2949 is the destination and the second type is the source. Used for
2950 convert optabs. */
2952 static bool
2953 convert_optab_supported_p (convert_optab optab, tree_pair types,
2954 optimization_type opt_type)
2956 return (convert_optab_handler (optab, TYPE_MODE (types.first),
2957 TYPE_MODE (types.second), opt_type)
2958 != CODE_FOR_nothing);
2961 /* Return true if load/store lanes optab OPTAB is supported for
2962 array type TYPES.first when the optimization type is OPT_TYPE. */
2964 static bool
2965 multi_vector_optab_supported_p (convert_optab optab, tree_pair types,
2966 optimization_type opt_type)
2968 gcc_assert (TREE_CODE (types.first) == ARRAY_TYPE);
2969 machine_mode imode = TYPE_MODE (types.first);
2970 machine_mode vmode = TYPE_MODE (TREE_TYPE (types.first));
2971 return (convert_optab_handler (optab, imode, vmode, opt_type)
2972 != CODE_FOR_nothing);
2975 #define direct_unary_optab_supported_p direct_optab_supported_p
2976 #define direct_binary_optab_supported_p direct_optab_supported_p
2977 #define direct_cond_unary_optab_supported_p direct_optab_supported_p
2978 #define direct_cond_binary_optab_supported_p direct_optab_supported_p
2979 #define direct_mask_load_optab_supported_p direct_optab_supported_p
2980 #define direct_load_lanes_optab_supported_p multi_vector_optab_supported_p
2981 #define direct_mask_load_lanes_optab_supported_p multi_vector_optab_supported_p
2982 #define direct_mask_store_optab_supported_p direct_optab_supported_p
2983 #define direct_store_lanes_optab_supported_p multi_vector_optab_supported_p
2984 #define direct_mask_store_lanes_optab_supported_p multi_vector_optab_supported_p
2985 #define direct_while_optab_supported_p convert_optab_supported_p
2986 #define direct_fold_extract_optab_supported_p direct_optab_supported_p
2987 #define direct_fold_left_optab_supported_p direct_optab_supported_p
2989 /* Return the optab used by internal function FN. */
2991 static optab
2992 direct_internal_fn_optab (internal_fn fn, tree_pair types)
2994 switch (fn)
2996 #define DEF_INTERNAL_FN(CODE, FLAGS, FNSPEC) \
2997 case IFN_##CODE: break;
2998 #define DEF_INTERNAL_OPTAB_FN(CODE, FLAGS, OPTAB, TYPE) \
2999 case IFN_##CODE: return OPTAB##_optab;
3000 #define DEF_INTERNAL_SIGNED_OPTAB_FN(CODE, FLAGS, SELECTOR, SIGNED_OPTAB, \
3001 UNSIGNED_OPTAB, TYPE) \
3002 case IFN_##CODE: return (TYPE_UNSIGNED (types.SELECTOR) \
3003 ? UNSIGNED_OPTAB ## _optab \
3004 : SIGNED_OPTAB ## _optab);
3005 #include "internal-fn.def"
3007 case IFN_LAST:
3008 break;
3010 gcc_unreachable ();
3013 /* Return true if FN is supported for the types in TYPES when the
3014 optimization type is OPT_TYPE. The types are those associated with
3015 the "type0" and "type1" fields of FN's direct_internal_fn_info
3016 structure. */
3018 bool
3019 direct_internal_fn_supported_p (internal_fn fn, tree_pair types,
3020 optimization_type opt_type)
3022 switch (fn)
3024 #define DEF_INTERNAL_FN(CODE, FLAGS, FNSPEC) \
3025 case IFN_##CODE: break;
3026 #define DEF_INTERNAL_OPTAB_FN(CODE, FLAGS, OPTAB, TYPE) \
3027 case IFN_##CODE: \
3028 return direct_##TYPE##_optab_supported_p (OPTAB##_optab, types, \
3029 opt_type);
3030 #define DEF_INTERNAL_SIGNED_OPTAB_FN(CODE, FLAGS, SELECTOR, SIGNED_OPTAB, \
3031 UNSIGNED_OPTAB, TYPE) \
3032 case IFN_##CODE: \
3034 optab which_optab = (TYPE_UNSIGNED (types.SELECTOR) \
3035 ? UNSIGNED_OPTAB ## _optab \
3036 : SIGNED_OPTAB ## _optab); \
3037 return direct_##TYPE##_optab_supported_p (which_optab, types, \
3038 opt_type); \
3040 #include "internal-fn.def"
3042 case IFN_LAST:
3043 break;
3045 gcc_unreachable ();
3048 /* Return true if FN is supported for type TYPE when the optimization
3049 type is OPT_TYPE. The caller knows that the "type0" and "type1"
3050 fields of FN's direct_internal_fn_info structure are the same. */
3052 bool
3053 direct_internal_fn_supported_p (internal_fn fn, tree type,
3054 optimization_type opt_type)
3056 const direct_internal_fn_info &info = direct_internal_fn (fn);
3057 gcc_checking_assert (info.type0 == info.type1);
3058 return direct_internal_fn_supported_p (fn, tree_pair (type, type), opt_type);
3061 /* Return true if IFN_SET_EDOM is supported. */
3063 bool
3064 set_edom_supported_p (void)
3066 #ifdef TARGET_EDOM
3067 return true;
3068 #else
3069 return false;
3070 #endif
3073 #define DEF_INTERNAL_OPTAB_FN(CODE, FLAGS, OPTAB, TYPE) \
3074 static void \
3075 expand_##CODE (internal_fn fn, gcall *stmt) \
3077 expand_##TYPE##_optab_fn (fn, stmt, OPTAB##_optab); \
3079 #define DEF_INTERNAL_SIGNED_OPTAB_FN(CODE, FLAGS, SELECTOR, SIGNED_OPTAB, \
3080 UNSIGNED_OPTAB, TYPE) \
3081 static void \
3082 expand_##CODE (internal_fn fn, gcall *stmt) \
3084 tree_pair types = direct_internal_fn_types (fn, stmt); \
3085 optab which_optab = direct_internal_fn_optab (fn, types); \
3086 expand_##TYPE##_optab_fn (fn, stmt, which_optab); \
3088 #include "internal-fn.def"
3090 /* Routines to expand each internal function, indexed by function number.
3091 Each routine has the prototype:
3093 expand_<NAME> (internal_fn fn, gcall *stmt)
3095 where STMT is the statement that performs the call. */
3096 static void (*const internal_fn_expanders[]) (internal_fn, gcall *) = {
3097 #define DEF_INTERNAL_FN(CODE, FLAGS, FNSPEC) expand_##CODE,
3098 #include "internal-fn.def"
3102 /* Return a function that performs the conditional form of CODE, i.e.:
3104 LHS = RHS1 ? RHS2 CODE RHS3 : RHS2
3106 (operating elementwise if the operands are vectors). Return IFN_LAST
3107 if no such function exists. */
3109 internal_fn
3110 get_conditional_internal_fn (tree_code code)
3112 switch (code)
3114 case PLUS_EXPR:
3115 return IFN_COND_ADD;
3116 case MINUS_EXPR:
3117 return IFN_COND_SUB;
3118 case MIN_EXPR:
3119 return IFN_COND_MIN;
3120 case MAX_EXPR:
3121 return IFN_COND_MAX;
3122 case BIT_AND_EXPR:
3123 return IFN_COND_AND;
3124 case BIT_IOR_EXPR:
3125 return IFN_COND_IOR;
3126 case BIT_XOR_EXPR:
3127 return IFN_COND_XOR;
3128 default:
3129 return IFN_LAST;
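/* For example (following the LHS = RHS1 ? RHS2 CODE RHS3 : RHS2 form
   described above): IFN_COND_ADD (mask, a, b) computes a + b in the
   lanes where mask is true and leaves a unchanged elsewhere, which is
   the shape that predicated targets such as SVE can implement with a
   single masked instruction.  */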
3133 /* Expand STMT as though it were a call to internal function FN. */
3135 void
3136 expand_internal_call (internal_fn fn, gcall *stmt)
3138 internal_fn_expanders[fn] (fn, stmt);
3141 /* Expand STMT, which is a call to internal function FN. */
3143 void
3144 expand_internal_call (gcall *stmt)
3146 expand_internal_call (gimple_call_internal_fn (stmt), stmt);
3149 void
3150 expand_PHI (internal_fn, gcall *)
3152 gcc_unreachable ();