gcc/tree-ssa-loop-niter.c

   1 /* Functions to determine/estimate number of iterations of a loop.
   2    Copyright (C) 2004-2015 Free Software Foundation, Inc.
   3
   4 This file is part of GCC.
   5
   6 GCC is free software; you can redistribute it and/or modify it
   7 under the terms of the GNU General Public License as published by the
   8 Free Software Foundation; either version 3, or (at your option) any
   9 later version.
  10
  11 GCC is distributed in the hope that it will be useful, but WITHOUT
  12 ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  13 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  14 for more details.
  15
  16 You should have received a copy of the GNU General Public License
  17 along with GCC; see the file COPYING3.  If not see
  18 <http://www.gnu.org/licenses/>.  */
  19
  20 #include "config.h"
  21 #include "system.h"
  22 #include "coretypes.h"
  23 #include "tm.h"
  24 #include "hash-set.h"
  25 #include "machmode.h"
  26 #include "vec.h"
  27 #include "double-int.h"
  28 #include "input.h"
  29 #include "alias.h"
  30 #include "symtab.h"
  31 #include "wide-int.h"
  32 #include "inchash.h"
  33 #include "tree.h"
  34 #include "stor-layout.h"
  35 #include "fold-const.h"
  36 #include "calls.h"
  37 #include "hashtab.h"
  38 #include "hard-reg-set.h"
  39 #include "function.h"
  40 #include "rtl.h"
  41 #include "flags.h"
  42 #include "statistics.h"
  43 #include "real.h"
  44 #include "fixed-value.h"
  45 #include "insn-config.h"
  46 #include "expmed.h"
  47 #include "dojump.h"
  48 #include "explow.h"
  49 #include "emit-rtl.h"
  50 #include "varasm.h"
  51 #include "stmt.h"
  52 #include "expr.h"
  53 #include "tm_p.h"
  54 #include "predict.h"
  55 #include "dominance.h"
  56 #include "cfg.h"
  57 #include "basic-block.h"
  58 #include "gimple-pretty-print.h"
  59 #include "intl.h"
  60 #include "tree-ssa-alias.h"
  61 #include "internal-fn.h"
  62 #include "gimple-expr.h"
  63 #include "is-a.h"
  64 #include "gimple.h"
  65 #include "gimplify.h"
  66 #include "gimple-iterator.h"
  67 #include "gimple-ssa.h"
  68 #include "tree-cfg.h"
  69 #include "tree-phinodes.h"
  70 #include "ssa-iterators.h"
  71 #include "tree-ssa-loop-ivopts.h"
  72 #include "tree-ssa-loop-niter.h"
  73 #include "tree-ssa-loop.h"
  74 #include "dumpfile.h"
  75 #include "cfgloop.h"
  76 #include "tree-chrec.h"
  77 #include "tree-scalar-evolution.h"
  78 #include "tree-data-ref.h"
  79 #include "params.h"
  80 #include "diagnostic-core.h"
  81 #include "tree-inline.h"
  82 #include "tree-pass.h"
  83 #include "stringpool.h"
  84 #include "tree-ssanames.h"
  85 #include "wide-int-print.h"
  86
  87
     /* Exchanges X and Y.  Both arguments must be modifiable lvalues of type
        affine_iv *, since the temporary is declared with that type.  The
        do { } while (0) wrapper makes the expansion a single statement.  */
  88 #define SWAP(X, Y) do { affine_iv *tmp = (X); (X) = (Y); (Y) = tmp; } while (0)
  89
  90 /* The maximum number of dominator BBs we search for conditions
  91    of loop header copies we use for simplifying a conditional
  92    expression.  Note that in bound_difference the counter compared
        against this limit advances only for dominators that are entered
        through a single true/false edge, so there it limits the number of
        guards examined rather than the number of blocks visited.  */
  93 #define MAX_DOMINATORS_TO_WALK 8
  94
  95 /*
  96
  97    Analysis of number of iterations of an affine exit test.
  98
  99 */
 100
 101 /* Bounds on some value, BELOW <= X <= UP.  Both ends are inclusive.
        bound_difference calls mpz_init on both fields before filling them
        in; no matching mpz_clear is visible in this part of the file, so
        releasing them is presumably left to whoever owns the structure.  */
 102
 103 typedef struct
 104 {
 105   mpz_t below, up;
 106 } bounds;
 107
 108
 109 /* Splits expression EXPR to a variable part VAR and constant OFFSET.
        OFFSET must already be initialized by the caller; its previous value
        is overwritten.

        Only the outermost operation of EXPR is inspected:
        -- OP0 + CST, OP0 - CST and pointer-plus with a constant second
           operand give *VAR = OP0 and OFFSET = CST (negated for minus),
        -- an INTEGER_CST gives *VAR = 0 in the type of EXPR and
           OFFSET = the value of the constant,
        -- anything else gives *VAR = EXPR and OFFSET = 0.  */
 110
 111 static void
 112 split_to_var_and_offset (tree expr, tree *var, mpz_t offset)
 113 {
 114   tree type = TREE_TYPE (expr);
 115   tree op0, op1;
 116   bool negate = false;
 117
       /* Default answer: the whole expression is the variable part.  It
          stays in effect for unhandled tree codes and for additions whose
          second operand is not a constant.  */
 118   *var = expr;
 119   mpz_set_ui (offset, 0);
 120
 121   switch (TREE_CODE (expr))
 122     {
 123     case MINUS_EXPR:
 124       negate = true;
 125       /* Fallthru.  */
 126
 127     case PLUS_EXPR:
 128     case POINTER_PLUS_EXPR:
 129       op0 = TREE_OPERAND (expr, 0);
 130       op1 = TREE_OPERAND (expr, 1);
 131
 132       if (TREE_CODE (op1) != INTEGER_CST)
 133         break;
 134
 135       *var = op0;
 136       /* Always sign extend the offset.  */
 137       wi::to_mpz (op1, offset, SIGNED);
 138       if (negate)
 139         mpz_neg (offset, offset);
 140       break;
 141
 142     case INTEGER_CST:
           /* A bare constant: the variable part is zero and the offset is
              converted using the signedness of the constant's own type
              (unlike the addend above, which is always sign extended).  */
 143       *var = build_int_cst_type (type, 0);
 144       wi::to_mpz (expr, offset, TYPE_SIGN (type));
 145       break;
 146
 147     default:
 148       break;
 149     }
 150 }
 151
 152 /* Stores estimate on the minimum/maximum value of the expression VAR + OFF
 153    in TYPE to MIN and MAX.  MIN and MAX must already be initialized by the
        caller.  LOOP is consulted only for the PHI nodes of its header that
        receive VAR over the preheader edge; range information recorded for
        those PHI results may sharpen the estimate.  */
 154
 155 static void
 156 determine_value_range (struct loop *loop, tree type, tree var, mpz_t off,
 157                        mpz_t min, mpz_t max)
 158 {
 159   wide_int minv, maxv;
 160   enum value_range_type rtype = VR_VARYING;
 161
 162   /* If the expression is a constant, we know its value exactly.  */
 163   if (integer_zerop (var))
 164     {
 165       mpz_set (min, off);
 166       mpz_set (max, off);
 167       return;
 168     }
 169
       /* Fallback answer.  It is returned unchanged further down when TYPE
          may wrap and no usable range information was found.  */
 170   get_type_static_bounds (type, min, max);
 171
 172   /* See if we have some range info from VRP.  */
 173   if (TREE_CODE (var) == SSA_NAME && INTEGRAL_TYPE_P (type))
 174     {
 175       edge e = loop_preheader_edge (loop);
 176       signop sgn = TYPE_SIGN (type);
 177       gphi_iterator gsi;
 178
 179       /* Either for VAR itself...  */
 180       rtype = get_range_info (var, &minv, &maxv);
 181       /* Or for PHI results in loop->header where VAR is used as
 182          PHI argument from the loop preheader edge.  */
 183       for (gsi = gsi_start_phis (loop->header); !gsi_end_p (gsi); gsi_next (&gsi))
 184         {
 185           gphi *phi = gsi.phi ();
 186           wide_int minc, maxc;
 187           if (PHI_ARG_DEF_FROM_EDGE (phi, e) == var
 188               && (get_range_info (gimple_phi_result (phi), &minc, &maxc)
 189                   == VR_RANGE))
 190             {
                   /* The first usable range is taken as is; each later one
                      is intersected with what has been collected so far.  */
 191               if (rtype != VR_RANGE)
 192                 {
 193                   rtype = VR_RANGE;
 194                   minv = minc;
 195                   maxv = maxc;
 196                 }
 197               else
 198                 {
 199                   minv = wi::max (minv, minc, sgn);
 200                   maxv = wi::min (maxv, maxc, sgn);
 201                   /* If the PHI result ranges are inconsistent with
 202                      the VAR range, give up on looking at the PHI
 203                      results.  This can happen if VR_UNDEFINED is
 204                      involved.  */
 205                   if (wi::gt_p (minv, maxv, sgn))
 206                     {
 207                       rtype = get_range_info (var, &minv, &maxv);
 208                       break;
 209                     }
 210                 }
 211             }
 212         }
 213       if (rtype == VR_RANGE)
 214         {
 215           mpz_t minm, maxm;
 216           gcc_assert (wi::le_p (minv, maxv, sgn));
 217           mpz_init (minm);
 218           mpz_init (maxm);
 219           wi::to_mpz (minv, minm, sgn);
 220           wi::to_mpz (maxv, maxm, sgn);
               /* MINM and MAXM now bound VAR; shift them by OFF to bound
                  VAR + OFF, computed without any wrapping.  */
 221           mpz_add (minm, minm, off);
 222           mpz_add (maxm, maxm, off);
 223           /* If the computation may not wrap or off is zero, then this
 224              is always fine.  If off is negative and minv + off isn't
 225              smaller than type's minimum, or off is positive and
 226              maxv + off isn't bigger than type's maximum, use the more
 227              precise range too.  */
 228           if (nowrap_type_p (type)
 229               || mpz_sgn (off) == 0
 230               || (mpz_sgn (off) < 0 && mpz_cmp (minm, min) >= 0)
 231               || (mpz_sgn (off) > 0 && mpz_cmp (maxm, max) <= 0))
 232             {
 233               mpz_set (min, minm);
 234               mpz_set (max, maxm);
 235               mpz_clear (minm);
 236               mpz_clear (maxm);
 237               return;
 238             }
               /* The shifted range could wrap in TYPE, so it is discarded
                  and MIN/MAX keep the fallback values set above.  */
 239           mpz_clear (minm);
 240           mpz_clear (maxm);
 241         }
 242     }
 243
 244   /* If the computation may wrap, we know nothing about the value, except for
 245      the range of the type.  */
 246   if (!nowrap_type_p (type))
 247     return;
 248
 249   /* Since the addition of OFF does not wrap, if OFF is positive, then we may
 250      add it to MIN, otherwise to MAX.  */
 251   if (mpz_sgn (off) < 0)
 252     mpz_add (max, max, off);
 253   else
 254     mpz_add (min, min, off);
 255 }
 256
 257 /* Stores the bounds on the difference of the values of the expressions
 258    (var + X) and (var + Y), computed in TYPE, to BNDS.  Both fields of
        BNDS must already be initialized; X and Y are not modified.  */
 259
 260 static void
 261 bound_difference_of_offsetted_base (tree type, mpz_t x, mpz_t y,
 262                                     bounds *bnds)
 263 {
 264   int rel = mpz_cmp (x, y);
 265   bool may_wrap = !nowrap_type_p (type);
 266   mpz_t m;
 267
 268   /* If X == Y, then the expressions are always equal.
 269      If X > Y, there are the following possibilities:
 270        a) neither of var + X and var + Y overflow or underflow, or both of
 271           them do.  Then their difference is X - Y.
 272        b) var + X overflows, and var + Y does not.  Then the values of the
 273           expressions are var + X - M and var + Y, where M is the range of
 274           the type, and their difference is X - Y - M.
 275        c) var + Y underflows and var + X does not.  Then the values are
 276           var + X and var + Y + M, and their difference again is X - Y - M.
 277        Therefore, if the arithmetics in type does not overflow, then the
 278        bounds are (X - Y, X - Y), otherwise they are (X - Y - M, X - Y)
 279      Similarly, if X < Y, the bounds are either (X - Y, X - Y) or
 280      (X - Y, X - Y + M).  */
 281
 282   if (rel == 0)
 283     {
 284       mpz_set_ui (bnds->below, 0);
 285       mpz_set_ui (bnds->up, 0);
 286       return;
 287     }
 288
       /* M = 2^precision: the all-ones value of TYPE's precision, read as
          unsigned, plus one.  */
 289   mpz_init (m);
 290   wi::to_mpz (wi::minus_one (TYPE_PRECISION (type)), m, UNSIGNED);
 291   mpz_add_ui (m, m, 1);
       /* Start from the exact difference X - Y on both ends.  */
 292   mpz_sub (bnds->up, x, y);
 293   mpz_set (bnds->below, bnds->up);
 294
       /* When wrapping is possible, widen by M on the side where exactly
          one of the two sums may have wrapped.  */
 295   if (may_wrap)
 296     {
 297       if (rel > 0)
 298         mpz_sub (bnds->below, bnds->below, m);
 299       else
 300         mpz_add (bnds->up, bnds->up, m);
 301     }
 302
 303   mpz_clear (m);
 304 }
 305
 306 /* From condition C0 CMP C1 derives information regarding the
 307    difference of values of VARX + OFFX and VARY + OFFY, computed in TYPE,
 308    and stores it to BNDS.  BNDS is only ever tightened: BNDS->below may be
        raised and BNDS->up may be lowered, never the reverse.  OFFX and OFFY
        are not modified.  Nothing is changed if the condition is not of a
        handled form or does not relate VARX to VARY.  */
 309
 310 static void
 311 refine_bounds_using_guard (tree type, tree varx, mpz_t offx,
 312                            tree vary, mpz_t offy,
 313                            tree c0, enum tree_code cmp, tree c1,
 314                            bounds *bnds)
 315 {
 316   tree varc0, varc1, tmp, ctype;
 317   mpz_t offc0, offc1, loffx, loffy, bnd;
 318   bool lbound = false;
 319   bool no_wrap = nowrap_type_p (type);
 320   bool x_ok, y_ok;
 321
       /* First filter the comparison code.  Every path that leaves this
          switch through "break" has an ordering comparison in CMP; all the
          "return" paths run before any mpz_t has been initialized, so they
          need no cleanup.  */
 322   switch (cmp)
 323     {
 324     case LT_EXPR:
 325     case LE_EXPR:
 326     case GT_EXPR:
 327     case GE_EXPR:
 328       STRIP_SIGN_NOPS (c0);
 329       STRIP_SIGN_NOPS (c1);
 330       ctype = TREE_TYPE (c0);
 331       if (!useless_type_conversion_p (ctype, type))
 332         return;
 333
 334       break;
 335
 336     case EQ_EXPR:
 337       /* We could derive quite precise information from EQ_EXPR, however, such
 338          a guard is unlikely to appear, so we do not bother with handling
 339          it.  */
 340       return;
 341
 342     case NE_EXPR:
 343       /* NE_EXPR comparisons do not contain much of useful information, except for
 344          special case of comparing with the bounds of the type.  */
 345       if (TREE_CODE (c1) != INTEGER_CST
 346           || !INTEGRAL_TYPE_P (type))
 347         return;
 348
 349       /* Ensure that the condition speaks about an expression in the same type
 350          as X and Y.  */
 351       ctype = TREE_TYPE (c0);
 352       if (TYPE_PRECISION (ctype) != TYPE_PRECISION (type))
 353         return;
 354       c0 = fold_convert (type, c0);
 355       c1 = fold_convert (type, c1);
 356
           /* C0 != minimum of TYPE is the same as C0 > minimum.  */
 357       if (TYPE_MIN_VALUE (type)
 358           && operand_equal_p (c1, TYPE_MIN_VALUE (type), 0))
 359         {
 360           cmp = GT_EXPR;
 361           break;
 362         }
           /* C0 != maximum of TYPE is the same as C0 < maximum.  */
 363       if (TYPE_MAX_VALUE (type)
 364           && operand_equal_p (c1, TYPE_MAX_VALUE (type), 0))
 365         {
 366           cmp = LT_EXPR;
 367           break;
 368         }
 369
 370       return;
 371     default:
 372       return;
 373     }
 374
 375   mpz_init (offc0);
 376   mpz_init (offc1);
 377   split_to_var_and_offset (expand_simple_operations (c0), &varc0, offc0);
 378   split_to_var_and_offset (expand_simple_operations (c1), &varc1, offc1);
 379
 380   /* We are only interested in comparisons of expressions based on VARX and
 381      VARY.  TODO -- we might also be able to derive some bounds from
 382      expressions containing just one of the variables.  */
 383
       /* If VARX appears on the right-hand side of the guard, mirror the
          guard so that it appears on the left.  */
 384   if (operand_equal_p (varx, varc1, 0))
 385     {
 386       tmp = varc0; varc0 = varc1; varc1 = tmp;
 387       mpz_swap (offc0, offc1);
 388       cmp = swap_tree_comparison (cmp);
 389     }
 390
 391   if (!operand_equal_p (varx, varc0, 0)
 392       || !operand_equal_p (vary, varc1, 0))
 393     goto end;
 394
       /* Local copies of the offsets, so that the swap below leaves the
          caller's OFFX and OFFY untouched.  */
 395   mpz_init_set (loffx, offx);
 396   mpz_init_set (loffy, offy);
 397
       /* Reduce > and >= to < and <= by exchanging the roles of X and Y.
          The bound computed below then limits Y - X from above, which after
          negation is a lower bound on X - Y; LBOUND records this.  */
 398   if (cmp == GT_EXPR || cmp == GE_EXPR)
 399     {
 400       tmp = varx; varx = vary; vary = tmp;
 401       mpz_swap (offc0, offc1);
 402       mpz_swap (loffx, loffy);
 403       cmp = swap_tree_comparison (cmp);
 404       lbound = true;
 405     }
 406
 407   /* If there is no overflow, the condition implies that
 408
 409      (VARX + OFFX) cmp (VARY + OFFY) + (OFFX - OFFY + OFFC1 - OFFC0).
 410
 411      The overflows and underflows may complicate things a bit; each
 412      overflow decreases the appropriate offset by M, and underflow
 413      increases it by M.  The above inequality would not necessarily be
 414      true if
 415
 416      -- VARX + OFFX underflows and VARX + OFFC0 does not, or
 417         VARX + OFFC0 overflows, but VARX + OFFX does not.
 418         This may only happen if OFFX < OFFC0.
 419      -- VARY + OFFY overflows and VARY + OFFC1 does not, or
 420         VARY + OFFC1 underflows and VARY + OFFY does not.
 421         This may only happen if OFFY > OFFC1.  */
 422
 423   if (no_wrap)
 424     {
 425       x_ok = true;
 426       y_ok = true;
 427     }
 428   else
 429     {
 430       x_ok = (integer_zerop (varx)
 431               || mpz_cmp (loffx, offc0) >= 0);
 432       y_ok = (integer_zerop (vary)
 433               || mpz_cmp (loffy, offc1) <= 0);
 434     }
 435
 436   if (x_ok && y_ok)
 437     {
           /* BND = OFFX - OFFY + OFFC1 - OFFC0, the constant from the
              inequality above.  */
 438       mpz_init (bnd);
 439       mpz_sub (bnd, loffx, loffy);
 440       mpz_add (bnd, bnd, offc1);
 441       mpz_sub (bnd, bnd, offc0);
 442
           /* A strict comparison of integers is one tighter.  */
 443       if (cmp == LT_EXPR)
 444         mpz_sub_ui (bnd, bnd, 1);
 445
           /* Install the new bound only if it improves on the current
              one.  */
 446       if (lbound)
 447         {
 448           mpz_neg (bnd, bnd);
 449           if (mpz_cmp (bnds->below, bnd) < 0)
 450             mpz_set (bnds->below, bnd);
 451         }
 452       else
 453         {
 454           if (mpz_cmp (bnd, bnds->up) < 0)
 455             mpz_set (bnds->up, bnd);
 456         }
 457       mpz_clear (bnd);
 458     }
 459
 460   mpz_clear (loffx);
 461   mpz_clear (loffy);
       /* Reached directly by the "goto end" above, at which point LOFFX and
          LOFFY have not been initialized yet; only OFFC0/OFFC1 are live.  */
 462 end:
 463   mpz_clear (offc0);
 464   mpz_clear (offc1);
 465 }
 466
 467 /* Stores the bounds on the value of the expression X - Y in LOOP to BNDS.
 468    The subtraction is considered to be performed in arbitrary precision,
 469    without overflows.
 470
 471    We do not attempt to be too clever regarding the value ranges of X and
 472    Y; most of the time, they are just integers or ssa names offsetted by
 473    integer.  However, we try to use the information contained in the
 474    comparisons before the loop (usually created by loop header copying).

        This function calls mpz_init on BNDS->below and BNDS->up itself, so
        BNDS must not already hold initialized values.  The type used for the
        analysis is the type of X as passed in, taken before sign-changing
        conversions are stripped from X and Y.  */
 475
 476 static void
 477 bound_difference (struct loop *loop, tree x, tree y, bounds *bnds)
 478 {
 479   tree type = TREE_TYPE (x);
 480   tree varx, vary;
 481   mpz_t offx, offy;
 482   mpz_t minx, maxx, miny, maxy;
 483   int cnt = 0;
 484   edge e;
 485   basic_block bb;
 486   tree c0, c1;
 487   gimple cond;
 488   enum tree_code cmp;
 489
 490   /* Get rid of unnecessary casts, but preserve the value of
 491      the expressions.  */
 492   STRIP_SIGN_NOPS (x);
 493   STRIP_SIGN_NOPS (y);
 494
 495   mpz_init (bnds->below);
 496   mpz_init (bnds->up);
 497   mpz_init (offx);
 498   mpz_init (offy);
 499   split_to_var_and_offset (x, &varx, offx);
 500   split_to_var_and_offset (y, &vary, offy);
 501
 502   if (!integer_zerop (varx)
 503       && operand_equal_p (varx, vary, 0))
 504     {
 505       /* Special case VARX == VARY -- we just need to compare the
 506          offsets.  The matters are a bit more complicated in the
 507          case addition of offsets may wrap.  */
 508       bound_difference_of_offsetted_base (type, offx, offy, bnds);
 509     }
 510   else
 511     {
 512       /* Otherwise, use the value ranges to determine the initial
 513          estimates on below and up.  */
 514       mpz_init (minx);
 515       mpz_init (maxx);
 516       mpz_init (miny);
 517       mpz_init (maxy);
 518       determine_value_range (loop, type, varx, offx, minx, maxx);
 519       determine_value_range (loop, type, vary, offy, miny, maxy);
 520
           /* X - Y is smallest for the least X and greatest Y, and largest
              for the greatest X and least Y.  */
 521       mpz_sub (bnds->below, minx, maxy);
 522       mpz_sub (bnds->up, maxx, miny);
 523       mpz_clear (minx);
 524       mpz_clear (maxx);
 525       mpz_clear (miny);
 526       mpz_clear (maxy);
 527     }
 528
 529   /* If both X and Y are constants, we cannot get any more precise.  */
 530   if (integer_zerop (varx) && integer_zerop (vary))
 531     goto end;
 532
 533   /* Now walk the dominators of the loop header and use the entry
 534      guards to refine the estimates.  */
 535   for (bb = loop->header;
 536        bb != ENTRY_BLOCK_PTR_FOR_FN (cfun) && cnt < MAX_DOMINATORS_TO_WALK;
 537        bb = get_immediate_dominator (CDI_DOMINATORS, bb))
 538     {
           /* Only a block with exactly one predecessor, entered over the
              true or false edge of a condition, carries a guard that is
              known to hold.  Blocks skipped here do not count towards
              CNT.  */
 539       if (!single_pred_p (bb))
 540         continue;
 541       e = single_pred_edge (bb);
 542
 543       if (!(e->flags & (EDGE_TRUE_VALUE | EDGE_FALSE_VALUE)))
 544         continue;
 545
 546       cond = last_stmt (e->src);
 547       c0 = gimple_cond_lhs (cond);
 548       cmp = gimple_cond_code (cond);
 549       c1 = gimple_cond_rhs (cond);
 550
           /* On the false edge it is the negated condition that holds.  */
 551       if (e->flags & EDGE_FALSE_VALUE)
 552         cmp = invert_tree_comparison (cmp, false);
 553
 554       refine_bounds_using_guard (type, varx, offx, vary, offy,
 555                                  c0, cmp, c1, bnds);
 556       ++cnt;
 557     }
 558
       /* The fields of BNDS deliberately stay initialized; they hold the
          result.  Only the local offsets are released.  */
 559 end:
 560   mpz_clear (offx);
 561   mpz_clear (offy);
 562 }
 563
 564 /* Update the bounds in BNDS that restrict the value of X to the bounds
 565    that restrict the value of X + DELTA.  X can be obtained as a
 566    difference of two values in TYPE.  DELTA is interpreted as signed.
        After the shift the bounds are clamped to the interval
        [-(2^p - 1), 2^p - 1], where p is the precision of TYPE.  */
 567
 568 static void
 569 bounds_add (bounds *bnds, const widest_int &delta, tree type)
 570 {
 571   mpz_t mdelta, max;
 572
 573   mpz_init (mdelta);
 574   wi::to_mpz (delta, mdelta, SIGNED);
 575
       /* MAX = all ones in the precision of TYPE, read as unsigned.  */
 576   mpz_init (max);
 577   wi::to_mpz (wi::minus_one (TYPE_PRECISION (type)), max, UNSIGNED);
 578
 579   mpz_add (bnds->up, bnds->up, mdelta);
 580   mpz_add (bnds->below, bnds->below, mdelta);
 581
 582   if (mpz_cmp (bnds->up, max) > 0)
 583     mpz_set (bnds->up, max);
 584
       /* Reuse MAX, negated, as the lower clamp.  */
 585   mpz_neg (max, max);
 586   if (mpz_cmp (bnds->below, max) < 0)
 587     mpz_set (bnds->below, max);
 588
 589   mpz_clear (mdelta);
 590   mpz_clear (max);
 591 }
 592
 593 /* Update the bounds in BNDS that restrict the value of X to the bounds
 594    that restrict the value of -X.  That is, [BELOW, UP] becomes
        [-UP, -BELOW].  BNDS is modified in place.  */
 595
 596 static void
 597 bounds_negate (bounds *bnds)
 598 {
 599   mpz_t tmp;
 600
       /* Save the old upper bound; BNDS->up is overwritten before it is
          needed for the new lower bound.  */
 601   mpz_init_set (tmp, bnds->up);
 602   mpz_neg (bnds->up, bnds->below);
 603   mpz_neg (bnds->below, tmp);
 604   mpz_clear (tmp);
 605 }
 606
 607 /* Returns inverse of X modulo 2^s, where MASK = 2^s-1.  X and MASK must
        be integer constants; an inverse exists only for odd X (the caller in
        number_of_iterations_ne first shifts out the trailing zero bits of
        the step).

        With CTR = floor (log2 (MASK)) = s - 1, each loop below multiplies
        the result by X, X^2, X^4, ... over CTR iterations, which yields
        X^(2^CTR - 1).  For odd X, X^(2^CTR) is 1 modulo 2^s, so this power
        is the inverse once reduced by MASK.  */
 608
 609 static tree
 610 inverse (tree x, tree mask)
 611 {
 612   tree type = TREE_TYPE (x);
 613   tree rslt;
 614   unsigned ctr = tree_floor_log2 (mask);
 615
       /* Fast path: do the arithmetic directly on host integers.  Unsigned
          wrap-around is harmless because the result is masked at the end.  */
 616   if (TYPE_PRECISION (type) <= HOST_BITS_PER_WIDE_INT)
 617     {
 618       unsigned HOST_WIDE_INT ix;
 619       unsigned HOST_WIDE_INT imask;
 620       unsigned HOST_WIDE_INT irslt = 1;
 621
 622       gcc_assert (cst_and_fits_in_hwi (x));
 623       gcc_assert (cst_and_fits_in_hwi (mask));
 624
 625       ix = int_cst_value (x);
 626       imask = int_cst_value (mask);
 627
 628       for (; ctr; ctr--)
 629         {
 630           irslt *= ix;
 631           ix *= ix;
 632         }
 633       irslt &= imask;
 634
 635       rslt = build_int_cst_type (type, irslt);
 636     }
 637   else
 638     {
           /* Same computation on constant trees for wider types.  */
 639       rslt = build_int_cst (type, 1);
 640       for (; ctr; ctr--)
 641         {
 642           rslt = int_const_binop (MULT_EXPR, rslt, x);
 643           x = int_const_binop (MULT_EXPR, x, x);
 644         }
 645       rslt = int_const_binop (BIT_AND_EXPR, rslt, mask);
 646     }
 647
 648   return rslt;
 649 }
 650
 651 /* Derives the upper bound BND on the number of executions of loop with exit
 652    condition S * i <> C.  If NO_OVERFLOW is true, then the control variable of
 653    the loop does not overflow.  EXIT_MUST_BE_TAKEN is true if we are guaranteed
 654    that the loop ends through this exit, i.e., the induction variable ever
 655    reaches the value of C.
 656
 657    The value C is equal to final - base, where final and base are the final and
 658    initial value of the actual induction variable in the analysed loop.  BNDS
 659    bounds the value of this difference when computed in signed type with
 660    unbounded range, while the computation of C is performed in an unsigned
 661    type with the range matching the range of the type of the induction variable.
 662    In particular, BNDS.up contains an upper bound on C in the following cases:
 663    -- if the iv must reach its final value without overflow, i.e., if
 664       NO_OVERFLOW && EXIT_MUST_BE_TAKEN is true, or
 665    -- if final >= base, which we know to hold when BNDS.below >= 0.

        BND must already be initialized by the caller; BNDS is only read.  */
 666
 667 static void
 668 number_of_iterations_ne_max (mpz_t bnd, bool no_overflow, tree c, tree s,
 669                              bounds *bnds, bool exit_must_be_taken)
 670 {
 671   widest_int max;
 672   mpz_t d;
 673   tree type = TREE_TYPE (c);
       /* Evaluated from the flags as passed in, before the block below may
          force both of them to true.  */
 674   bool bnds_u_valid = ((no_overflow && exit_must_be_taken)
 675                        || mpz_sgn (bnds->below) >= 0);
 676
 677   if (integer_onep (s)
 678       || (TREE_CODE (c) == INTEGER_CST
 679           && TREE_CODE (s) == INTEGER_CST
 680           && wi::mod_trunc (c, s, TYPE_SIGN (type)) == 0)
 681       || (TYPE_OVERFLOW_UNDEFINED (type)
 682           && multiple_of_p (type, c, s)))
 683     {
 684       /* If C is an exact multiple of S, then its value will be reached before
 685          the induction variable overflows (unless the loop is exited in some
 686          other way before).  Note that the actual induction variable in the
 687          loop (which ranges from base to final instead of from 0 to C) may
 688          overflow, in which case BNDS.up will not be giving a correct upper
 689          bound on C; thus, BNDS_U_VALID had to be computed in advance.  */
 690       no_overflow = true;
 691       exit_must_be_taken = true;
 692     }
 693
 694   /* If the induction variable can overflow, the number of iterations is at
 695      most the period of the control variable (or infinite, but in that case
 696      the whole # of iterations analysis will fail).  */
 697   if (!no_overflow)
 698     {
           /* The mask has (precision - number of trailing zero bits of S)
              bits.  */
 699       max = wi::mask <widest_int> (TYPE_PRECISION (type) - wi::ctz (s), false);
 700       wi::to_mpz (max, bnd, UNSIGNED);
 701       return;
 702     }
 703
 704   /* Now we know that the induction variable does not overflow, so the loop
 705      iterates at most (range of type / S) times.  */
 706   wi::to_mpz (wi::minus_one (TYPE_PRECISION (type)), bnd, UNSIGNED);
 707
 708   /* If the induction variable is guaranteed to reach the value of C before
 709      overflow, ... */
 710   if (exit_must_be_taken)
 711     {
 712       /* ... then we can strengthen this to C / S, and possibly we can use
 713          the upper bound on C given by BNDS.  */
 714       if (TREE_CODE (c) == INTEGER_CST)
 715         wi::to_mpz (c, bnd, UNSIGNED);
 716       else if (bnds_u_valid)
 717         mpz_set (bnd, bnds->up);
 718     }
 719
       /* BND currently holds an upper bound on C (or the range of the type);
          dividing by S, rounding down, turns it into an iteration count.  */
 720   mpz_init (d);
 721   wi::to_mpz (s, d, UNSIGNED);
 722   mpz_fdiv_q (bnd, bnd, d);
 723   mpz_clear (d);
 724 }
 725
 726 /* Determines number of iterations of loop whose ending condition
 727    is IV <> FINAL.  TYPE is the type of the iv.  The number of
 728    iterations is stored to NITER.  EXIT_MUST_BE_TAKEN is true if
 729    we know that the exit must be taken eventually, i.e., that the IV
 730    ever reaches the value FINAL (we derived this earlier, and possibly set
 731    NITER->assumptions to make sure this is the case).  BNDS contains the
 732    bounds on the difference FINAL - IV->base.

        BNDS is negated in place when the step of IV is negative.  The fields
        control, bound, cmp, max and niter of NITER are always written;
        NITER->assumptions may be strengthened.  Every path through the
        visible code returns true.  */
 733
 734 static bool
 735 number_of_iterations_ne (tree type, affine_iv *iv, tree final,
 736                          struct tree_niter_desc *niter, bool exit_must_be_taken,
 737                          bounds *bnds)
 738 {
 739   tree niter_type = unsigned_type_for (type);
 740   tree s, c, d, bits, assumption, tmp, bound;
 741   mpz_t max;
 742
 743   niter->control = *iv;
 744   niter->bound = final;
 745   niter->cmp = NE_EXPR;
 746
 747   /* Rearrange the terms so that we get inequality S * i <> C, with S
 748      positive.  Also cast everything to the unsigned type.  If IV does
 749      not overflow, BNDS bounds the value of C.  Also, this is the
 750      case if the computation |FINAL - IV->base| does not overflow, i.e.,
 751      if BNDS->below in the result is nonnegative.  */
 752   if (tree_int_cst_sign_bit (iv->step))
 753     {
           /* Negative step: S = -step and C = base - final, so BNDS has to
              describe base - final as well.  */
 754       s = fold_convert (niter_type,
 755                         fold_build1 (NEGATE_EXPR, type, iv->step));
 756       c = fold_build2 (MINUS_EXPR, niter_type,
 757                        fold_convert (niter_type, iv->base),
 758                        fold_convert (niter_type, final));
 759       bounds_negate (bnds);
 760     }
 761   else
 762     {
 763       s = fold_convert (niter_type, iv->step);
 764       c = fold_build2 (MINUS_EXPR, niter_type,
 765                        fold_convert (niter_type, final),
 766                        fold_convert (niter_type, iv->base));
 767     }
 768
       /* Record the upper bound on the iteration count, computed as an
          mpz_t and converted back to a value of NITER_TYPE.  */
 769   mpz_init (max);
 770   number_of_iterations_ne_max (max, iv->no_overflow, c, s, bnds,
 771                                exit_must_be_taken);
 772   niter->max = widest_int::from (wi::from_mpz (niter_type, max, false),
 773                                  TYPE_SIGN (niter_type));
 774   mpz_clear (max);
 775
 776   /* First the trivial cases -- when the step is 1.  */
 777   if (integer_onep (s))
 778     {
 779       niter->niter = c;
 780       return true;
 781     }
 782
 783   /* Let nsd (step, size of mode) = d.  If d does not divide c, the loop
 784      is infinite.  Otherwise, the number of iterations is
 785      (inverse(s/d) * (c/d)) mod (size of mode/d).  */
       /* BITS is the number of trailing zero bits of S, so D below is
          1 << BITS; BOUND is a mask of the low (precision - BITS) bits.  */
 786   bits = num_ending_zeros (s);
 787   bound = build_low_bits_mask (niter_type,
 788                                (TYPE_PRECISION (niter_type)
 789                                 - tree_to_uhwi (bits)));
 790
 791   d = fold_binary_to_constant (LSHIFT_EXPR, niter_type,
 792                                build_int_cst (niter_type, 1), bits);
       /* S becomes S / D, which is odd and therefore invertible.  */
 793   s = fold_binary_to_constant (RSHIFT_EXPR, niter_type, s, bits);
 794
 795   if (!exit_must_be_taken)
 796     {
 797       /* If we cannot assume that the exit is taken eventually, record the
 798          assumptions for divisibility of c.  */
 799       assumption = fold_build2 (FLOOR_MOD_EXPR, niter_type, c, d);
 800       assumption = fold_build2 (EQ_EXPR, boolean_type_node,
 801                                 assumption, build_int_cst (niter_type, 0));
           /* An assumption that folded to constant true adds nothing.  */
 802       if (!integer_nonzerop (assumption))
 803         niter->assumptions = fold_build2 (TRUTH_AND_EXPR, boolean_type_node,
 804                                           niter->assumptions, assumption);
 805     }
 806
       /* niter = ((C / D) * inverse (S / D)) & BOUND.  */
 807   c = fold_build2 (EXACT_DIV_EXPR, niter_type, c, d);
 808   tmp = fold_build2 (MULT_EXPR, niter_type, c, inverse (s, bound));
 809   niter->niter = fold_build2 (BIT_AND_EXPR, niter_type, tmp, bound);
 810   return true;
 811 }
 812
 813 /* Checks whether we can determine the final value of the control variable
 814    of the loop with ending condition IV0 < IV1 (computed in TYPE).
 815    DELTA is the difference IV1->base - IV0->base, STEP is the absolute value
 816    of the step.  The assumptions necessary to ensure that the computation
 817    of the final value does not overflow are recorded in NITER.  If we
 818    find the final value, we adjust DELTA and return TRUE.  Otherwise
 819    we return false.  BNDS bounds the value of IV1->base - IV0->base,
 820    and will be updated by the same amount as DELTA.  EXIT_MUST_BE_TAKEN is
 821    true if we know that the exit must be taken eventually.  */
 822
 823 static bool
 824 number_of_iterations_lt_to_ne (tree type, affine_iv *iv0, affine_iv *iv1,
 825                                struct tree_niter_desc *niter,
 826                                tree *delta, tree step,
 827                                bool exit_must_be_taken, bounds *bnds)
 828 {
 829   tree niter_type = TREE_TYPE (step);
 830   tree mod = fold_build2 (FLOOR_MOD_EXPR, niter_type, *delta, step);
 831   tree tmod;
 832   mpz_t mmod;
 833   tree assumption = boolean_true_node, bound, noloop;
 834   bool ret = false, fv_comp_no_overflow;
 835   tree type1 = type;
 836   if (POINTER_TYPE_P (type))
 837     type1 = sizetype;
 838
 839   if (TREE_CODE (mod) != INTEGER_CST)
 840     return false;
 841   if (integer_nonzerop (mod))
 842     mod = fold_build2 (MINUS_EXPR, niter_type, step, mod);
 843   tmod = fold_convert (type1, mod);
 844
 845   mpz_init (mmod);
 846   wi::to_mpz (mod, mmod, UNSIGNED);
 847   mpz_neg (mmod, mmod);
 848
 849   /* If the induction variable does not overflow and the exit is taken,
 850      then the computation of the final value does not overflow.  This is
 851      also obviously the case if the new final value is equal to the
 852      current one.  Finally, we postulate this for pointer type variables,
 853      as the code cannot rely on the object to that the pointer points being
 854      placed at the end of the address space (and more pragmatically,
 855      TYPE_{MIN,MAX}_VALUE is not defined for pointers).  */
 856   if (integer_zerop (mod) || POINTER_TYPE_P (type))
 857     fv_comp_no_overflow = true;
 858   else if (!exit_must_be_taken)
 859     fv_comp_no_overflow = false;
 860   else
 861     fv_comp_no_overflow =
 862             (iv0->no_overflow && integer_nonzerop (iv0->step))
 863             || (iv1->no_overflow && integer_nonzerop (iv1->step));
 864
 865   if (integer_nonzerop (iv0->step))
 866     {
 867       /* The final value of the iv is iv1->base + MOD, assuming that this
 868          computation does not overflow, and that
 869          iv0->base <= iv1->base + MOD.  */
 870       if (!fv_comp_no_overflow)
 871         {
 872           bound = fold_build2 (MINUS_EXPR, type1,
 873                                TYPE_MAX_VALUE (type1), tmod);
 874           assumption = fold_build2 (LE_EXPR, boolean_type_node,
 875                                     iv1->base, bound);
 876           if (integer_zerop (assumption))
 877             goto end;
 878         }
 879       if (mpz_cmp (mmod, bnds->below) < 0)
 880         noloop = boolean_false_node;
 881       else if (POINTER_TYPE_P (type))
 882         noloop = fold_build2 (GT_EXPR, boolean_type_node,
 883                               iv0->base,
 884                               fold_build_pointer_plus (iv1->base, tmod));
 885       else
 886         noloop = fold_build2 (GT_EXPR, boolean_type_node,
 887                               iv0->base,
 888                               fold_build2 (PLUS_EXPR, type1,
 889                                            iv1->base, tmod));
 890     }
 891   else
 892     {
 893       /* The final value of the iv is iv0->base - MOD, assuming that this
 894          computation does not overflow, and that
 895          iv0->base - MOD <= iv1->base. */
 896       if (!fv_comp_no_overflow)
 897         {
 898           bound = fold_build2 (PLUS_EXPR, type1,
 899                                TYPE_MIN_VALUE (type1), tmod);
 900           assumption = fold_build2 (GE_EXPR, boolean_type_node,
 901                                     iv0->base, bound);
 902           if (integer_zerop (assumption))
 903             goto end;
 904         }
 905       if (mpz_cmp (mmod, bnds->below) < 0)
 906         noloop = boolean_false_node;
 907       else if (POINTER_TYPE_P (type))
 908         noloop = fold_build2 (GT_EXPR, boolean_type_node,
 909                               fold_build_pointer_plus (iv0->base,
 910                                                        fold_build1 (NEGATE_EXPR,
 911                                                                     type1, tmod)),
 912                               iv1->base);
 913       else
 914         noloop = fold_build2 (GT_EXPR, boolean_type_node,
 915                               fold_build2 (MINUS_EXPR, type1,
 916                                            iv0->base, tmod),
 917                               iv1->base);
 918     }
 919
 920   if (!integer_nonzerop (assumption))
 921     niter->assumptions = fold_build2 (TRUTH_AND_EXPR, boolean_type_node,
 922                                       niter->assumptions,
 923                                       assumption);
 924   if (!integer_zerop (noloop))
 925     niter->may_be_zero = fold_build2 (TRUTH_OR_EXPR, boolean_type_node,
 926                                       niter->may_be_zero,
 927                                       noloop);
 928   bounds_add (bnds, wi::to_widest (mod), type);
 929   *delta = fold_build2 (PLUS_EXPR, niter_type, *delta, mod);
 930
 931   ret = true;
 932 end:
 933   mpz_clear (mmod);
 934   return ret;
 935 }
 936
 937 /* Add assertions to NITER that ensure that the control variable of the loop
 938    with ending condition IV0 < IV1 does not overflow.  Types of IV0 and IV1
 939    are TYPE.  Returns false if we can prove that there is an overflow, true
 940    otherwise.  STEP is the absolute value of the step.  */
 941
 942 static bool
 943 assert_no_overflow_lt (tree type, affine_iv *iv0, affine_iv *iv1,
 944                        struct tree_niter_desc *niter, tree step)
 945 {
 946   tree bound, d, assumption, diff;
 947   tree niter_type = TREE_TYPE (step);
 948
 949   if (integer_nonzerop (iv0->step))
 950     {
 951       /* for (i = iv0->base; i < iv1->base; i += iv0->step) */
 952       if (iv0->no_overflow)
 953         return true;
 954
 955       /* If iv0->base is a constant, we can determine the last value before
 956          overflow precisely; otherwise we conservatively assume
 957          MAX - STEP + 1.  */
 958
 959       if (TREE_CODE (iv0->base) == INTEGER_CST)
 960         {
 961           d = fold_build2 (MINUS_EXPR, niter_type,
 962                            fold_convert (niter_type, TYPE_MAX_VALUE (type)),
 963                            fold_convert (niter_type, iv0->base));
 964           diff = fold_build2 (FLOOR_MOD_EXPR, niter_type, d, step);
 965         }
 966       else
 967         diff = fold_build2 (MINUS_EXPR, niter_type, step,
 968                             build_int_cst (niter_type, 1));
 969       bound = fold_build2 (MINUS_EXPR, type,
 970                            TYPE_MAX_VALUE (type), fold_convert (type, diff));
 971       assumption = fold_build2 (LE_EXPR, boolean_type_node,
 972                                 iv1->base, bound);
 973     }
 974   else
 975     {
 976       /* for (i = iv1->base; i > iv0->base; i += iv1->step) */
 977       if (iv1->no_overflow)
 978         return true;
 979
 980       if (TREE_CODE (iv1->base) == INTEGER_CST)
 981         {
 982           d = fold_build2 (MINUS_EXPR, niter_type,
 983                            fold_convert (niter_type, iv1->base),
 984                            fold_convert (niter_type, TYPE_MIN_VALUE (type)));
 985           diff = fold_build2 (FLOOR_MOD_EXPR, niter_type, d, step);
 986         }
 987       else
 988         diff = fold_build2 (MINUS_EXPR, niter_type, step,
 989                             build_int_cst (niter_type, 1));
 990       bound = fold_build2 (PLUS_EXPR, type,
 991                            TYPE_MIN_VALUE (type), fold_convert (type, diff));
 992       assumption = fold_build2 (GE_EXPR, boolean_type_node,
 993                                 iv0->base, bound);
 994     }
 995
 996   if (integer_zerop (assumption))
 997     return false;
 998   if (!integer_nonzerop (assumption))
 999     niter->assumptions = fold_build2 (TRUTH_AND_EXPR, boolean_type_node,
1000                                       niter->assumptions, assumption);
1001
1002   iv0->no_overflow = true;
1003   iv1->no_overflow = true;
1004   return true;
1005 }
1006
1007 /* Add an assumption to NITER that a loop whose ending condition
1008    is IV0 < IV1 rolls.  TYPE is the type of the control iv.  BNDS
1009    bounds the value of IV1->base - IV0->base.  */
1010
1011 static void
1012 assert_loop_rolls_lt (tree type, affine_iv *iv0, affine_iv *iv1,
1013                       struct tree_niter_desc *niter, bounds *bnds)
1014 {
1015   tree assumption = boolean_true_node, bound, diff;
1016   tree mbz, mbzl, mbzr, type1;
1017   bool rolls_p, no_overflow_p;
1018   widest_int dstep;
1019   mpz_t mstep, max;
1020
1021   /* We are going to compute the number of iterations as
1022      (iv1->base - iv0->base + step - 1) / step, computed in the unsigned
1023      variant of TYPE.  This formula only works if
1024
1025      -step + 1 <= (iv1->base - iv0->base) <= MAX - step + 1
1026
1027      (where MAX is the maximum value of the unsigned variant of TYPE, and
1028      the computations in this formula are performed in full precision,
1029      i.e., without overflows).
1030
1031      Usually, for loops with exit condition iv0->base + step * i < iv1->base,
1032      we have a condition of the form iv0->base - step < iv1->base before the loop,
1033      and for loops iv0->base < iv1->base - step * i the condition
1034      iv0->base < iv1->base + step, due to loop header copying, which enable us
1035      to prove the lower bound.
1036
1037      The upper bound is more complicated.  Unless the expressions for initial
1038      and final value themselves contain enough information, we usually cannot
1039      derive it from the context.  */
1040
1041   /* First check whether the answer does not follow from the bounds we gathered
1042      before.  */
1043   if (integer_nonzerop (iv0->step))
1044     dstep = wi::to_widest (iv0->step);
1045   else
1046     {
1047       dstep = wi::sext (wi::to_widest (iv1->step), TYPE_PRECISION (type));
1048       dstep = -dstep;
1049     }
1050
1051   mpz_init (mstep);
1052   wi::to_mpz (dstep, mstep, UNSIGNED);
1053   mpz_neg (mstep, mstep);
1054   mpz_add_ui (mstep, mstep, 1);
1055
1056   rolls_p = mpz_cmp (mstep, bnds->below) <= 0;
1057
1058   mpz_init (max);
1059   wi::to_mpz (wi::minus_one (TYPE_PRECISION (type)), max, UNSIGNED);
1060   mpz_add (max, max, mstep);
1061   no_overflow_p = (mpz_cmp (bnds->up, max) <= 0
1062                    /* For pointers, only values lying inside a single object
1063                       can be compared or manipulated by pointer arithmetics.
1064                       Gcc in general does not allow or handle objects larger
1065                       than half of the address space, hence the upper bound
1066                       is satisfied for pointers.  */
1067                    || POINTER_TYPE_P (type));
1068   mpz_clear (mstep);
1069   mpz_clear (max);
1070
1071   if (rolls_p && no_overflow_p)
1072     return;
1073
1074   type1 = type;
1075   if (POINTER_TYPE_P (type))
1076     type1 = sizetype;
1077
1078   /* Now the hard part; we must formulate the assumption(s) as expressions, and
1079      we must be careful not to introduce overflow.  */
1080
1081   if (integer_nonzerop (iv0->step))
1082     {
1083       diff = fold_build2 (MINUS_EXPR, type1,
1084                           iv0->step, build_int_cst (type1, 1));
1085
1086       /* We need to know that iv0->base >= MIN + iv0->step - 1.  Since
1087          0 address never belongs to any object, we can assume this for
1088          pointers.  */
1089       if (!POINTER_TYPE_P (type))
1090         {
1091           bound = fold_build2 (PLUS_EXPR, type1,
1092                                TYPE_MIN_VALUE (type), diff);
1093           assumption = fold_build2 (GE_EXPR, boolean_type_node,
1094                                     iv0->base, bound);
1095         }
1096
1097       /* And then we can compute iv0->base - diff, and compare it with
1098          iv1->base.  */
1099       mbzl = fold_build2 (MINUS_EXPR, type1,
1100                           fold_convert (type1, iv0->base), diff);
1101       mbzr = fold_convert (type1, iv1->base);
1102     }
1103   else
1104     {
1105       diff = fold_build2 (PLUS_EXPR, type1,
1106                           iv1->step, build_int_cst (type1, 1));
1107
1108       if (!POINTER_TYPE_P (type))
1109         {
1110           bound = fold_build2 (PLUS_EXPR, type1,
1111                                TYPE_MAX_VALUE (type), diff);
1112           assumption = fold_build2 (LE_EXPR, boolean_type_node,
1113                                     iv1->base, bound);
1114         }
1115
1116       mbzl = fold_convert (type1, iv0->base);
1117       mbzr = fold_build2 (MINUS_EXPR, type1,
1118                           fold_convert (type1, iv1->base), diff);
1119     }
1120
1121   if (!integer_nonzerop (assumption))
1122     niter->assumptions = fold_build2 (TRUTH_AND_EXPR, boolean_type_node,
1123                                       niter->assumptions, assumption);
1124   if (!rolls_p)
1125     {
1126       mbz = fold_build2 (GT_EXPR, boolean_type_node, mbzl, mbzr);
1127       niter->may_be_zero = fold_build2 (TRUTH_OR_EXPR, boolean_type_node,
1128                                         niter->may_be_zero, mbz);
1129     }
1130 }
1131
1132 /* Determines number of iterations of loop whose ending condition
1133    is IV0 < IV1.  TYPE is the type of the iv.  The number of
1134    iterations is stored to NITER.  BNDS bounds the difference
1135    IV1->base - IV0->base.  EXIT_MUST_BE_TAKEN is true if we know
1136    that the exit must be taken eventually.  */
1137
1138 static bool
1139 number_of_iterations_lt (tree type, affine_iv *iv0, affine_iv *iv1,
1140                          struct tree_niter_desc *niter,
1141                          bool exit_must_be_taken, bounds *bnds)
1142 {
1143   tree niter_type = unsigned_type_for (type);
1144   tree delta, step, s;
1145   mpz_t mstep, tmp;
1146
1147   if (integer_nonzerop (iv0->step))
1148     {
1149       niter->control = *iv0;
1150       niter->cmp = LT_EXPR;
1151       niter->bound = iv1->base;
1152     }
1153   else
1154     {
1155       niter->control = *iv1;
1156       niter->cmp = GT_EXPR;
1157       niter->bound = iv0->base;
1158     }
1159
1160   delta = fold_build2 (MINUS_EXPR, niter_type,
1161                        fold_convert (niter_type, iv1->base),
1162                        fold_convert (niter_type, iv0->base));
1163
1164   /* First handle the special case that the step is +-1.  */
1165   if ((integer_onep (iv0->step) && integer_zerop (iv1->step))
1166       || (integer_all_onesp (iv1->step) && integer_zerop (iv0->step)))
1167     {
1168       /* for (i = iv0->base; i < iv1->base; i++)
1169
1170          or
1171
1172          for (i = iv1->base; i > iv0->base; i--).
1173
1174          In both cases # of iterations is iv1->base - iv0->base, assuming that
1175          iv1->base >= iv0->base.
1176
1177          First try to derive a lower bound on the value of
1178          iv1->base - iv0->base, computed in full precision.  If the difference
1179          is nonnegative, we are done, otherwise we must record the
1180          condition.  */
1181
1182       if (mpz_sgn (bnds->below) < 0)
1183         niter->may_be_zero = fold_build2 (LT_EXPR, boolean_type_node,
1184                                           iv1->base, iv0->base);
1185       niter->niter = delta;
1186       niter->max = widest_int::from (wi::from_mpz (niter_type, bnds->up, false),
1187                                      TYPE_SIGN (niter_type));
1188       niter->control.no_overflow = true;
1189       return true;
1190     }
1191
1192   if (integer_nonzerop (iv0->step))
1193     step = fold_convert (niter_type, iv0->step);
1194   else
1195     step = fold_convert (niter_type,
1196                          fold_build1 (NEGATE_EXPR, type, iv1->step));
1197
1198   /* If we can determine the final value of the control iv exactly, we can
1199      transform the condition to != comparison.  In particular, this will be
1200      the case if DELTA is constant.  */
1201   if (number_of_iterations_lt_to_ne (type, iv0, iv1, niter, &delta, step,
1202                                      exit_must_be_taken, bnds))
1203     {
1204       affine_iv zps;
1205
1206       zps.base = build_int_cst (niter_type, 0);
1207       zps.step = step;
1208       /* number_of_iterations_lt_to_ne will add assumptions that ensure that
1209          zps does not overflow.  */
1210       zps.no_overflow = true;
1211
1212       return number_of_iterations_ne (type, &zps, delta, niter, true, bnds);
1213     }
1214
1215   /* Make sure that the control iv does not overflow.  */
1216   if (!assert_no_overflow_lt (type, iv0, iv1, niter, step))
1217     return false;
1218
1219   /* We determine the number of iterations as (delta + step - 1) / step.  For
1220      this to work, we must know that iv1->base >= iv0->base - step + 1,
1221      otherwise the loop does not roll.  */
1222   assert_loop_rolls_lt (type, iv0, iv1, niter, bnds);
1223
1224   s = fold_build2 (MINUS_EXPR, niter_type,
1225                    step, build_int_cst (niter_type, 1));
1226   delta = fold_build2 (PLUS_EXPR, niter_type, delta, s);
1227   niter->niter = fold_build2 (FLOOR_DIV_EXPR, niter_type, delta, step);
1228
1229   mpz_init (mstep);
1230   mpz_init (tmp);
1231   wi::to_mpz (step, mstep, UNSIGNED);
1232   mpz_add (tmp, bnds->up, mstep);
1233   mpz_sub_ui (tmp, tmp, 1);
1234   mpz_fdiv_q (tmp, tmp, mstep);
1235   niter->max = widest_int::from (wi::from_mpz (niter_type, tmp, false),
1236                                  TYPE_SIGN (niter_type));
1237   mpz_clear (mstep);
1238   mpz_clear (tmp);
1239
1240   return true;
1241 }
1242
1243 /* Determines number of iterations of loop whose ending condition
1244    is IV0 <= IV1.  TYPE is the type of the iv.  The number of
1245    iterations is stored to NITER.  EXIT_MUST_BE_TAKEN is true if
1246    we know that this condition must eventually become false (we derived this
1247    earlier, and possibly set NITER->assumptions to make sure this
1248    is the case).  BNDS bounds the difference IV1->base - IV0->base.  */
1249
1250 static bool
1251 number_of_iterations_le (tree type, affine_iv *iv0, affine_iv *iv1,
1252                          struct tree_niter_desc *niter, bool exit_must_be_taken,
1253                          bounds *bnds)
1254 {
1255   tree assumption;
1256   tree type1 = type;
1257   if (POINTER_TYPE_P (type))
1258     type1 = sizetype;
1259
1260   /* Say that IV0 is the control variable.  Then IV0 <= IV1 iff
1261      IV0 < IV1 + 1, assuming that IV1 is not equal to the greatest
1262      value of the type.  This we must know anyway, since if it is
1263      equal to this value, the loop rolls forever.  We do not check
1264      this condition for pointer type ivs, as the code cannot rely on
1265      the object to that the pointer points being placed at the end of
1266      the address space (and more pragmatically, TYPE_{MIN,MAX}_VALUE is
1267      not defined for pointers).  */
1268
1269   if (!exit_must_be_taken && !POINTER_TYPE_P (type))
1270     {
1271       if (integer_nonzerop (iv0->step))
1272         assumption = fold_build2 (NE_EXPR, boolean_type_node,
1273                                   iv1->base, TYPE_MAX_VALUE (type));
1274       else
1275         assumption = fold_build2 (NE_EXPR, boolean_type_node,
1276                                   iv0->base, TYPE_MIN_VALUE (type));
1277
1278       if (integer_zerop (assumption))
1279         return false;
1280       if (!integer_nonzerop (assumption))
1281         niter->assumptions = fold_build2 (TRUTH_AND_EXPR, boolean_type_node,
1282                                           niter->assumptions, assumption);
1283     }
1284
1285   if (integer_nonzerop (iv0->step))
1286     {
1287       if (POINTER_TYPE_P (type))
1288         iv1->base = fold_build_pointer_plus_hwi (iv1->base, 1);
1289       else
1290         iv1->base = fold_build2 (PLUS_EXPR, type1, iv1->base,
1291                                  build_int_cst (type1, 1));
1292     }
1293   else if (POINTER_TYPE_P (type))
1294     iv0->base = fold_build_pointer_plus_hwi (iv0->base, -1);
1295   else
1296     iv0->base = fold_build2 (MINUS_EXPR, type1,
1297                              iv0->base, build_int_cst (type1, 1));
1298
1299   bounds_add (bnds, 1, type1);
1300
1301   return number_of_iterations_lt (type, iv0, iv1, niter, exit_must_be_taken,
1302                                   bnds);
1303 }
1304
1305 /* Dumps description of affine induction variable IV to FILE.  */
1306
1307 static void
1308 dump_affine_iv (FILE *file, affine_iv *iv)
1309 {
1310   if (!integer_zerop (iv->step))
1311     fprintf (file, "[");
1312
1313   print_generic_expr (dump_file, iv->base, TDF_SLIM);
1314
1315   if (!integer_zerop (iv->step))
1316     {
1317       fprintf (file, ", + , ");
1318       print_generic_expr (dump_file, iv->step, TDF_SLIM);
1319       fprintf (file, "]%s", iv->no_overflow ? "(no_overflow)" : "");
1320     }
1321 }
1322
1323 /* Determine the number of iterations according to condition (for staying
1324    inside loop) which compares two induction variables using comparison
1325    operator CODE.  The induction variable on left side of the comparison
1326    is IV0, the right-hand side is IV1.  Both induction variables must have
1327    type TYPE, which must be an integer or pointer type.  The steps of the
1328    ivs must be constants (or NULL_TREE, which is interpreted as constant zero).
1329
1330    LOOP is the loop whose number of iterations we are determining.
1331
1332    ONLY_EXIT is true if we are sure this is the only way the loop could be
1333    exited (including possibly non-returning function calls, exceptions, etc.)
1334    -- in this case we can use the information whether the control induction
1335    variables can overflow or not in a more efficient way.
1336
1337    if EVERY_ITERATION is true, we know the test is executed on every iteration.
1338
1339    The results (number of iterations and assumptions as described in
1340    comments at struct tree_niter_desc in tree-ssa-loop.h) are stored to NITER.
1341    Returns false if it fails to determine number of iterations, true if it
1342    was determined (possibly with some assumptions).  */
1343
1344 static bool
1345 number_of_iterations_cond (struct loop *loop,
1346                            tree type, affine_iv *iv0, enum tree_code code,
1347                            affine_iv *iv1, struct tree_niter_desc *niter,
1348                            bool only_exit, bool every_iteration)
1349 {
1350   bool exit_must_be_taken = false, ret;
1351   bounds bnds;
1352
1353   /* If the test is not executed every iteration, wrapping may make the test
1354      to pass again.
1355      TODO: the overflow case can be still used as unreliable estimate of upper
1356      bound.  But we have no API to pass it down to number of iterations code
1357      and, at present, it will not use it anyway.  */
1358   if (!every_iteration
1359       && (!iv0->no_overflow || !iv1->no_overflow
1360           || code == NE_EXPR || code == EQ_EXPR))
1361     return false;
1362
1363   /* The meaning of these assumptions is this:
1364      if !assumptions
1365        then the rest of information does not have to be valid
1366      if may_be_zero then the loop does not roll, even if
1367        niter != 0.  */
1368   niter->assumptions = boolean_true_node;
1369   niter->may_be_zero = boolean_false_node;
1370   niter->niter = NULL_TREE;
1371   niter->max = 0;
1372   niter->bound = NULL_TREE;
1373   niter->cmp = ERROR_MARK;
1374
1375   /* Make < comparison from > ones, and for NE_EXPR comparisons, ensure that
1376      the control variable is on lhs.  */
1377   if (code == GE_EXPR || code == GT_EXPR
1378       || (code == NE_EXPR && integer_zerop (iv0->step)))
1379     {
1380       SWAP (iv0, iv1);
1381       code = swap_tree_comparison (code);
1382     }
1383
1384   if (POINTER_TYPE_P (type))
1385     {
1386       /* Comparison of pointers is undefined unless both iv0 and iv1 point
1387          to the same object.  If they do, the control variable cannot wrap
1388          (as wrap around the bounds of memory will never return a pointer
1389          that would be guaranteed to point to the same object, even if we
1390          avoid undefined behavior by casting to size_t and back).  */
1391       iv0->no_overflow = true;
1392       iv1->no_overflow = true;
1393     }
1394
1395   /* If the control induction variable does not overflow and the only exit
1396      from the loop is the one that we analyze, we know it must be taken
1397      eventually.  */
1398   if (only_exit)
1399     {
1400       if (!integer_zerop (iv0->step) && iv0->no_overflow)
1401         exit_must_be_taken = true;
1402       else if (!integer_zerop (iv1->step) && iv1->no_overflow)
1403         exit_must_be_taken = true;
1404     }
1405
1406   /* We can handle the case when neither of the sides of the comparison is
1407      invariant, provided that the test is NE_EXPR.  This rarely occurs in
1408      practice, but it is simple enough to manage.  */
1409   if (!integer_zerop (iv0->step) && !integer_zerop (iv1->step))
1410     {
1411       tree step_type = POINTER_TYPE_P (type) ? sizetype : type;
1412       if (code != NE_EXPR)
1413         return false;
1414
1415       iv0->step = fold_binary_to_constant (MINUS_EXPR, step_type,
1416                                            iv0->step, iv1->step);
1417       iv0->no_overflow = false;
1418       iv1->step = build_int_cst (step_type, 0);
1419       iv1->no_overflow = true;
1420     }
1421
1422   /* If the result of the comparison is a constant,  the loop is weird.  More
1423      precise handling would be possible, but the situation is not common enough
1424      to waste time on it.  */
1425   if (integer_zerop (iv0->step) && integer_zerop (iv1->step))
1426     return false;
1427
1428   /* Ignore loops of while (i-- < 10) type.  */
1429   if (code != NE_EXPR)
1430     {
1431       if (iv0->step && tree_int_cst_sign_bit (iv0->step))
1432         return false;
1433
1434       if (!integer_zerop (iv1->step) && !tree_int_cst_sign_bit (iv1->step))
1435         return false;
1436     }
1437
1438   /* If the loop exits immediately, there is nothing to do.  */
1439   tree tem = fold_binary (code, boolean_type_node, iv0->base, iv1->base);
1440   if (tem && integer_zerop (tem))
1441     {
1442       niter->niter = build_int_cst (unsigned_type_for (type), 0);
1443       niter->max = 0;
1444       return true;
1445     }
1446
1447   /* OK, now we know we have a senseful loop.  Handle several cases, depending
1448      on what comparison operator is used.  */
1449   bound_difference (loop, iv1->base, iv0->base, &bnds);
1450
1451   if (dump_file && (dump_flags & TDF_DETAILS))
1452     {
1453       fprintf (dump_file,
1454                "Analyzing # of iterations of loop %d\n", loop->num);
1455
1456       fprintf (dump_file, "  exit condition ");
1457       dump_affine_iv (dump_file, iv0);
1458       fprintf (dump_file, " %s ",
1459                code == NE_EXPR ? "!="
1460                : code == LT_EXPR ? "<"
1461                : "<=");
1462       dump_affine_iv (dump_file, iv1);
1463       fprintf (dump_file, "\n");
1464
1465       fprintf (dump_file, "  bounds on difference of bases: ");
1466       mpz_out_str (dump_file, 10, bnds.below);
1467       fprintf (dump_file, " ... ");
1468       mpz_out_str (dump_file, 10, bnds.up);
1469       fprintf (dump_file, "\n");
1470     }
1471
1472   switch (code)
1473     {
1474     case NE_EXPR:
1475       gcc_assert (integer_zerop (iv1->step));
1476       ret = number_of_iterations_ne (type, iv0, iv1->base, niter,
1477                                      exit_must_be_taken, &bnds);
1478       break;
1479
1480     case LT_EXPR:
1481       ret = number_of_iterations_lt (type, iv0, iv1, niter, exit_must_be_taken,
1482                                      &bnds);
1483       break;
1484
1485     case LE_EXPR:
1486       ret = number_of_iterations_le (type, iv0, iv1, niter, exit_must_be_taken,
1487                                      &bnds);
1488       break;
1489
1490     default:
1491       gcc_unreachable ();
1492     }
1493
1494   mpz_clear (bnds.up);
1495   mpz_clear (bnds.below);
1496
1497   if (dump_file && (dump_flags & TDF_DETAILS))
1498     {
1499       if (ret)
1500         {
1501           fprintf (dump_file, "  result:\n");
1502           if (!integer_nonzerop (niter->assumptions))
1503             {
1504               fprintf (dump_file, "    under assumptions ");
1505               print_generic_expr (dump_file, niter->assumptions, TDF_SLIM);
1506               fprintf (dump_file, "\n");
1507             }
1508
1509           if (!integer_zerop (niter->may_be_zero))
1510             {
1511               fprintf (dump_file, "    zero if ");
1512               print_generic_expr (dump_file, niter->may_be_zero, TDF_SLIM);
1513               fprintf (dump_file, "\n");
1514             }
1515
1516           fprintf (dump_file, "    # of iterations ");
1517           print_generic_expr (dump_file, niter->niter, TDF_SLIM);
1518           fprintf (dump_file, ", bounded by ");
1519           print_decu (niter->max, dump_file);
1520           fprintf (dump_file, "\n");
1521         }
1522       else
1523         fprintf (dump_file, "  failed\n\n");
1524     }
1525   return ret;
1526 }
1527
1528 /* Substitute NEW for OLD in EXPR and fold the result.  */
1529
1530 static tree
1531 simplify_replace_tree (tree expr, tree old, tree new_tree)
1532 {
1533   unsigned i, n;
1534   tree ret = NULL_TREE, e, se;
1535
1536   if (!expr)
1537     return NULL_TREE;
1538
1539   /* Do not bother to replace constants.  */
1540   if (CONSTANT_CLASS_P (old))
1541     return expr;
1542
1543   if (expr == old
1544       || operand_equal_p (expr, old, 0))
1545     return unshare_expr (new_tree);
1546
1547   if (!EXPR_P (expr))
1548     return expr;
1549
1550   n = TREE_OPERAND_LENGTH (expr);
1551   for (i = 0; i < n; i++)
1552     {
1553       e = TREE_OPERAND (expr, i);
1554       se = simplify_replace_tree (e, old, new_tree);
1555       if (e == se)
1556         continue;
1557
1558       if (!ret)
1559         ret = copy_node (expr);
1560
1561       TREE_OPERAND (ret, i) = se;
1562     }
1563
1564   return (ret ? fold (ret) : expr);
1565 }
1566
1567 /* Expand definitions of ssa names in EXPR as long as they are simple
1568    enough, and return the new expression.  If STOP is specified, stop
1569    expanding if EXPR equals to it.  */
1570
1571 tree
1572 expand_simple_operations (tree expr, tree stop)
1573 {
1574   unsigned i, n;
1575   tree ret = NULL_TREE, e, ee, e1;
1576   enum tree_code code;
1577   gimple stmt;
1578
1579   if (expr == NULL_TREE)
1580     return expr;
1581
1582   if (is_gimple_min_invariant (expr))
1583     return expr;
1584
1585   code = TREE_CODE (expr);
1586   if (IS_EXPR_CODE_CLASS (TREE_CODE_CLASS (code)))
1587     {
1588       n = TREE_OPERAND_LENGTH (expr);
1589       for (i = 0; i < n; i++)
1590         {
1591           e = TREE_OPERAND (expr, i);
1592           ee = expand_simple_operations (e, stop);
1593           if (e == ee)
1594             continue;
1595
1596           if (!ret)
1597             ret = copy_node (expr);
1598
1599           TREE_OPERAND (ret, i) = ee;
1600         }
1601
1602       if (!ret)
1603         return expr;
1604
1605       fold_defer_overflow_warnings ();
1606       ret = fold (ret);
1607       fold_undefer_and_ignore_overflow_warnings ();
1608       return ret;
1609     }
1610
1611   /* Stop if it's not ssa name or the one we don't want to expand.  */
1612   if (TREE_CODE (expr) != SSA_NAME || expr == stop)
1613     return expr;
1614
1615   stmt = SSA_NAME_DEF_STMT (expr);
1616   if (gimple_code (stmt) == GIMPLE_PHI)
1617     {
1618       basic_block src, dest;
1619
1620       if (gimple_phi_num_args (stmt) != 1)
1621         return expr;
1622       e = PHI_ARG_DEF (stmt, 0);
1623
1624       /* Avoid propagating through loop exit phi nodes, which
1625          could break loop-closed SSA form restrictions.  */
1626       dest = gimple_bb (stmt);
1627       src = single_pred (dest);
1628       if (TREE_CODE (e) == SSA_NAME
1629           && src->loop_father != dest->loop_father)
1630         return expr;
1631
1632       return expand_simple_operations (e, stop);
1633     }
1634   if (gimple_code (stmt) != GIMPLE_ASSIGN)
1635     return expr;
1636
1637   /* Avoid expanding to expressions that contain SSA names that need
1638      to take part in abnormal coalescing.  */
1639   ssa_op_iter iter;
1640   FOR_EACH_SSA_TREE_OPERAND (e, stmt, iter, SSA_OP_USE)
1641     if (SSA_NAME_OCCURS_IN_ABNORMAL_PHI (e))
1642       return expr;
1643
1644   e = gimple_assign_rhs1 (stmt);
1645   code = gimple_assign_rhs_code (stmt);
1646   if (get_gimple_rhs_class (code) == GIMPLE_SINGLE_RHS)
1647     {
1648       if (is_gimple_min_invariant (e))
1649         return e;
1650
1651       if (code == SSA_NAME)
1652         return expand_simple_operations (e, stop);
1653
1654       return expr;
1655     }
1656
1657   switch (code)
1658     {
1659     CASE_CONVERT:
1660       /* Casts are simple.  */
1661       ee = expand_simple_operations (e, stop);
1662       return fold_build1 (code, TREE_TYPE (expr), ee);
1663
1664     case PLUS_EXPR:
1665     case MINUS_EXPR:
1666       if (ANY_INTEGRAL_TYPE_P (TREE_TYPE (expr))
1667           && TYPE_OVERFLOW_TRAPS (TREE_TYPE (expr)))
1668         return expr;
1669       /* Fallthru.  */
1670     case POINTER_PLUS_EXPR:
1671       /* And increments and decrements by a constant are simple.  */
1672       e1 = gimple_assign_rhs2 (stmt);
1673       if (!is_gimple_min_invariant (e1))
1674         return expr;
1675
1676       ee = expand_simple_operations (e, stop);
1677       return fold_build2 (code, TREE_TYPE (expr), ee, e1);
1678
1679     default:
1680       return expr;
1681     }
1682 }
1683
1684 /* Tries to simplify EXPR using the condition COND.  Returns the simplified
1685    expression (or EXPR unchanged, if no simplification was possible).  */
1686
1687 static tree
1688 tree_simplify_using_condition_1 (tree cond, tree expr)
1689 {
1690   bool changed;
1691   tree e, te, e0, e1, e2, notcond;
1692   enum tree_code code = TREE_CODE (expr);
1693
1694   if (code == INTEGER_CST)
1695     return expr;
1696
1697   if (code == TRUTH_OR_EXPR
1698       || code == TRUTH_AND_EXPR
1699       || code == COND_EXPR)
1700     {
1701       changed = false;
1702
1703       e0 = tree_simplify_using_condition_1 (cond, TREE_OPERAND (expr, 0));
1704       if (TREE_OPERAND (expr, 0) != e0)
1705         changed = true;
1706
1707       e1 = tree_simplify_using_condition_1 (cond, TREE_OPERAND (expr, 1));
1708       if (TREE_OPERAND (expr, 1) != e1)
1709         changed = true;
1710
1711       if (code == COND_EXPR)
1712         {
1713           e2 = tree_simplify_using_condition_1 (cond, TREE_OPERAND (expr, 2));
1714           if (TREE_OPERAND (expr, 2) != e2)
1715             changed = true;
1716         }
1717       else
1718         e2 = NULL_TREE;
1719
1720       if (changed)
1721         {
1722           if (code == COND_EXPR)
1723             expr = fold_build3 (code, boolean_type_node, e0, e1, e2);
1724           else
1725             expr = fold_build2 (code, boolean_type_node, e0, e1);
1726         }
1727
1728       return expr;
1729     }
1730
1731   /* In case COND is equality, we may be able to simplify EXPR by copy/constant
1732      propagation, and vice versa.  Fold does not handle this, since it is
1733      considered too expensive.  */
1734   if (TREE_CODE (cond) == EQ_EXPR)
1735     {
1736       e0 = TREE_OPERAND (cond, 0);
1737       e1 = TREE_OPERAND (cond, 1);
1738
1739       /* We know that e0 == e1.  Check whether we cannot simplify expr
1740          using this fact.  */
1741       e = simplify_replace_tree (expr, e0, e1);
1742       if (integer_zerop (e) || integer_nonzerop (e))
1743         return e;
1744
1745       e = simplify_replace_tree (expr, e1, e0);
1746       if (integer_zerop (e) || integer_nonzerop (e))
1747         return e;
1748     }
1749   if (TREE_CODE (expr) == EQ_EXPR)
1750     {
1751       e0 = TREE_OPERAND (expr, 0);
1752       e1 = TREE_OPERAND (expr, 1);
1753
1754       /* If e0 == e1 (EXPR) implies !COND, then EXPR cannot be true.  */
1755       e = simplify_replace_tree (cond, e0, e1);
1756       if (integer_zerop (e))
1757         return e;
1758       e = simplify_replace_tree (cond, e1, e0);
1759       if (integer_zerop (e))
1760         return e;
1761     }
1762   if (TREE_CODE (expr) == NE_EXPR)
1763     {
1764       e0 = TREE_OPERAND (expr, 0);
1765       e1 = TREE_OPERAND (expr, 1);
1766
1767       /* If e0 == e1 (!EXPR) implies !COND, then EXPR must be true.  */
1768       e = simplify_replace_tree (cond, e0, e1);
1769       if (integer_zerop (e))
1770         return boolean_true_node;
1771       e = simplify_replace_tree (cond, e1, e0);
1772       if (integer_zerop (e))
1773         return boolean_true_node;
1774     }
1775
1776   te = expand_simple_operations (expr);
1777
1778   /* Check whether COND ==> EXPR.  */
1779   notcond = invert_truthvalue (cond);
1780   e = fold_binary (TRUTH_OR_EXPR, boolean_type_node, notcond, te);
1781   if (e && integer_nonzerop (e))
1782     return e;
1783
1784   /* Check whether COND ==> not EXPR.  */
1785   e = fold_binary (TRUTH_AND_EXPR, boolean_type_node, cond, te);
1786   if (e && integer_zerop (e))
1787     return e;
1788
1789   return expr;
1790 }
1791
1792 /* Tries to simplify EXPR using the condition COND.  Returns the simplified
1793    expression (or EXPR unchanged, if no simplification was possible).
1794    Wrapper around tree_simplify_using_condition_1 that ensures that chains
1795    of simple operations in definitions of ssa names in COND are expanded,
1796    so that things like casts or incrementing the value of the bound before
1797    the loop do not cause us to fail.  */
1798
1799 static tree
1800 tree_simplify_using_condition (tree cond, tree expr)
1801 {
1802   cond = expand_simple_operations (cond);
1803
1804   return tree_simplify_using_condition_1 (cond, expr);
1805 }
1806
1807 /* Tries to simplify EXPR using the conditions on entry to LOOP.
1808    Returns the simplified expression (or EXPR unchanged, if no
1809    simplification was possible).*/
1810
1811 static tree
1812 simplify_using_initial_conditions (struct loop *loop, tree expr)
1813 {
1814   edge e;
1815   basic_block bb;
1816   gimple stmt;
1817   tree cond;
1818   int cnt = 0;
1819
1820   if (TREE_CODE (expr) == INTEGER_CST)
1821     return expr;
1822
1823   /* Limit walking the dominators to avoid quadraticness in
1824      the number of BBs times the number of loops in degenerate
1825      cases.  */
1826   for (bb = loop->header;
1827        bb != ENTRY_BLOCK_PTR_FOR_FN (cfun) && cnt < MAX_DOMINATORS_TO_WALK;
1828        bb = get_immediate_dominator (CDI_DOMINATORS, bb))
1829     {
1830       if (!single_pred_p (bb))
1831         continue;
1832       e = single_pred_edge (bb);
1833
1834       if (!(e->flags & (EDGE_TRUE_VALUE | EDGE_FALSE_VALUE)))
1835         continue;
1836
1837       stmt = last_stmt (e->src);
1838       cond = fold_build2 (gimple_cond_code (stmt),
1839                           boolean_type_node,
1840                           gimple_cond_lhs (stmt),
1841                           gimple_cond_rhs (stmt));
1842       if (e->flags & EDGE_FALSE_VALUE)
1843         cond = invert_truthvalue (cond);
1844       expr = tree_simplify_using_condition (cond, expr);
1845       ++cnt;
1846     }
1847
1848   return expr;
1849 }
1850
1851 /* Tries to simplify EXPR using the evolutions of the loop invariants
1852    in the superloops of LOOP.  Returns the simplified expression
1853    (or EXPR unchanged, if no simplification was possible).  */
1854
1855 static tree
1856 simplify_using_outer_evolutions (struct loop *loop, tree expr)
1857 {
1858   enum tree_code code = TREE_CODE (expr);
1859   bool changed;
1860   tree e, e0, e1, e2;
1861
1862   if (is_gimple_min_invariant (expr))
1863     return expr;
1864
1865   if (code == TRUTH_OR_EXPR
1866       || code == TRUTH_AND_EXPR
1867       || code == COND_EXPR)
1868     {
1869       changed = false;
1870
1871       e0 = simplify_using_outer_evolutions (loop, TREE_OPERAND (expr, 0));
1872       if (TREE_OPERAND (expr, 0) != e0)
1873         changed = true;
1874
1875       e1 = simplify_using_outer_evolutions (loop, TREE_OPERAND (expr, 1));
1876       if (TREE_OPERAND (expr, 1) != e1)
1877         changed = true;
1878
1879       if (code == COND_EXPR)
1880         {
1881           e2 = simplify_using_outer_evolutions (loop, TREE_OPERAND (expr, 2));
1882           if (TREE_OPERAND (expr, 2) != e2)
1883             changed = true;
1884         }
1885       else
1886         e2 = NULL_TREE;
1887
1888       if (changed)
1889         {
1890           if (code == COND_EXPR)
1891             expr = fold_build3 (code, boolean_type_node, e0, e1, e2);
1892           else
1893             expr = fold_build2 (code, boolean_type_node, e0, e1);
1894         }
1895
1896       return expr;
1897     }
1898
1899   e = instantiate_parameters (loop, expr);
1900   if (is_gimple_min_invariant (e))
1901     return e;
1902
1903   return expr;
1904 }
1905
1906 /* Returns true if EXIT is the only possible exit from LOOP.  */
1907
1908 bool
1909 loop_only_exit_p (const struct loop *loop, const_edge exit)
1910 {
1911   basic_block *body;
1912   gimple_stmt_iterator bsi;
1913   unsigned i;
1914   gimple call;
1915
1916   if (exit != single_exit (loop))
1917     return false;
1918
1919   body = get_loop_body (loop);
1920   for (i = 0; i < loop->num_nodes; i++)
1921     {
1922       for (bsi = gsi_start_bb (body[i]); !gsi_end_p (bsi); gsi_next (&bsi))
1923         {
1924           call = gsi_stmt (bsi);
1925           if (gimple_code (call) != GIMPLE_CALL)
1926             continue;
1927
1928           if (gimple_has_side_effects (call))
1929             {
1930               free (body);
1931               return false;
1932             }
1933         }
1934     }
1935
1936   free (body);
1937   return true;
1938 }
1939
1940 /* Stores description of number of iterations of LOOP derived from
1941    EXIT (an exit edge of the LOOP) in NITER.  Returns true if some
1942    useful information could be derived (and fields of NITER has
1943    meaning described in comments at struct tree_niter_desc
1944    declaration), false otherwise.  If WARN is true and
1945    -Wunsafe-loop-optimizations was given, warn if the optimizer is going to use
1946    potentially unsafe assumptions.
1947    When EVERY_ITERATION is true, only tests that are known to be executed
1948    every iteration are considered (i.e. only test that alone bounds the loop).
1949  */
1950
1951 bool
1952 number_of_iterations_exit (struct loop *loop, edge exit,
1953                            struct tree_niter_desc *niter,
1954                            bool warn, bool every_iteration)
1955 {
1956   gimple last;
1957   gcond *stmt;
1958   tree type;
1959   tree op0, op1;
1960   enum tree_code code;
1961   affine_iv iv0, iv1;
1962   bool safe;
1963
1964   safe = dominated_by_p (CDI_DOMINATORS, loop->latch, exit->src);
1965
1966   if (every_iteration && !safe)
1967     return false;
1968
1969   niter->assumptions = boolean_false_node;
1970   niter->control.base = NULL_TREE;
1971   niter->control.step = NULL_TREE;
1972   niter->control.no_overflow = false;
1973   last = last_stmt (exit->src);
1974   if (!last)
1975     return false;
1976   stmt = dyn_cast <gcond *> (last);
1977   if (!stmt)
1978     return false;
1979
1980   /* We want the condition for staying inside loop.  */
1981   code = gimple_cond_code (stmt);
1982   if (exit->flags & EDGE_TRUE_VALUE)
1983     code = invert_tree_comparison (code, false);
1984
1985   switch (code)
1986     {
1987     case GT_EXPR:
1988     case GE_EXPR:
1989     case LT_EXPR:
1990     case LE_EXPR:
1991     case NE_EXPR:
1992       break;
1993
1994     default:
1995       return false;
1996     }
1997
1998   op0 = gimple_cond_lhs (stmt);
1999   op1 = gimple_cond_rhs (stmt);
2000   type = TREE_TYPE (op0);
2001
2002   if (TREE_CODE (type) != INTEGER_TYPE
2003       && !POINTER_TYPE_P (type))
2004     return false;
2005
2006   if (!simple_iv (loop, loop_containing_stmt (stmt), op0, &iv0, false))
2007     return false;
2008   if (!simple_iv (loop, loop_containing_stmt (stmt), op1, &iv1, false))
2009     return false;
2010
2011   /* We don't want to see undefined signed overflow warnings while
2012      computing the number of iterations.  */
2013   fold_defer_overflow_warnings ();
2014
2015   iv0.base = expand_simple_operations (iv0.base);
2016   iv1.base = expand_simple_operations (iv1.base);
2017   if (!number_of_iterations_cond (loop, type, &iv0, code, &iv1, niter,
2018                                   loop_only_exit_p (loop, exit), safe))
2019     {
2020       fold_undefer_and_ignore_overflow_warnings ();
2021       return false;
2022     }
2023
2024   if (optimize >= 3)
2025     {
2026       niter->assumptions = simplify_using_outer_evolutions (loop,
2027                                                             niter->assumptions);
2028       niter->may_be_zero = simplify_using_outer_evolutions (loop,
2029                                                             niter->may_be_zero);
2030       niter->niter = simplify_using_outer_evolutions (loop, niter->niter);
2031     }
2032
2033   niter->assumptions
2034           = simplify_using_initial_conditions (loop,
2035                                                niter->assumptions);
2036   niter->may_be_zero
2037           = simplify_using_initial_conditions (loop,
2038                                                niter->may_be_zero);
2039
2040   fold_undefer_and_ignore_overflow_warnings ();
2041
2042   /* If NITER has simplified into a constant, update MAX.  */
2043   if (TREE_CODE (niter->niter) == INTEGER_CST)
2044     niter->max = wi::to_widest (niter->niter);
2045
2046   if (integer_onep (niter->assumptions))
2047     return true;
2048
2049   /* With -funsafe-loop-optimizations we assume that nothing bad can happen.
2050      But if we can prove that there is overflow or some other source of weird
2051      behavior, ignore the loop even with -funsafe-loop-optimizations.  */
2052   if (integer_zerop (niter->assumptions) || !single_exit (loop))
2053     return false;
2054
2055   if (flag_unsafe_loop_optimizations)
2056     niter->assumptions = boolean_true_node;
2057
2058   if (warn)
2059     {
2060       const char *wording;
2061       location_t loc = gimple_location (stmt);
2062
2063       /* We can provide a more specific warning if one of the operator is
2064          constant and the other advances by +1 or -1.  */
2065       if (!integer_zerop (iv1.step)
2066           ? (integer_zerop (iv0.step)
2067              && (integer_onep (iv1.step) || integer_all_onesp (iv1.step)))
2068           : (integer_onep (iv0.step) || integer_all_onesp (iv0.step)))
2069         wording =
2070           flag_unsafe_loop_optimizations
2071           ? N_("assuming that the loop is not infinite")
2072           : N_("cannot optimize possibly infinite loops");
2073       else
2074         wording =
2075           flag_unsafe_loop_optimizations
2076           ? N_("assuming that the loop counter does not overflow")
2077           : N_("cannot optimize loop, the loop counter may overflow");
2078
2079       warning_at ((LOCATION_LINE (loc) > 0) ? loc : input_location,
2080                   OPT_Wunsafe_loop_optimizations, "%s", gettext (wording));
2081     }
2082
2083   return flag_unsafe_loop_optimizations;
2084 }
2085
2086 /* Try to determine the number of iterations of LOOP.  If we succeed,
2087    expression giving number of iterations is returned and *EXIT is
2088    set to the edge from that the information is obtained.  Otherwise
2089    chrec_dont_know is returned.  */
2090
2091 tree
2092 find_loop_niter (struct loop *loop, edge *exit)
2093 {
2094   unsigned i;
2095   vec<edge> exits = get_loop_exit_edges (loop);
2096   edge ex;
2097   tree niter = NULL_TREE, aniter;
2098   struct tree_niter_desc desc;
2099
2100   *exit = NULL;
2101   FOR_EACH_VEC_ELT (exits, i, ex)
2102     {
2103       if (!number_of_iterations_exit (loop, ex, &desc, false))
2104         continue;
2105
2106       if (integer_nonzerop (desc.may_be_zero))
2107         {
2108           /* We exit in the first iteration through this exit.
2109              We won't find anything better.  */
2110           niter = build_int_cst (unsigned_type_node, 0);
2111           *exit = ex;
2112           break;
2113         }
2114
2115       if (!integer_zerop (desc.may_be_zero))
2116         continue;
2117
2118       aniter = desc.niter;
2119
2120       if (!niter)
2121         {
2122           /* Nothing recorded yet.  */
2123           niter = aniter;
2124           *exit = ex;
2125           continue;
2126         }
2127
2128       /* Prefer constants, the lower the better.  */
2129       if (TREE_CODE (aniter) != INTEGER_CST)
2130         continue;
2131
2132       if (TREE_CODE (niter) != INTEGER_CST)
2133         {
2134           niter = aniter;
2135           *exit = ex;
2136           continue;
2137         }
2138
2139       if (tree_int_cst_lt (aniter, niter))
2140         {
2141           niter = aniter;
2142           *exit = ex;
2143           continue;
2144         }
2145     }
2146   exits.release ();
2147
2148   return niter ? niter : chrec_dont_know;
2149 }
2150
2151 /* Return true if loop is known to have bounded number of iterations.  */
2152
2153 bool
2154 finite_loop_p (struct loop *loop)
2155 {
2156   widest_int nit;
2157   int flags;
2158
2159   if (flag_unsafe_loop_optimizations)
2160     return true;
2161   flags = flags_from_decl_or_type (current_function_decl);
2162   if ((flags & (ECF_CONST|ECF_PURE)) && !(flags & ECF_LOOPING_CONST_OR_PURE))
2163     {
2164       if (dump_file && (dump_flags & TDF_DETAILS))
2165         fprintf (dump_file, "Found loop %i to be finite: it is within pure or const function.\n",
2166                  loop->num);
2167       return true;
2168     }
2169
2170   if (loop->any_upper_bound
2171       || max_loop_iterations (loop, &nit))
2172     {
2173       if (dump_file && (dump_flags & TDF_DETAILS))
2174         fprintf (dump_file, "Found loop %i to be finite: upper bound found.\n",
2175                  loop->num);
2176       return true;
2177     }
2178   return false;
2179 }
2180
2181 /*
2182
2183    Analysis of a number of iterations of a loop by a brute-force evaluation.
2184
2185 */
2186
2187 /* Bound on the number of iterations we try to evaluate.  */
2188
2189 #define MAX_ITERATIONS_TO_TRACK \
2190   ((unsigned) PARAM_VALUE (PARAM_MAX_ITERATIONS_TO_TRACK))
2191
2192 /* Returns the loop phi node of LOOP such that ssa name X is derived from its
2193    result by a chain of operations such that all but exactly one of their
2194    operands are constants.  */
2195
2196 static gphi *
2197 chain_of_csts_start (struct loop *loop, tree x)
2198 {
2199   gimple stmt = SSA_NAME_DEF_STMT (x);
2200   tree use;
2201   basic_block bb = gimple_bb (stmt);
2202   enum tree_code code;
2203
2204   if (!bb
2205       || !flow_bb_inside_loop_p (loop, bb))
2206     return NULL;
2207
2208   if (gimple_code (stmt) == GIMPLE_PHI)
2209     {
2210       if (bb == loop->header)
2211         return as_a <gphi *> (stmt);
2212
2213       return NULL;
2214     }
2215
2216   if (gimple_code (stmt) != GIMPLE_ASSIGN
2217       || gimple_assign_rhs_class (stmt) == GIMPLE_TERNARY_RHS)
2218     return NULL;
2219
2220   code = gimple_assign_rhs_code (stmt);
2221   if (gimple_references_memory_p (stmt)
2222       || TREE_CODE_CLASS (code) == tcc_reference
2223       || (code == ADDR_EXPR
2224           && !is_gimple_min_invariant (gimple_assign_rhs1 (stmt))))
2225     return NULL;
2226
2227   use = SINGLE_SSA_TREE_OPERAND (stmt, SSA_OP_USE);
2228   if (use == NULL_TREE)
2229     return NULL;
2230
2231   return chain_of_csts_start (loop, use);
2232 }
2233
2234 /* Determines whether the expression X is derived from a result of a phi node
2235    in header of LOOP such that
2236
2237    * the derivation of X consists only from operations with constants
2238    * the initial value of the phi node is constant
2239    * the value of the phi node in the next iteration can be derived from the
2240      value in the current iteration by a chain of operations with constants.
2241
2242    If such phi node exists, it is returned, otherwise NULL is returned.  */
2243
2244 static gphi *
2245 get_base_for (struct loop *loop, tree x)
2246 {
2247   gphi *phi;
2248   tree init, next;
2249
2250   if (is_gimple_min_invariant (x))
2251     return NULL;
2252
2253   phi = chain_of_csts_start (loop, x);
2254   if (!phi)
2255     return NULL;
2256
2257   init = PHI_ARG_DEF_FROM_EDGE (phi, loop_preheader_edge (loop));
2258   next = PHI_ARG_DEF_FROM_EDGE (phi, loop_latch_edge (loop));
2259
2260   if (TREE_CODE (next) != SSA_NAME)
2261     return NULL;
2262
2263   if (!is_gimple_min_invariant (init))
2264     return NULL;
2265
2266   if (chain_of_csts_start (loop, next) != phi)
2267     return NULL;
2268
2269   return phi;
2270 }
2271
2272 /* Given an expression X, then
2273
2274    * if X is NULL_TREE, we return the constant BASE.
2275    * otherwise X is a SSA name, whose value in the considered loop is derived
2276      by a chain of operations with constant from a result of a phi node in
2277      the header of the loop.  Then we return value of X when the value of the
2278      result of this phi node is given by the constant BASE.  */
2279
2280 static tree
2281 get_val_for (tree x, tree base)
2282 {
2283   gimple stmt;
2284
2285   gcc_checking_assert (is_gimple_min_invariant (base));
2286
2287   if (!x)
2288     return base;
2289
2290   stmt = SSA_NAME_DEF_STMT (x);
2291   if (gimple_code (stmt) == GIMPLE_PHI)
2292     return base;
2293
2294   gcc_checking_assert (is_gimple_assign (stmt));
2295
2296   /* STMT must be either an assignment of a single SSA name or an
2297      expression involving an SSA name and a constant.  Try to fold that
2298      expression using the value for the SSA name.  */
2299   if (gimple_assign_ssa_name_copy_p (stmt))
2300     return get_val_for (gimple_assign_rhs1 (stmt), base);
2301   else if (gimple_assign_rhs_class (stmt) == GIMPLE_UNARY_RHS
2302            && TREE_CODE (gimple_assign_rhs1 (stmt)) == SSA_NAME)
2303     {
2304       return fold_build1 (gimple_assign_rhs_code (stmt),
2305                           gimple_expr_type (stmt),
2306                           get_val_for (gimple_assign_rhs1 (stmt), base));
2307     }
2308   else if (gimple_assign_rhs_class (stmt) == GIMPLE_BINARY_RHS)
2309     {
2310       tree rhs1 = gimple_assign_rhs1 (stmt);
2311       tree rhs2 = gimple_assign_rhs2 (stmt);
2312       if (TREE_CODE (rhs1) == SSA_NAME)
2313         rhs1 = get_val_for (rhs1, base);
2314       else if (TREE_CODE (rhs2) == SSA_NAME)
2315         rhs2 = get_val_for (rhs2, base);
2316       else
2317         gcc_unreachable ();
2318       return fold_build2 (gimple_assign_rhs_code (stmt),
2319                           gimple_expr_type (stmt), rhs1, rhs2);
2320     }
2321   else
2322     gcc_unreachable ();
2323 }
2324
2325
2326 /* Tries to count the number of iterations of LOOP till it exits by EXIT
2327    by brute force -- i.e. by determining the value of the operands of the
2328    condition at EXIT in first few iterations of the loop (assuming that
2329    these values are constant) and determining the first one in that the
2330    condition is not satisfied.  Returns the constant giving the number
2331    of the iterations of LOOP if successful, chrec_dont_know otherwise.  */
2332
2333 tree
2334 loop_niter_by_eval (struct loop *loop, edge exit)
2335 {
2336   tree acnd;
2337   tree op[2], val[2], next[2], aval[2];
2338   gphi *phi;
2339   gimple cond;
2340   unsigned i, j;
2341   enum tree_code cmp;
2342
2343   cond = last_stmt (exit->src);
2344   if (!cond || gimple_code (cond) != GIMPLE_COND)
2345     return chrec_dont_know;
2346
2347   cmp = gimple_cond_code (cond);
2348   if (exit->flags & EDGE_TRUE_VALUE)
2349     cmp = invert_tree_comparison (cmp, false);
2350
2351   switch (cmp)
2352     {
2353     case EQ_EXPR:
2354     case NE_EXPR:
2355     case GT_EXPR:
2356     case GE_EXPR:
2357     case LT_EXPR:
2358     case LE_EXPR:
2359       op[0] = gimple_cond_lhs (cond);
2360       op[1] = gimple_cond_rhs (cond);
2361       break;
2362
2363     default:
2364       return chrec_dont_know;
2365     }
2366
2367   for (j = 0; j < 2; j++)
2368     {
2369       if (is_gimple_min_invariant (op[j]))
2370         {
2371           val[j] = op[j];
2372           next[j] = NULL_TREE;
2373           op[j] = NULL_TREE;
2374         }
2375       else
2376         {
2377           phi = get_base_for (loop, op[j]);
2378           if (!phi)
2379             return chrec_dont_know;
2380           val[j] = PHI_ARG_DEF_FROM_EDGE (phi, loop_preheader_edge (loop));
2381           next[j] = PHI_ARG_DEF_FROM_EDGE (phi, loop_latch_edge (loop));
2382         }
2383     }
2384
2385   /* Don't issue signed overflow warnings.  */
2386   fold_defer_overflow_warnings ();
2387
2388   for (i = 0; i < MAX_ITERATIONS_TO_TRACK; i++)
2389     {
2390       for (j = 0; j < 2; j++)
2391         aval[j] = get_val_for (op[j], val[j]);
2392
2393       acnd = fold_binary (cmp, boolean_type_node, aval[0], aval[1]);
2394       if (acnd && integer_zerop (acnd))
2395         {
2396           fold_undefer_and_ignore_overflow_warnings ();
2397           if (dump_file && (dump_flags & TDF_DETAILS))
2398             fprintf (dump_file,
2399                      "Proved that loop %d iterates %d times using brute force.\n",
2400                      loop->num, i);
2401           return build_int_cst (unsigned_type_node, i);
2402         }
2403
2404       for (j = 0; j < 2; j++)
2405         {
2406           val[j] = get_val_for (next[j], val[j]);
2407           if (!is_gimple_min_invariant (val[j]))
2408             {
2409               fold_undefer_and_ignore_overflow_warnings ();
2410               return chrec_dont_know;
2411             }
2412         }
2413     }
2414
2415   fold_undefer_and_ignore_overflow_warnings ();
2416
2417   return chrec_dont_know;
2418 }
2419
2420 /* Finds the exit of the LOOP by that the loop exits after a constant
2421    number of iterations and stores the exit edge to *EXIT.  The constant
2422    giving the number of iterations of LOOP is returned.  The number of
2423    iterations is determined using loop_niter_by_eval (i.e. by brute force
2424    evaluation).  If we are unable to find the exit for that loop_niter_by_eval
2425    determines the number of iterations, chrec_dont_know is returned.  */
2426
2427 tree
2428 find_loop_niter_by_eval (struct loop *loop, edge *exit)
2429 {
2430   unsigned i;
2431   vec<edge> exits = get_loop_exit_edges (loop);
2432   edge ex;
2433   tree niter = NULL_TREE, aniter;
2434
2435   *exit = NULL;
2436
2437   /* Loops with multiple exits are expensive to handle and less important.  */
2438   if (!flag_expensive_optimizations
2439       && exits.length () > 1)
2440     {
2441       exits.release ();
2442       return chrec_dont_know;
2443     }
2444
2445   FOR_EACH_VEC_ELT (exits, i, ex)
2446     {
2447       if (!just_once_each_iteration_p (loop, ex->src))
2448         continue;
2449
2450       aniter = loop_niter_by_eval (loop, ex);
2451       if (chrec_contains_undetermined (aniter))
2452         continue;
2453
2454       if (niter
2455           && !tree_int_cst_lt (aniter, niter))
2456         continue;
2457
2458       niter = aniter;
2459       *exit = ex;
2460     }
2461   exits.release ();
2462
2463   return niter ? niter : chrec_dont_know;
2464 }
2465
2466 /*
2467
2468    Analysis of upper bounds on number of iterations of a loop.
2469
2470 */
2471
2472 static widest_int derive_constant_upper_bound_ops (tree, tree,
2473                                                    enum tree_code, tree);
2474
2475 /* Returns a constant upper bound on the value of the right-hand side of
2476    an assignment statement STMT.  */
2477
2478 static widest_int
2479 derive_constant_upper_bound_assign (gimple stmt)
2480 {
2481   enum tree_code code = gimple_assign_rhs_code (stmt);
2482   tree op0 = gimple_assign_rhs1 (stmt);
2483   tree op1 = gimple_assign_rhs2 (stmt);
2484
2485   return derive_constant_upper_bound_ops (TREE_TYPE (gimple_assign_lhs (stmt)),
2486                                           op0, code, op1);
2487 }
2488
2489 /* Returns a constant upper bound on the value of expression VAL.  VAL
2490    is considered to be unsigned.  If its type is signed, its value must
2491    be nonnegative.  */
2492
2493 static widest_int
2494 derive_constant_upper_bound (tree val)
2495 {
2496   enum tree_code code;
2497   tree op0, op1;
2498
2499   extract_ops_from_tree (val, &code, &op0, &op1);
2500   return derive_constant_upper_bound_ops (TREE_TYPE (val), op0, code, op1);
2501 }
2502
2503 /* Returns a constant upper bound on the value of expression OP0 CODE OP1,
2504    whose type is TYPE.  The expression is considered to be unsigned.  If
2505    its type is signed, its value must be nonnegative.  */
2506
2507 static widest_int
2508 derive_constant_upper_bound_ops (tree type, tree op0,
2509                                  enum tree_code code, tree op1)
2510 {
2511   tree subtype, maxt;
2512   widest_int bnd, max, mmax, cst;
2513   gimple stmt;
2514
2515   if (INTEGRAL_TYPE_P (type))
2516     maxt = TYPE_MAX_VALUE (type);
2517   else
2518     maxt = upper_bound_in_type (type, type);
2519
2520   max = wi::to_widest (maxt);
2521
2522   switch (code)
2523     {
2524     case INTEGER_CST:
2525       return wi::to_widest (op0);
2526
2527     CASE_CONVERT:
2528       subtype = TREE_TYPE (op0);
2529       if (!TYPE_UNSIGNED (subtype)
2530           /* If TYPE is also signed, the fact that VAL is nonnegative implies
2531              that OP0 is nonnegative.  */
2532           && TYPE_UNSIGNED (type)
2533           && !tree_expr_nonnegative_p (op0))
2534         {
2535           /* If we cannot prove that the casted expression is nonnegative,
2536              we cannot establish more useful upper bound than the precision
2537              of the type gives us.  */
2538           return max;
2539         }
2540
2541       /* We now know that op0 is an nonnegative value.  Try deriving an upper
2542          bound for it.  */
2543       bnd = derive_constant_upper_bound (op0);
2544
2545       /* If the bound does not fit in TYPE, max. value of TYPE could be
2546          attained.  */
2547       if (wi::ltu_p (max, bnd))
2548         return max;
2549
2550       return bnd;
2551
2552     case PLUS_EXPR:
2553     case POINTER_PLUS_EXPR:
2554     case MINUS_EXPR:
2555       if (TREE_CODE (op1) != INTEGER_CST
2556           || !tree_expr_nonnegative_p (op0))
2557         return max;
2558
2559       /* Canonicalize to OP0 - CST.  Consider CST to be signed, in order to
2560          choose the most logical way how to treat this constant regardless
2561          of the signedness of the type.  */
2562       cst = wi::sext (wi::to_widest (op1), TYPE_PRECISION (type));
2563       if (code != MINUS_EXPR)
2564         cst = -cst;
2565
2566       bnd = derive_constant_upper_bound (op0);
2567
2568       if (wi::neg_p (cst))
2569         {
2570           cst = -cst;
2571           /* Avoid CST == 0x80000...  */
2572           if (wi::neg_p (cst))
2573             return max;
2574
2575           /* OP0 + CST.  We need to check that
2576              BND <= MAX (type) - CST.  */
2577
2578           mmax -= cst;
2579           if (wi::ltu_p (bnd, max))
2580             return max;
2581
2582           return bnd + cst;
2583         }
2584       else
2585         {
2586           /* OP0 - CST, where CST >= 0.
2587
2588              If TYPE is signed, we have already verified that OP0 >= 0, and we
2589              know that the result is nonnegative.  This implies that
2590              VAL <= BND - CST.
2591
2592              If TYPE is unsigned, we must additionally know that OP0 >= CST,
2593              otherwise the operation underflows.
2594            */
2595
2596           /* This should only happen if the type is unsigned; however, for
2597              buggy programs that use overflowing signed arithmetics even with
2598              -fno-wrapv, this condition may also be true for signed values.  */
2599           if (wi::ltu_p (bnd, cst))
2600             return max;
2601
2602           if (TYPE_UNSIGNED (type))
2603             {
2604               tree tem = fold_binary (GE_EXPR, boolean_type_node, op0,
2605                                       wide_int_to_tree (type, cst));
2606               if (!tem || integer_nonzerop (tem))
2607                 return max;
2608             }
2609
2610           bnd -= cst;
2611         }
2612
2613       return bnd;
2614
2615     case FLOOR_DIV_EXPR:
2616     case EXACT_DIV_EXPR:
2617       if (TREE_CODE (op1) != INTEGER_CST
2618           || tree_int_cst_sign_bit (op1))
2619         return max;
2620
2621       bnd = derive_constant_upper_bound (op0);
2622       return wi::udiv_floor (bnd, wi::to_widest (op1));
2623
2624     case BIT_AND_EXPR:
2625       if (TREE_CODE (op1) != INTEGER_CST
2626           || tree_int_cst_sign_bit (op1))
2627         return max;
2628       return wi::to_widest (op1);
2629
2630     case SSA_NAME:
2631       stmt = SSA_NAME_DEF_STMT (op0);
2632       if (gimple_code (stmt) != GIMPLE_ASSIGN
2633           || gimple_assign_lhs (stmt) != op0)
2634         return max;
2635       return derive_constant_upper_bound_assign (stmt);
2636
2637     default:
2638       return max;
2639     }
2640 }
2641
2642 /* Emit a -Waggressive-loop-optimizations warning if needed.  */
2643
2644 static void
2645 do_warn_aggressive_loop_optimizations (struct loop *loop,
2646                                        widest_int i_bound, gimple stmt)
2647 {
2648   /* Don't warn if the loop doesn't have known constant bound.  */
2649   if (!loop->nb_iterations
2650       || TREE_CODE (loop->nb_iterations) != INTEGER_CST
2651       || !warn_aggressive_loop_optimizations
2652       /* To avoid warning multiple times for the same loop,
2653          only start warning when we preserve loops.  */
2654       || (cfun->curr_properties & PROP_loops) == 0
2655       /* Only warn once per loop.  */
2656       || loop->warned_aggressive_loop_optimizations
2657       /* Only warn if undefined behavior gives us lower estimate than the
2658          known constant bound.  */
2659       || wi::cmpu (i_bound, wi::to_widest (loop->nb_iterations)) >= 0
2660       /* And undefined behavior happens unconditionally.  */
2661       || !dominated_by_p (CDI_DOMINATORS, loop->latch, gimple_bb (stmt)))
2662     return;
2663
2664   edge e = single_exit (loop);
2665   if (e == NULL)
2666     return;
2667
2668   gimple estmt = last_stmt (e->src);
2669   if (warning_at (gimple_location (stmt), OPT_Waggressive_loop_optimizations,
2670                   "iteration %E invokes undefined behavior",
2671                   wide_int_to_tree (TREE_TYPE (loop->nb_iterations),
2672                                     i_bound)))
2673     inform (gimple_location (estmt), "containing loop");
2674   loop->warned_aggressive_loop_optimizations = true;
2675 }
2676
2677 /* Records that AT_STMT is executed at most BOUND + 1 times in LOOP.  IS_EXIT
2678    is true if the loop is exited immediately after STMT, and this exit
2679    is taken at last when the STMT is executed BOUND + 1 times.
2680    REALISTIC is true if BOUND is expected to be close to the real number
2681    of iterations.  UPPER is true if we are sure the loop iterates at most
2682    BOUND times.  I_BOUND is a widest_int upper estimate on BOUND.  */
2683
2684 static void
2685 record_estimate (struct loop *loop, tree bound, const widest_int &i_bound,
2686                  gimple at_stmt, bool is_exit, bool realistic, bool upper)
2687 {
2688   widest_int delta;
2689
2690   if (dump_file && (dump_flags & TDF_DETAILS))
2691     {
2692       fprintf (dump_file, "Statement %s", is_exit ? "(exit)" : "");
2693       print_gimple_stmt (dump_file, at_stmt, 0, TDF_SLIM);
2694       fprintf (dump_file, " is %sexecuted at most ",
2695                upper ? "" : "probably ");
2696       print_generic_expr (dump_file, bound, TDF_SLIM);
2697       fprintf (dump_file, " (bounded by ");
2698       print_decu (i_bound, dump_file);
2699       fprintf (dump_file, ") + 1 times in loop %d.\n", loop->num);
2700     }
2701
2702   /* If the I_BOUND is just an estimate of BOUND, it rarely is close to the
2703      real number of iterations.  */
2704   if (TREE_CODE (bound) != INTEGER_CST)
2705     realistic = false;
2706   else
2707     gcc_checking_assert (i_bound == wi::to_widest (bound));
2708   if (!upper && !realistic)
2709     return;
2710
2711   /* If we have a guaranteed upper bound, record it in the appropriate
2712      list, unless this is an !is_exit bound (i.e. undefined behavior in
2713      at_stmt) in a loop with known constant number of iterations.  */
2714   if (upper
2715       && (is_exit
2716           || loop->nb_iterations == NULL_TREE
2717           || TREE_CODE (loop->nb_iterations) != INTEGER_CST))
2718     {
2719       struct nb_iter_bound *elt = ggc_alloc<nb_iter_bound> ();
2720
2721       elt->bound = i_bound;
2722       elt->stmt = at_stmt;
2723       elt->is_exit = is_exit;
2724       elt->next = loop->bounds;
2725       loop->bounds = elt;
2726     }
2727
2728   /* If statement is executed on every path to the loop latch, we can directly
2729      infer the upper bound on the # of iterations of the loop.  */
2730   if (!dominated_by_p (CDI_DOMINATORS, loop->latch, gimple_bb (at_stmt)))
2731     return;
2732
2733   /* Update the number of iteration estimates according to the bound.
2734      If at_stmt is an exit then the loop latch is executed at most BOUND times,
2735      otherwise it can be executed BOUND + 1 times.  We will lower the estimate
2736      later if such statement must be executed on last iteration  */
2737   if (is_exit)
2738     delta = 0;
2739   else
2740     delta = 1;
2741   widest_int new_i_bound = i_bound + delta;
2742
2743   /* If an overflow occurred, ignore the result.  */
2744   if (wi::ltu_p (new_i_bound, delta))
2745     return;
2746
2747   if (upper && !is_exit)
2748     do_warn_aggressive_loop_optimizations (loop, new_i_bound, at_stmt);
2749   record_niter_bound (loop, new_i_bound, realistic, upper);
2750 }
2751
2752 /* Records the control iv analyzed in NITER for LOOP if the iv is valid
2753    and doesn't overflow.  */
2754
2755 static void
2756 record_control_iv (struct loop *loop, struct tree_niter_desc *niter)
2757 {
2758   struct control_iv *iv;
2759
2760   if (!niter->control.base || !niter->control.step)
2761     return;
2762
2763   if (!integer_onep (niter->assumptions) || !niter->control.no_overflow)
2764     return;
2765
2766   iv = ggc_alloc<control_iv> ();
2767   iv->base = niter->control.base;
2768   iv->step = niter->control.step;
2769   iv->next = loop->control_ivs;
2770   loop->control_ivs = iv;
2771
2772   return;
2773 }
2774
2775 /* Record the estimate on number of iterations of LOOP based on the fact that
2776    the induction variable BASE + STEP * i evaluated in STMT does not wrap and
2777    its values belong to the range <LOW, HIGH>.  REALISTIC is true if the
2778    estimated number of iterations is expected to be close to the real one.
2779    UPPER is true if we are sure the induction variable does not wrap.  */
2780
2781 static void
2782 record_nonwrapping_iv (struct loop *loop, tree base, tree step, gimple stmt,
2783                        tree low, tree high, bool realistic, bool upper)
2784 {
2785   tree niter_bound, extreme, delta;
2786   tree type = TREE_TYPE (base), unsigned_type;
2787   tree orig_base = base;
2788
2789   if (TREE_CODE (step) != INTEGER_CST || integer_zerop (step))
2790     return;
2791
2792   if (dump_file && (dump_flags & TDF_DETAILS))
2793     {
2794       fprintf (dump_file, "Induction variable (");
2795       print_generic_expr (dump_file, TREE_TYPE (base), TDF_SLIM);
2796       fprintf (dump_file, ") ");
2797       print_generic_expr (dump_file, base, TDF_SLIM);
2798       fprintf (dump_file, " + ");
2799       print_generic_expr (dump_file, step, TDF_SLIM);
2800       fprintf (dump_file, " * iteration does not wrap in statement ");
2801       print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
2802       fprintf (dump_file, " in loop %d.\n", loop->num);
2803     }
2804
2805   unsigned_type = unsigned_type_for (type);
2806   base = fold_convert (unsigned_type, base);
2807   step = fold_convert (unsigned_type, step);
2808
2809   if (tree_int_cst_sign_bit (step))
2810     {
2811       wide_int min, max;
2812       extreme = fold_convert (unsigned_type, low);
2813       if (TREE_CODE (orig_base) == SSA_NAME
2814           && TREE_CODE (high) == INTEGER_CST
2815           && INTEGRAL_TYPE_P (TREE_TYPE (orig_base))
2816           && get_range_info (orig_base, &min, &max) == VR_RANGE
2817           && wi::gts_p (high, max))
2818         base = wide_int_to_tree (unsigned_type, max);
2819       else if (TREE_CODE (base) != INTEGER_CST)
2820         base = fold_convert (unsigned_type, high);
2821       delta = fold_build2 (MINUS_EXPR, unsigned_type, base, extreme);
2822       step = fold_build1 (NEGATE_EXPR, unsigned_type, step);
2823     }
2824   else
2825     {
2826       wide_int min, max;
2827       extreme = fold_convert (unsigned_type, high);
2828       if (TREE_CODE (orig_base) == SSA_NAME
2829           && TREE_CODE (low) == INTEGER_CST
2830           && INTEGRAL_TYPE_P (TREE_TYPE (orig_base))
2831           && get_range_info (orig_base, &min, &max) == VR_RANGE
2832           && wi::gts_p (min, low))
2833         base = wide_int_to_tree (unsigned_type, min);
2834       else if (TREE_CODE (base) != INTEGER_CST)
2835         base = fold_convert (unsigned_type, low);
2836       delta = fold_build2 (MINUS_EXPR, unsigned_type, extreme, base);
2837     }
2838
2839   /* STMT is executed at most NITER_BOUND + 1 times, since otherwise the value
2840      would get out of the range.  */
2841   niter_bound = fold_build2 (FLOOR_DIV_EXPR, unsigned_type, delta, step);
2842   widest_int max = derive_constant_upper_bound (niter_bound);
2843   record_estimate (loop, niter_bound, max, stmt, false, realistic, upper);
2844 }
2845
2846 /* Determine information about number of iterations a LOOP from the index
2847    IDX of a data reference accessed in STMT.  RELIABLE is true if STMT is
2848    guaranteed to be executed in every iteration of LOOP.  Callback for
2849    for_each_index.  */
2850
2851 struct ilb_data
2852 {
2853   struct loop *loop;
2854   gimple stmt;
2855 };
2856
2857 static bool
2858 idx_infer_loop_bounds (tree base, tree *idx, void *dta)
2859 {
2860   struct ilb_data *data = (struct ilb_data *) dta;
2861   tree ev, init, step;
2862   tree low, high, type, next;
2863   bool sign, upper = true, at_end = false;
2864   struct loop *loop = data->loop;
2865   bool reliable = true;
2866
2867   if (TREE_CODE (base) != ARRAY_REF)
2868     return true;
2869
2870   /* For arrays at the end of the structure, we are not guaranteed that they
2871      do not really extend over their declared size.  However, for arrays of
2872      size greater than one, this is unlikely to be intended.  */
2873   if (array_at_struct_end_p (base))
2874     {
2875       at_end = true;
2876       upper = false;
2877     }
2878
2879   struct loop *dloop = loop_containing_stmt (data->stmt);
2880   if (!dloop)
2881     return true;
2882
2883   ev = analyze_scalar_evolution (dloop, *idx);
2884   ev = instantiate_parameters (loop, ev);
2885   init = initial_condition (ev);
2886   step = evolution_part_in_loop_num (ev, loop->num);
2887
2888   if (!init
2889       || !step
2890       || TREE_CODE (step) != INTEGER_CST
2891       || integer_zerop (step)
2892       || tree_contains_chrecs (init, NULL)
2893       || chrec_contains_symbols_defined_in_loop (init, loop->num))
2894     return true;
2895
2896   low = array_ref_low_bound (base);
2897   high = array_ref_up_bound (base);
2898
2899   /* The case of nonconstant bounds could be handled, but it would be
2900      complicated.  */
2901   if (TREE_CODE (low) != INTEGER_CST
2902       || !high
2903       || TREE_CODE (high) != INTEGER_CST)
2904     return true;
2905   sign = tree_int_cst_sign_bit (step);
2906   type = TREE_TYPE (step);
2907
2908   /* The array of length 1 at the end of a structure most likely extends
2909      beyond its bounds.  */
2910   if (at_end
2911       && operand_equal_p (low, high, 0))
2912     return true;
2913
2914   /* In case the relevant bound of the array does not fit in type, or
2915      it does, but bound + step (in type) still belongs into the range of the
2916      array, the index may wrap and still stay within the range of the array
2917      (consider e.g. if the array is indexed by the full range of
2918      unsigned char).
2919
2920      To make things simpler, we require both bounds to fit into type, although
2921      there are cases where this would not be strictly necessary.  */
2922   if (!int_fits_type_p (high, type)
2923       || !int_fits_type_p (low, type))
2924     return true;
2925   low = fold_convert (type, low);
2926   high = fold_convert (type, high);
2927
2928   if (sign)
2929     next = fold_binary (PLUS_EXPR, type, low, step);
2930   else
2931     next = fold_binary (PLUS_EXPR, type, high, step);
2932
2933   if (tree_int_cst_compare (low, next) <= 0
2934       && tree_int_cst_compare (next, high) <= 0)
2935     return true;
2936
2937   /* If access is not executed on every iteration, we must ensure that overlow may
2938      not make the access valid later.  */
2939   if (!dominated_by_p (CDI_DOMINATORS, loop->latch, gimple_bb (data->stmt))
2940       && scev_probably_wraps_p (initial_condition_in_loop_num (ev, loop->num),
2941                                 step, data->stmt, loop, true))
2942     reliable = false;
2943
2944   record_nonwrapping_iv (loop, init, step, data->stmt, low, high, reliable, upper);
2945   return true;
2946 }
2947
2948 /* Determine information about number of iterations a LOOP from the bounds
2949    of arrays in the data reference REF accessed in STMT.  RELIABLE is true if
2950    STMT is guaranteed to be executed in every iteration of LOOP.*/
2951
2952 static void
2953 infer_loop_bounds_from_ref (struct loop *loop, gimple stmt, tree ref)
2954 {
2955   struct ilb_data data;
2956
2957   data.loop = loop;
2958   data.stmt = stmt;
2959   for_each_index (&ref, idx_infer_loop_bounds, &data);
2960 }
2961
2962 /* Determine information about number of iterations of a LOOP from the way
2963    arrays are used in STMT.  RELIABLE is true if STMT is guaranteed to be
2964    executed in every iteration of LOOP.  */
2965
2966 static void
2967 infer_loop_bounds_from_array (struct loop *loop, gimple stmt)
2968 {
2969   if (is_gimple_assign (stmt))
2970     {
2971       tree op0 = gimple_assign_lhs (stmt);
2972       tree op1 = gimple_assign_rhs1 (stmt);
2973
2974       /* For each memory access, analyze its access function
2975          and record a bound on the loop iteration domain.  */
2976       if (REFERENCE_CLASS_P (op0))
2977         infer_loop_bounds_from_ref (loop, stmt, op0);
2978
2979       if (REFERENCE_CLASS_P (op1))
2980         infer_loop_bounds_from_ref (loop, stmt, op1);
2981     }
2982   else if (is_gimple_call (stmt))
2983     {
2984       tree arg, lhs;
2985       unsigned i, n = gimple_call_num_args (stmt);
2986
2987       lhs = gimple_call_lhs (stmt);
2988       if (lhs && REFERENCE_CLASS_P (lhs))
2989         infer_loop_bounds_from_ref (loop, stmt, lhs);
2990
2991       for (i = 0; i < n; i++)
2992         {
2993           arg = gimple_call_arg (stmt, i);
2994           if (REFERENCE_CLASS_P (arg))
2995             infer_loop_bounds_from_ref (loop, stmt, arg);
2996         }
2997     }
2998 }
2999
3000 /* Determine information about number of iterations of a LOOP from the fact
3001    that pointer arithmetics in STMT does not overflow.  */
3002
3003 static void
3004 infer_loop_bounds_from_pointer_arith (struct loop *loop, gimple stmt)
3005 {
3006   tree def, base, step, scev, type, low, high;
3007   tree var, ptr;
3008
3009   if (!is_gimple_assign (stmt)
3010       || gimple_assign_rhs_code (stmt) != POINTER_PLUS_EXPR)
3011     return;
3012
3013   def = gimple_assign_lhs (stmt);
3014   if (TREE_CODE (def) != SSA_NAME)
3015     return;
3016
3017   type = TREE_TYPE (def);
3018   if (!nowrap_type_p (type))
3019     return;
3020
3021   ptr = gimple_assign_rhs1 (stmt);
3022   if (!expr_invariant_in_loop_p (loop, ptr))
3023     return;
3024
3025   var = gimple_assign_rhs2 (stmt);
3026   if (TYPE_PRECISION (type) != TYPE_PRECISION (TREE_TYPE (var)))
3027     return;
3028
3029   scev = instantiate_parameters (loop, analyze_scalar_evolution (loop, def));
3030   if (chrec_contains_undetermined (scev))
3031     return;
3032
3033   base = initial_condition_in_loop_num (scev, loop->num);
3034   step = evolution_part_in_loop_num (scev, loop->num);
3035
3036   if (!base || !step
3037       || TREE_CODE (step) != INTEGER_CST
3038       || tree_contains_chrecs (base, NULL)
3039       || chrec_contains_symbols_defined_in_loop (base, loop->num))
3040     return;
3041
3042   low = lower_bound_in_type (type, type);
3043   high = upper_bound_in_type (type, type);
3044
3045   /* In C, pointer arithmetic p + 1 cannot use a NULL pointer, and p - 1 cannot
3046      produce a NULL pointer.  The contrary would mean NULL points to an object,
3047      while NULL is supposed to compare unequal with the address of all objects.
3048      Furthermore, p + 1 cannot produce a NULL pointer and p - 1 cannot use a
3049      NULL pointer since that would mean wrapping, which we assume here not to
3050      happen.  So, we can exclude NULL from the valid range of pointer
3051      arithmetic.  */
3052   if (flag_delete_null_pointer_checks && int_cst_value (low) == 0)
3053     low = build_int_cstu (TREE_TYPE (low), TYPE_ALIGN_UNIT (TREE_TYPE (type)));
3054
3055   record_nonwrapping_iv (loop, base, step, stmt, low, high, false, true);
3056 }
3057
3058 /* Determine information about number of iterations of a LOOP from the fact
3059    that signed arithmetics in STMT does not overflow.  */
3060
3061 static void
3062 infer_loop_bounds_from_signedness (struct loop *loop, gimple stmt)
3063 {
3064   tree def, base, step, scev, type, low, high;
3065
3066   if (gimple_code (stmt) != GIMPLE_ASSIGN)
3067     return;
3068
3069   def = gimple_assign_lhs (stmt);
3070
3071   if (TREE_CODE (def) != SSA_NAME)
3072     return;
3073
3074   type = TREE_TYPE (def);
3075   if (!INTEGRAL_TYPE_P (type)
3076       || !TYPE_OVERFLOW_UNDEFINED (type))
3077     return;
3078
3079   scev = instantiate_parameters (loop, analyze_scalar_evolution (loop, def));
3080   if (chrec_contains_undetermined (scev))
3081     return;
3082
3083   base = initial_condition_in_loop_num (scev, loop->num);
3084   step = evolution_part_in_loop_num (scev, loop->num);
3085
3086   if (!base || !step
3087       || TREE_CODE (step) != INTEGER_CST
3088       || tree_contains_chrecs (base, NULL)
3089       || chrec_contains_symbols_defined_in_loop (base, loop->num))
3090     return;
3091
3092   low = lower_bound_in_type (type, type);
3093   high = upper_bound_in_type (type, type);
3094
3095   record_nonwrapping_iv (loop, base, step, stmt, low, high, false, true);
3096 }
3097
3098 /* The following analyzers are extracting informations on the bounds
3099    of LOOP from the following undefined behaviors:
3100
3101    - data references should not access elements over the statically
3102      allocated size,
3103
3104    - signed variables should not overflow when flag_wrapv is not set.
3105 */
3106
3107 static void
3108 infer_loop_bounds_from_undefined (struct loop *loop)
3109 {
3110   unsigned i;
3111   basic_block *bbs;
3112   gimple_stmt_iterator bsi;
3113   basic_block bb;
3114   bool reliable;
3115
3116   bbs = get_loop_body (loop);
3117
3118   for (i = 0; i < loop->num_nodes; i++)
3119     {
3120       bb = bbs[i];
3121
3122       /* If BB is not executed in each iteration of the loop, we cannot
3123          use the operations in it to infer reliable upper bound on the
3124          # of iterations of the loop.  However, we can use it as a guess.
3125          Reliable guesses come only from array bounds.  */
3126       reliable = dominated_by_p (CDI_DOMINATORS, loop->latch, bb);
3127
3128       for (bsi = gsi_start_bb (bb); !gsi_end_p (bsi); gsi_next (&bsi))
3129         {
3130           gimple stmt = gsi_stmt (bsi);
3131
3132           infer_loop_bounds_from_array (loop, stmt);
3133
3134           if (reliable)
3135             {
3136               infer_loop_bounds_from_signedness (loop, stmt);
3137               infer_loop_bounds_from_pointer_arith (loop, stmt);
3138             }
3139         }
3140
3141     }
3142
3143   free (bbs);
3144 }
3145
3146 /* Compare wide ints, callback for qsort.  */
3147
3148 static int
3149 wide_int_cmp (const void *p1, const void *p2)
3150 {
3151   const widest_int *d1 = (const widest_int *) p1;
3152   const widest_int *d2 = (const widest_int *) p2;
3153   return wi::cmpu (*d1, *d2);
3154 }
3155
3156 /* Return index of BOUND in BOUNDS array sorted in increasing order.
3157    Lookup by binary search.  */
3158
3159 static int
3160 bound_index (vec<widest_int> bounds, const widest_int &bound)
3161 {
3162   unsigned int end = bounds.length ();
3163   unsigned int begin = 0;
3164
3165   /* Find a matching index by means of a binary search.  */
3166   while (begin != end)
3167     {
3168       unsigned int middle = (begin + end) / 2;
3169       widest_int index = bounds[middle];
3170
3171       if (index == bound)
3172         return middle;
3173       else if (wi::ltu_p (index, bound))
3174         begin = middle + 1;
3175       else
3176         end = middle;
3177     }
3178   gcc_unreachable ();
3179 }
3180
3181 /* We recorded loop bounds only for statements dominating loop latch (and thus
3182    executed each loop iteration).  If there are any bounds on statements not
3183    dominating the loop latch we can improve the estimate by walking the loop
3184    body and seeing if every path from loop header to loop latch contains
3185    some bounded statement.  */
3186
3187 static void
3188 discover_iteration_bound_by_body_walk (struct loop *loop)
3189 {
3190   struct nb_iter_bound *elt;
3191   vec<widest_int> bounds = vNULL;
3192   vec<vec<basic_block> > queues = vNULL;
3193   vec<basic_block> queue = vNULL;
3194   ptrdiff_t queue_index;
3195   ptrdiff_t latch_index = 0;
3196
3197   /* Discover what bounds may interest us.  */
3198   for (elt = loop->bounds; elt; elt = elt->next)
3199     {
3200       widest_int bound = elt->bound;
3201
3202       /* Exit terminates loop at given iteration, while non-exits produce undefined
3203          effect on the next iteration.  */
3204       if (!elt->is_exit)
3205         {
3206           bound += 1;
3207           /* If an overflow occurred, ignore the result.  */
3208           if (bound == 0)
3209             continue;
3210         }
3211
3212       if (!loop->any_upper_bound
3213           || wi::ltu_p (bound, loop->nb_iterations_upper_bound))
3214         bounds.safe_push (bound);
3215     }
3216
3217   /* Exit early if there is nothing to do.  */
3218   if (!bounds.exists ())
3219     return;
3220
3221   if (dump_file && (dump_flags & TDF_DETAILS))
3222     fprintf (dump_file, " Trying to walk loop body to reduce the bound.\n");
3223
3224   /* Sort the bounds in decreasing order.  */
3225   bounds.qsort (wide_int_cmp);
3226
3227   /* For every basic block record the lowest bound that is guaranteed to
3228      terminate the loop.  */
3229
3230   hash_map<basic_block, ptrdiff_t> bb_bounds;
3231   for (elt = loop->bounds; elt; elt = elt->next)
3232     {
3233       widest_int bound = elt->bound;
3234       if (!elt->is_exit)
3235         {
3236           bound += 1;
3237           /* If an overflow occurred, ignore the result.  */
3238           if (bound == 0)
3239             continue;
3240         }
3241
3242       if (!loop->any_upper_bound
3243           || wi::ltu_p (bound, loop->nb_iterations_upper_bound))
3244         {
3245           ptrdiff_t index = bound_index (bounds, bound);
3246           ptrdiff_t *entry = bb_bounds.get (gimple_bb (elt->stmt));
3247           if (!entry)
3248             bb_bounds.put (gimple_bb (elt->stmt), index);
3249           else if ((ptrdiff_t)*entry > index)
3250             *entry = index;
3251         }
3252     }
3253
3254   hash_map<basic_block, ptrdiff_t> block_priority;
3255
3256   /* Perform shortest path discovery loop->header ... loop->latch.
3257
3258      The "distance" is given by the smallest loop bound of basic block
3259      present in the path and we look for path with largest smallest bound
3260      on it.
3261
3262      To avoid the need for fibonacci heap on double ints we simply compress
3263      double ints into indexes to BOUNDS array and then represent the queue
3264      as arrays of queues for every index.
3265      Index of BOUNDS.length() means that the execution of given BB has
3266      no bounds determined.
3267
3268      VISITED is a pointer map translating basic block into smallest index
3269      it was inserted into the priority queue with.  */
3270   latch_index = -1;
3271
3272   /* Start walk in loop header with index set to infinite bound.  */
3273   queue_index = bounds.length ();
3274   queues.safe_grow_cleared (queue_index + 1);
3275   queue.safe_push (loop->header);
3276   queues[queue_index] = queue;
3277   block_priority.put (loop->header, queue_index);
3278
3279   for (; queue_index >= 0; queue_index--)
3280     {
3281       if (latch_index < queue_index)
3282         {
3283           while (queues[queue_index].length ())
3284             {
3285               basic_block bb;
3286               ptrdiff_t bound_index = queue_index;
3287               edge e;
3288               edge_iterator ei;
3289
3290               queue = queues[queue_index];
3291               bb = queue.pop ();
3292
3293               /* OK, we later inserted the BB with lower priority, skip it.  */
3294               if (*block_priority.get (bb) > queue_index)
3295                 continue;
3296
3297               /* See if we can improve the bound.  */
3298               ptrdiff_t *entry = bb_bounds.get (bb);
3299               if (entry && *entry < bound_index)
3300                 bound_index = *entry;
3301
3302               /* Insert succesors into the queue, watch for latch edge
3303                  and record greatest index we saw.  */
3304               FOR_EACH_EDGE (e, ei, bb->succs)
3305                 {
3306                   bool insert = false;
3307
3308                   if (loop_exit_edge_p (loop, e))
3309                     continue;
3310
3311                   if (e == loop_latch_edge (loop)
3312                       && latch_index < bound_index)
3313                     latch_index = bound_index;
3314                   else if (!(entry = block_priority.get (e->dest)))
3315                     {
3316                       insert = true;
3317                       block_priority.put (e->dest, bound_index);
3318                     }
3319                   else if (*entry < bound_index)
3320                     {
3321                       insert = true;
3322                       *entry = bound_index;
3323                     }
3324
3325                   if (insert)
3326                     queues[bound_index].safe_push (e->dest);
3327                 }
3328             }
3329         }
3330       queues[queue_index].release ();
3331     }
3332
3333   gcc_assert (latch_index >= 0);
3334   if ((unsigned)latch_index < bounds.length ())
3335     {
3336       if (dump_file && (dump_flags & TDF_DETAILS))
3337         {
3338           fprintf (dump_file, "Found better loop bound ");
3339           print_decu (bounds[latch_index], dump_file);
3340           fprintf (dump_file, "\n");
3341         }
3342       record_niter_bound (loop, bounds[latch_index], false, true);
3343     }
3344
3345   queues.release ();
3346   bounds.release ();
3347 }
3348
3349 /* See if every path cross the loop goes through a statement that is known
3350    to not execute at the last iteration. In that case we can decrese iteration
3351    count by 1.  */
3352
3353 static void
3354 maybe_lower_iteration_bound (struct loop *loop)
3355 {
3356   hash_set<gimple> *not_executed_last_iteration = NULL;
3357   struct nb_iter_bound *elt;
3358   bool found_exit = false;
3359   vec<basic_block> queue = vNULL;
3360   bitmap visited;
3361
3362   /* Collect all statements with interesting (i.e. lower than
3363      nb_iterations_upper_bound) bound on them.
3364
3365      TODO: Due to the way record_estimate choose estimates to store, the bounds
3366      will be always nb_iterations_upper_bound-1.  We can change this to record
3367      also statements not dominating the loop latch and update the walk bellow
3368      to the shortest path algorthm.  */
3369   for (elt = loop->bounds; elt; elt = elt->next)
3370     {
3371       if (!elt->is_exit
3372           && wi::ltu_p (elt->bound, loop->nb_iterations_upper_bound))
3373         {
3374           if (!not_executed_last_iteration)
3375             not_executed_last_iteration = new hash_set<gimple>;
3376           not_executed_last_iteration->add (elt->stmt);
3377         }
3378     }
3379   if (!not_executed_last_iteration)
3380     return;
3381
3382   /* Start DFS walk in the loop header and see if we can reach the
3383      loop latch or any of the exits (including statements with side
3384      effects that may terminate the loop otherwise) without visiting
3385      any of the statements known to have undefined effect on the last
3386      iteration.  */
3387   queue.safe_push (loop->header);
3388   visited = BITMAP_ALLOC (NULL);
3389   bitmap_set_bit (visited, loop->header->index);
3390   found_exit = false;
3391
3392   do
3393     {
3394       basic_block bb = queue.pop ();
3395       gimple_stmt_iterator gsi;
3396       bool stmt_found = false;
3397
3398       /* Loop for possible exits and statements bounding the execution.  */
3399       for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
3400         {
3401           gimple stmt = gsi_stmt (gsi);
3402           if (not_executed_last_iteration->contains (stmt))
3403             {
3404               stmt_found = true;
3405               break;
3406             }
3407           if (gimple_has_side_effects (stmt))
3408             {
3409               found_exit = true;
3410               break;
3411             }
3412         }
3413       if (found_exit)
3414         break;
3415
3416       /* If no bounding statement is found, continue the walk.  */
3417       if (!stmt_found)
3418         {
3419           edge e;
3420           edge_iterator ei;
3421
3422           FOR_EACH_EDGE (e, ei, bb->succs)
3423             {
3424               if (loop_exit_edge_p (loop, e)
3425                   || e == loop_latch_edge (loop))
3426                 {
3427                   found_exit = true;
3428                   break;
3429                 }
3430               if (bitmap_set_bit (visited, e->dest->index))
3431                 queue.safe_push (e->dest);
3432             }
3433         }
3434     }
3435   while (queue.length () && !found_exit);
3436
3437   /* If every path through the loop reach bounding statement before exit,
3438      then we know the last iteration of the loop will have undefined effect
3439      and we can decrease number of iterations.  */
3440
3441   if (!found_exit)
3442     {
3443       if (dump_file && (dump_flags & TDF_DETAILS))
3444         fprintf (dump_file, "Reducing loop iteration estimate by 1; "
3445                  "undefined statement must be executed at the last iteration.\n");
3446       record_niter_bound (loop, loop->nb_iterations_upper_bound - 1,
3447                           false, true);
3448     }
3449
3450   BITMAP_FREE (visited);
3451   queue.release ();
3452   delete not_executed_last_iteration;
3453 }
3454
3455 /* Records estimates on numbers of iterations of LOOP.  If USE_UNDEFINED_P
3456    is true also use estimates derived from undefined behavior.  */
3457
3458 static void
3459 estimate_numbers_of_iterations_loop (struct loop *loop)
3460 {
3461   vec<edge> exits;
3462   tree niter, type;
3463   unsigned i;
3464   struct tree_niter_desc niter_desc;
3465   edge ex;
3466   widest_int bound;
3467   edge likely_exit;
3468
3469   /* Give up if we already have tried to compute an estimation.  */
3470   if (loop->estimate_state != EST_NOT_COMPUTED)
3471     return;
3472
3473   loop->estimate_state = EST_AVAILABLE;
3474   /* Force estimate compuation but leave any existing upper bound in place.  */
3475   loop->any_estimate = false;
3476
3477   /* Ensure that loop->nb_iterations is computed if possible.  If it turns out
3478      to be constant, we avoid undefined behavior implied bounds and instead
3479      diagnose those loops with -Waggressive-loop-optimizations.  */
3480   number_of_latch_executions (loop);
3481
3482   exits = get_loop_exit_edges (loop);
3483   likely_exit = single_likely_exit (loop);
3484   FOR_EACH_VEC_ELT (exits, i, ex)
3485     {
3486       if (!number_of_iterations_exit (loop, ex, &niter_desc, false, false))
3487         continue;
3488
3489       niter = niter_desc.niter;
3490       type = TREE_TYPE (niter);
3491       if (TREE_CODE (niter_desc.may_be_zero) != INTEGER_CST)
3492         niter = build3 (COND_EXPR, type, niter_desc.may_be_zero,
3493                         build_int_cst (type, 0),
3494                         niter);
3495       record_estimate (loop, niter, niter_desc.max,
3496                        last_stmt (ex->src),
3497                        true, ex == likely_exit, true);
3498       record_control_iv (loop, &niter_desc);
3499     }
3500   exits.release ();
3501
3502   if (flag_aggressive_loop_optimizations)
3503     infer_loop_bounds_from_undefined (loop);
3504
3505   discover_iteration_bound_by_body_walk (loop);
3506
3507   maybe_lower_iteration_bound (loop);
3508
3509   /* If we have a measured profile, use it to estimate the number of
3510      iterations.  */
3511   if (loop->header->count != 0)
3512     {
3513       gcov_type nit = expected_loop_iterations_unbounded (loop) + 1;
3514       bound = gcov_type_to_wide_int (nit);
3515       record_niter_bound (loop, bound, true, false);
3516     }
3517
3518   /* If we know the exact number of iterations of this loop, try to
3519      not break code with undefined behavior by not recording smaller
3520      maximum number of iterations.  */
3521   if (loop->nb_iterations
3522       && TREE_CODE (loop->nb_iterations) == INTEGER_CST)
3523     {
3524       loop->any_upper_bound = true;
3525       loop->nb_iterations_upper_bound = wi::to_widest (loop->nb_iterations);
3526     }
3527 }
3528
3529 /* Sets NIT to the estimated number of executions of the latch of the
3530    LOOP.  If CONSERVATIVE is true, we must be sure that NIT is at least as
3531    large as the number of iterations.  If we have no reliable estimate,
3532    the function returns false, otherwise returns true.  */
3533
3534 bool
3535 estimated_loop_iterations (struct loop *loop, widest_int *nit)
3536 {
3537   /* When SCEV information is available, try to update loop iterations
3538      estimate.  Otherwise just return whatever we recorded earlier.  */
3539   if (scev_initialized_p ())
3540     estimate_numbers_of_iterations_loop (loop);
3541
3542   return (get_estimated_loop_iterations (loop, nit));
3543 }
3544
3545 /* Similar to estimated_loop_iterations, but returns the estimate only
3546    if it fits to HOST_WIDE_INT.  If this is not the case, or the estimate
3547    on the number of iterations of LOOP could not be derived, returns -1.  */
3548
3549 HOST_WIDE_INT
3550 estimated_loop_iterations_int (struct loop *loop)
3551 {
3552   widest_int nit;
3553   HOST_WIDE_INT hwi_nit;
3554
3555   if (!estimated_loop_iterations (loop, &nit))
3556     return -1;
3557
3558   if (!wi::fits_shwi_p (nit))
3559     return -1;
3560   hwi_nit = nit.to_shwi ();
3561
3562   return hwi_nit < 0 ? -1 : hwi_nit;
3563 }
3564
3565
3566 /* Sets NIT to an upper bound for the maximum number of executions of the
3567    latch of the LOOP.  If we have no reliable estimate, the function returns
3568    false, otherwise returns true.  */
3569
3570 bool
3571 max_loop_iterations (struct loop *loop, widest_int *nit)
3572 {
3573   /* When SCEV information is available, try to update loop iterations
3574      estimate.  Otherwise just return whatever we recorded earlier.  */
3575   if (scev_initialized_p ())
3576     estimate_numbers_of_iterations_loop (loop);
3577
3578   return get_max_loop_iterations (loop, nit);
3579 }
3580
3581 /* Similar to max_loop_iterations, but returns the estimate only
3582    if it fits to HOST_WIDE_INT.  If this is not the case, or the estimate
3583    on the number of iterations of LOOP could not be derived, returns -1.  */
3584
3585 HOST_WIDE_INT
3586 max_loop_iterations_int (struct loop *loop)
3587 {
3588   widest_int nit;
3589   HOST_WIDE_INT hwi_nit;
3590
3591   if (!max_loop_iterations (loop, &nit))
3592     return -1;
3593
3594   if (!wi::fits_shwi_p (nit))
3595     return -1;
3596   hwi_nit = nit.to_shwi ();
3597
3598   return hwi_nit < 0 ? -1 : hwi_nit;
3599 }
3600
3601 /* Returns an estimate for the number of executions of statements
3602    in the LOOP.  For statements before the loop exit, this exceeds
3603    the number of execution of the latch by one.  */
3604
3605 HOST_WIDE_INT
3606 estimated_stmt_executions_int (struct loop *loop)
3607 {
3608   HOST_WIDE_INT nit = estimated_loop_iterations_int (loop);
3609   HOST_WIDE_INT snit;
3610
3611   if (nit == -1)
3612     return -1;
3613
3614   snit = (HOST_WIDE_INT) ((unsigned HOST_WIDE_INT) nit + 1);
3615
3616   /* If the computation overflows, return -1.  */
3617   return snit < 0 ? -1 : snit;
3618 }
3619
3620 /* Sets NIT to the estimated maximum number of executions of the latch of the
3621    LOOP, plus one.  If we have no reliable estimate, the function returns
3622    false, otherwise returns true.  */
3623
3624 bool
3625 max_stmt_executions (struct loop *loop, widest_int *nit)
3626 {
3627   widest_int nit_minus_one;
3628
3629   if (!max_loop_iterations (loop, nit))
3630     return false;
3631
3632   nit_minus_one = *nit;
3633
3634   *nit += 1;
3635
3636   return wi::gtu_p (*nit, nit_minus_one);
3637 }
3638
3639 /* Sets NIT to the estimated number of executions of the latch of the
3640    LOOP, plus one.  If we have no reliable estimate, the function returns
3641    false, otherwise returns true.  */
3642
3643 bool
3644 estimated_stmt_executions (struct loop *loop, widest_int *nit)
3645 {
3646   widest_int nit_minus_one;
3647
3648   if (!estimated_loop_iterations (loop, nit))
3649     return false;
3650
3651   nit_minus_one = *nit;
3652
3653   *nit += 1;
3654
3655   return wi::gtu_p (*nit, nit_minus_one);
3656 }
3657
3658 /* Records estimates on numbers of iterations of loops.  */
3659
3660 void
3661 estimate_numbers_of_iterations (void)
3662 {
3663   struct loop *loop;
3664
3665   /* We don't want to issue signed overflow warnings while getting
3666      loop iteration estimates.  */
3667   fold_defer_overflow_warnings ();
3668
3669   FOR_EACH_LOOP (loop, 0)
3670     {
3671       estimate_numbers_of_iterations_loop (loop);
3672     }
3673
3674   fold_undefer_and_ignore_overflow_warnings ();
3675 }
3676
3677 /* Returns true if statement S1 dominates statement S2.  */
3678
3679 bool
3680 stmt_dominates_stmt_p (gimple s1, gimple s2)
3681 {
3682   basic_block bb1 = gimple_bb (s1), bb2 = gimple_bb (s2);
3683
3684   if (!bb1
3685       || s1 == s2)
3686     return true;
3687
3688   if (bb1 == bb2)
3689     {
3690       gimple_stmt_iterator bsi;
3691
3692       if (gimple_code (s2) == GIMPLE_PHI)
3693         return false;
3694
3695       if (gimple_code (s1) == GIMPLE_PHI)
3696         return true;
3697
3698       for (bsi = gsi_start_bb (bb1); gsi_stmt (bsi) != s2; gsi_next (&bsi))
3699         if (gsi_stmt (bsi) == s1)
3700           return true;
3701
3702       return false;
3703     }
3704
3705   return dominated_by_p (CDI_DOMINATORS, bb2, bb1);
3706 }
3707
3708 /* Returns true when we can prove that the number of executions of
3709    STMT in the loop is at most NITER, according to the bound on
3710    the number of executions of the statement NITER_BOUND->stmt recorded in
3711    NITER_BOUND and fact that NITER_BOUND->stmt dominate STMT.
3712
3713    ??? This code can become quite a CPU hog - we can have many bounds,
3714    and large basic block forcing stmt_dominates_stmt_p to be queried
3715    many times on a large basic blocks, so the whole thing is O(n^2)
3716    for scev_probably_wraps_p invocation (that can be done n times).
3717
3718    It would make more sense (and give better answers) to remember BB
3719    bounds computed by discover_iteration_bound_by_body_walk.  */
3720
3721 static bool
3722 n_of_executions_at_most (gimple stmt,
3723                          struct nb_iter_bound *niter_bound,
3724                          tree niter)
3725 {
3726   widest_int bound = niter_bound->bound;
3727   tree nit_type = TREE_TYPE (niter), e;
3728   enum tree_code cmp;
3729
3730   gcc_assert (TYPE_UNSIGNED (nit_type));
3731
3732   /* If the bound does not even fit into NIT_TYPE, it cannot tell us that
3733      the number of iterations is small.  */
3734   if (!wi::fits_to_tree_p (bound, nit_type))
3735     return false;
3736
3737   /* We know that NITER_BOUND->stmt is executed at most NITER_BOUND->bound + 1
3738      times.  This means that:
3739
3740      -- if NITER_BOUND->is_exit is true, then everything after
3741         it at most NITER_BOUND->bound times.
3742
3743      -- If NITER_BOUND->is_exit is false, then if we can prove that when STMT
3744         is executed, then NITER_BOUND->stmt is executed as well in the same
3745         iteration then STMT is executed at most NITER_BOUND->bound + 1 times.
3746
3747         If we can determine that NITER_BOUND->stmt is always executed
3748         after STMT, then STMT is executed at most NITER_BOUND->bound + 2 times.
3749         We conclude that if both statements belong to the same
3750         basic block and STMT is before NITER_BOUND->stmt and there are no
3751         statements with side effects in between.  */
3752
3753   if (niter_bound->is_exit)
3754     {
3755       if (stmt == niter_bound->stmt
3756           || !stmt_dominates_stmt_p (niter_bound->stmt, stmt))
3757         return false;
3758       cmp = GE_EXPR;
3759     }
3760   else
3761     {
3762       if (!stmt_dominates_stmt_p (niter_bound->stmt, stmt))
3763         {
3764           gimple_stmt_iterator bsi;
3765           if (gimple_bb (stmt) != gimple_bb (niter_bound->stmt)
3766               || gimple_code (stmt) == GIMPLE_PHI
3767               || gimple_code (niter_bound->stmt) == GIMPLE_PHI)
3768             return false;
3769
3770           /* By stmt_dominates_stmt_p we already know that STMT appears
3771              before NITER_BOUND->STMT.  Still need to test that the loop
3772              can not be terinated by a side effect in between.  */
3773           for (bsi = gsi_for_stmt (stmt); gsi_stmt (bsi) != niter_bound->stmt;
3774                gsi_next (&bsi))
3775             if (gimple_has_side_effects (gsi_stmt (bsi)))
3776                return false;
3777           bound += 1;
3778           if (bound == 0
3779               || !wi::fits_to_tree_p (bound, nit_type))
3780             return false;
3781         }
3782       cmp = GT_EXPR;
3783     }
3784
3785   e = fold_binary (cmp, boolean_type_node,
3786                    niter, wide_int_to_tree (nit_type, bound));
3787   return e && integer_nonzerop (e);
3788 }
3789
3790 /* Returns true if the arithmetics in TYPE can be assumed not to wrap.  */
3791
3792 bool
3793 nowrap_type_p (tree type)
3794 {
3795   if (INTEGRAL_TYPE_P (type)
3796       && TYPE_OVERFLOW_UNDEFINED (type))
3797     return true;
3798
3799   if (POINTER_TYPE_P (type))
3800     return true;
3801
3802   return false;
3803 }
3804
3805 /* Return true if we can prove LOOP is exited before evolution of induction
3806    variabled {BASE, STEP} overflows with respect to its type bound.  */
3807
3808 static bool
3809 loop_exits_before_overflow (tree base, tree step,
3810                             gimple at_stmt, struct loop *loop)
3811 {
3812   widest_int niter;
3813   struct control_iv *civ;
3814   struct nb_iter_bound *bound;
3815   tree e, delta, step_abs, unsigned_base;
3816   tree type = TREE_TYPE (step);
3817   tree unsigned_type, valid_niter;
3818
3819   /* Don't issue signed overflow warnings.  */
3820   fold_defer_overflow_warnings ();
3821
3822   /* Compute the number of iterations before we reach the bound of the
3823      type, and verify that the loop is exited before this occurs.  */
3824   unsigned_type = unsigned_type_for (type);
3825   unsigned_base = fold_convert (unsigned_type, base);
3826
3827   if (tree_int_cst_sign_bit (step))
3828     {
3829       tree extreme = fold_convert (unsigned_type,
3830                                    lower_bound_in_type (type, type));
3831       delta = fold_build2 (MINUS_EXPR, unsigned_type, unsigned_base, extreme);
3832       step_abs = fold_build1 (NEGATE_EXPR, unsigned_type,
3833                               fold_convert (unsigned_type, step));
3834     }
3835   else
3836     {
3837       tree extreme = fold_convert (unsigned_type,
3838                                    upper_bound_in_type (type, type));
3839       delta = fold_build2 (MINUS_EXPR, unsigned_type, extreme, unsigned_base);
3840       step_abs = fold_convert (unsigned_type, step);
3841     }
3842
3843   valid_niter = fold_build2 (FLOOR_DIV_EXPR, unsigned_type, delta, step_abs);
3844
3845   estimate_numbers_of_iterations_loop (loop);
3846
3847   if (max_loop_iterations (loop, &niter)
3848       && wi::fits_to_tree_p (niter, TREE_TYPE (valid_niter))
3849       && (e = fold_binary (GT_EXPR, boolean_type_node, valid_niter,
3850                            wide_int_to_tree (TREE_TYPE (valid_niter),
3851                                              niter))) != NULL
3852       && integer_nonzerop (e))
3853     {
3854       fold_undefer_and_ignore_overflow_warnings ();
3855       return true;
3856     }
3857   if (at_stmt)
3858     for (bound = loop->bounds; bound; bound = bound->next)
3859       {
3860         if (n_of_executions_at_most (at_stmt, bound, valid_niter))
3861           {
3862             fold_undefer_and_ignore_overflow_warnings ();
3863             return true;
3864           }
3865       }
3866   fold_undefer_and_ignore_overflow_warnings ();
3867
3868   /* Try to prove loop is exited before {base, step} overflows with the
3869      help of analyzed loop control IV.  This is done only for IVs with
3870      constant step because otherwise we don't have the information.  */
3871   if (TREE_CODE (step) == INTEGER_CST)
3872     for (civ = loop->control_ivs; civ; civ = civ->next)
3873       {
3874         enum tree_code code;
3875         tree stepped, extreme, civ_type = TREE_TYPE (civ->step);
3876
3877         /* Have to consider type difference because operand_equal_p ignores
3878            that for constants.  */
3879         if (TYPE_UNSIGNED (type) != TYPE_UNSIGNED (civ_type)
3880             || element_precision (type) != element_precision (civ_type))
3881           continue;
3882
3883         /* Only consider control IV with same step.  */
3884         if (!operand_equal_p (step, civ->step, 0))
3885           continue;
3886
3887         /* Done proving if this is a no-overflow control IV.  */
3888         if (operand_equal_p (base, civ->base, 0))
3889           return true;
3890
3891         /* If this is a before stepping control IV, in other words, we have
3892
3893              {civ_base, step} = {base + step, step}
3894
3895            Because civ {base + step, step} doesn't overflow during loop
3896            iterations, {base, step} will not overflow if we can prove the
3897            operation "base + step" does not overflow.  Specifically, we try
3898            to prove below conditions are satisfied:
3899
3900              base <= UPPER_BOUND (type) - step  ;;step > 0
3901              base >= LOWER_BOUND (type) - step  ;;step < 0
3902
3903            by proving the reverse conditions are false using loop's initial
3904            condition.  */
3905         stepped = fold_build2 (PLUS_EXPR, TREE_TYPE (base), base, step);
3906         if (operand_equal_p (stepped, civ->base, 0))
3907           {
3908             if (tree_int_cst_sign_bit (step))
3909               {
3910                 code = LT_EXPR;
3911                 extreme = lower_bound_in_type (type, type);
3912               }
3913             else
3914               {
3915                 code = GT_EXPR;
3916                 extreme = upper_bound_in_type (type, type);
3917               }
3918             extreme = fold_build2 (MINUS_EXPR, type, extreme, step);
3919             e = fold_build2 (code, boolean_type_node, base, extreme);
3920             e = simplify_using_initial_conditions (loop, e);
3921             if (integer_zerop (e))
3922               return true;
3923
3924             continue;
3925           }
3926
3927         /* Similar to above, only in this case we have:
3928
3929              {civ_base, step} = {(signed T)((unsigned T)base + step), step}
3930              && TREE_TYPE (civ_base) = signed T.
3931
3932            We prove that below condition is satisfied:
3933
3934              (signed T)((unsigned T)base + step)
3935                == (signed T)(unsigned T)base + step
3936                == base + step
3937
3938            because of exact the same reason as above.  This also proves
3939            there is no overflow in the operation "base + step", thus the
3940            induction variable {base, step} during loop iterations.
3941
3942            This is necessary to handle cases as below:
3943
3944              int foo (int *a, signed char s, signed char l)
3945                {
3946                  signed char i;
3947                  for (i = s; i < l; i++)
3948                    a[i] = 0;
3949                  return 0;
3950                }
3951
3952            The variable I is firstly converted to type unsigned char,
3953            incremented, then converted back to type signed char.  */
3954         if (!CONVERT_EXPR_P (civ->base) || TREE_TYPE (civ->base) != type)
3955           continue;
3956         e = TREE_OPERAND (civ->base, 0);
3957         if (TREE_CODE (e) != PLUS_EXPR
3958             || TREE_CODE (TREE_OPERAND (e, 1)) != INTEGER_CST
3959             || !operand_equal_p (step,
3960                                  fold_convert (type,
3961                                                TREE_OPERAND (e, 1)), 0))
3962           continue;
3963         e = TREE_OPERAND (e, 0);
3964         if (!CONVERT_EXPR_P (e) || !operand_equal_p (e, unsigned_base, 0))
3965           continue;
3966         e = TREE_OPERAND (e, 0);
3967         gcc_assert (operand_equal_p (e, base, 0));
3968         if (tree_int_cst_sign_bit (step))
3969           {
3970             code = LT_EXPR;
3971             extreme = lower_bound_in_type (type, type);
3972           }
3973         else
3974           {
3975             code = GT_EXPR;
3976             extreme = upper_bound_in_type (type, type);
3977           }
3978         extreme = fold_build2 (MINUS_EXPR, type, extreme, step);
3979         e = fold_build2 (code, boolean_type_node, base, extreme);
3980         e = simplify_using_initial_conditions (loop, e);
3981         if (integer_zerop (e))
3982           return true;
3983       }
3984
3985   return false;
3986 }
3987
3988 /* Return false only when the induction variable BASE + STEP * I is
3989    known to not overflow: i.e. when the number of iterations is small
3990    enough with respect to the step and initial condition in order to
3991    keep the evolution confined in TYPEs bounds.  Return true when the
3992    iv is known to overflow or when the property is not computable.
3993
3994    USE_OVERFLOW_SEMANTICS is true if this function should assume that
3995    the rules for overflow of the given language apply (e.g., that signed
3996    arithmetics in C does not overflow).  */
3997
3998 bool
3999 scev_probably_wraps_p (tree base, tree step,
4000                        gimple at_stmt, struct loop *loop,
4001                        bool use_overflow_semantics)
4002 {
4003   /* FIXME: We really need something like
4004      http://gcc.gnu.org/ml/gcc-patches/2005-06/msg02025.html.
4005
4006      We used to test for the following situation that frequently appears
4007      during address arithmetics:
4008
4009        D.1621_13 = (long unsigned intD.4) D.1620_12;
4010        D.1622_14 = D.1621_13 * 8;
4011        D.1623_15 = (doubleD.29 *) D.1622_14;
4012
4013      And derived that the sequence corresponding to D_14
4014      can be proved to not wrap because it is used for computing a
4015      memory access; however, this is not really the case -- for example,
4016      if D_12 = (unsigned char) [254,+,1], then D_14 has values
4017      2032, 2040, 0, 8, ..., but the code is still legal.  */
4018
4019   if (chrec_contains_undetermined (base)
4020       || chrec_contains_undetermined (step))
4021     return true;
4022
4023   if (integer_zerop (step))
4024     return false;
4025
4026   /* If we can use the fact that signed and pointer arithmetics does not
4027      wrap, we are done.  */
4028   if (use_overflow_semantics && nowrap_type_p (TREE_TYPE (base)))
4029     return false;
4030
4031   /* To be able to use estimates on number of iterations of the loop,
4032      we must have an upper bound on the absolute value of the step.  */
4033   if (TREE_CODE (step) != INTEGER_CST)
4034     return true;
4035
4036   if (loop_exits_before_overflow (base, step, at_stmt, loop))
4037     return false;
4038
4039   /* At this point we still don't have a proof that the iv does not
4040      overflow: give up.  */
4041   return true;
4042 }
4043
4044 /* Frees the information on upper bounds on numbers of iterations of LOOP.  */
4045
4046 void
4047 free_numbers_of_iterations_estimates_loop (struct loop *loop)
4048 {
4049   struct control_iv *civ;
4050   struct nb_iter_bound *bound;
4051
4052   loop->nb_iterations = NULL;
4053   loop->estimate_state = EST_NOT_COMPUTED;
4054   for (bound = loop->bounds; bound;)
4055     {
4056       struct nb_iter_bound *next = bound->next;
4057       ggc_free (bound);
4058       bound = next;
4059     }
4060   loop->bounds = NULL;
4061
4062   for (civ = loop->control_ivs; civ;)
4063     {
4064       struct control_iv *next = civ->next;
4065       ggc_free (civ);
4066       civ = next;
4067     }
4068   loop->control_ivs = NULL;
4069 }
4070
4071 /* Frees the information on upper bounds on numbers of iterations of loops.  */
4072
4073 void
4074 free_numbers_of_iterations_estimates (void)
4075 {
4076   struct loop *loop;
4077
4078   FOR_EACH_LOOP (loop, 0)
4079     {
4080       free_numbers_of_iterations_estimates_loop (loop);
4081     }
4082 }
4083
4084 /* Substitute value VAL for ssa name NAME inside expressions held
4085    at LOOP.  */
4086
4087 void
4088 substitute_in_loop_info (struct loop *loop, tree name, tree val)
4089 {
4090   loop->nb_iterations = simplify_replace_tree (loop->nb_iterations, name, val);
4091 }