gcc/loop-iv.c

   1 /* Rtl-level induction variable analysis.
   2    Copyright (C) 2004-2015 Free Software Foundation, Inc.
   3
   4 This file is part of GCC.
   5
   6 GCC is free software; you can redistribute it and/or modify it
   7 under the terms of the GNU General Public License as published by the
   8 Free Software Foundation; either version 3, or (at your option) any
   9 later version.
  10
  11 GCC is distributed in the hope that it will be useful, but WITHOUT
  12 ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  13 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  14 for more details.
  15
  16 You should have received a copy of the GNU General Public License
  17 along with GCC; see the file COPYING3.  If not see
  18 <http://www.gnu.org/licenses/>.  */
  19
  20 /* This is a simple analysis of induction variables of the loop.  The major use
  21    is for determining the number of iterations of a loop for loop unrolling,
  22    doloop optimization and branch prediction.  The iv information is computed
  23    on demand.
  24
  25    Induction variables are analyzed by walking the use-def chains.  When
  26    a basic induction variable (biv) is found, it is cached in the bivs
  27    hash table.  When register is proved to be a biv, its description
  28    is stored to DF_REF_DATA of the def reference.
  29
  30    The analysis works always with one loop -- you must call
  31    iv_analysis_loop_init (loop) for it.  All the other functions then work with
  32    this loop.   When you need to work with another loop, just call
  33    iv_analysis_loop_init for it.  When you no longer need iv analysis, call
  34    iv_analysis_done () to clean up the memory.
  35
  36    The available functions are:
  37
  38    iv_analyze (insn, reg, iv): Stores the description of the induction variable
  39      corresponding to the use of register REG in INSN to IV.  Returns true if
  40      REG is an induction variable in INSN. false otherwise.
  41      If use of REG is not found in INSN, following insns are scanned (so that
  42      we may call this function on insn returned by get_condition).
  43    iv_analyze_result (insn, def, iv):  Stores to IV the description of the iv
  44      corresponding to DEF, which is a register defined in INSN.
  45    iv_analyze_expr (insn, rhs, mode, iv):  Stores to IV the description of iv
  46      corresponding to expression EXPR evaluated at INSN.  All registers used bu
  47      EXPR must also be used in INSN.
  48 */
  49
  50 #include "config.h"
  51 #include "system.h"
  52 #include "coretypes.h"
  53 #include "backend.h"
  54 #include "tree.h"
  55 #include "rtl.h"
  56 #include "df.h"
  57 #include "obstack.h"
  58 #include "cfgloop.h"
  59 #include "flags.h"
  60 #include "alias.h"
  61 #include "insn-config.h"
  62 #include "expmed.h"
  63 #include "dojump.h"
  64 #include "explow.h"
  65 #include "calls.h"
  66 #include "emit-rtl.h"
  67 #include "varasm.h"
  68 #include "stmt.h"
  69 #include "expr.h"
  70 #include "intl.h"
  71 #include "diagnostic-core.h"
  72 #include "dumpfile.h"
  73 #include "rtl-iter.h"
  74
  75 /* Possible return values of iv_get_reaching_def.  */
  76
  77 enum iv_grd_result
  78 {
  79   /* More than one reaching def, or reaching def that does not
  80      dominate the use.  */
  81   GRD_INVALID,
  82
  83   /* The use is trivial invariant of the loop, i.e. is not changed
  84      inside the loop.  */
  85   GRD_INVARIANT,
  86
  87   /* The use is reached by initial value and a value from the
  88      previous iteration.  */
  89   GRD_MAYBE_BIV,
  90
  91   /* The use has single dominating def.  */
  92   GRD_SINGLE_DOM
  93 };
  94
  95 /* Information about a biv.  */
  96
  97 struct biv_entry
  98 {
  99   unsigned regno;       /* The register of the biv.  */
 100   struct rtx_iv iv;     /* Value of the biv.  */
 101 };
 102
 103 static bool clean_slate = true;
 104
 105 static unsigned int iv_ref_table_size = 0;
 106
 107 /* Table of rtx_ivs indexed by the df_ref uid field.  */
 108 static struct rtx_iv ** iv_ref_table;
 109
 110 /* Induction variable stored at the reference.  */
 111 #define DF_REF_IV(REF) iv_ref_table[DF_REF_ID (REF)]
 112 #define DF_REF_IV_SET(REF, IV) iv_ref_table[DF_REF_ID (REF)] = (IV)
 113
 114 /* The current loop.  */
 115
 116 static struct loop *current_loop;
 117
 118 /* Hashtable helper.  */
 119
 120 struct biv_entry_hasher : free_ptr_hash <biv_entry>
 121 {
 122   typedef rtx_def *compare_type;
 123   static inline hashval_t hash (const biv_entry *);
 124   static inline bool equal (const biv_entry *, const rtx_def *);
 125 };
 126
 127 /* Returns hash value for biv B.  */
 128
 129 inline hashval_t
 130 biv_entry_hasher::hash (const biv_entry *b)
 131 {
 132   return b->regno;
 133 }
 134
 135 /* Compares biv B and register R.  */
 136
 137 inline bool
 138 biv_entry_hasher::equal (const biv_entry *b, const rtx_def *r)
 139 {
 140   return b->regno == REGNO (r);
 141 }
 142
 143 /* Bivs of the current loop.  */
 144
 145 static hash_table<biv_entry_hasher> *bivs;
 146
 147 static bool iv_analyze_op (rtx_insn *, rtx, struct rtx_iv *);
 148
 149 /* Return the RTX code corresponding to the IV extend code EXTEND.  */
 150 static inline enum rtx_code
 151 iv_extend_to_rtx_code (enum iv_extend_code extend)
 152 {
 153   switch (extend)
 154     {
 155     case IV_SIGN_EXTEND:
 156       return SIGN_EXTEND;
 157     case IV_ZERO_EXTEND:
 158       return ZERO_EXTEND;
 159     case IV_UNKNOWN_EXTEND:
 160       return UNKNOWN;
 161     }
 162   gcc_unreachable ();
 163 }
 164
 165 /* Dumps information about IV to FILE.  */
 166
 167 extern void dump_iv_info (FILE *, struct rtx_iv *);
 168 void
 169 dump_iv_info (FILE *file, struct rtx_iv *iv)
 170 {
 171   if (!iv->base)
 172     {
 173       fprintf (file, "not simple");
 174       return;
 175     }
 176
 177   if (iv->step == const0_rtx
 178       && !iv->first_special)
 179     fprintf (file, "invariant ");
 180
 181   print_rtl (file, iv->base);
 182   if (iv->step != const0_rtx)
 183     {
 184       fprintf (file, " + ");
 185       print_rtl (file, iv->step);
 186       fprintf (file, " * iteration");
 187     }
 188   fprintf (file, " (in %s)", GET_MODE_NAME (iv->mode));
 189
 190   if (iv->mode != iv->extend_mode)
 191     fprintf (file, " %s to %s",
 192              rtx_name[iv_extend_to_rtx_code (iv->extend)],
 193              GET_MODE_NAME (iv->extend_mode));
 194
 195   if (iv->mult != const1_rtx)
 196     {
 197       fprintf (file, " * ");
 198       print_rtl (file, iv->mult);
 199     }
 200   if (iv->delta != const0_rtx)
 201     {
 202       fprintf (file, " + ");
 203       print_rtl (file, iv->delta);
 204     }
 205   if (iv->first_special)
 206     fprintf (file, " (first special)");
 207 }
 208
 209 /* Generates a subreg to get the least significant part of EXPR (in mode
 210    INNER_MODE) to OUTER_MODE.  */
 211
 212 rtx
 213 lowpart_subreg (machine_mode outer_mode, rtx expr,
 214                 machine_mode inner_mode)
 215 {
 216   return simplify_gen_subreg (outer_mode, expr, inner_mode,
 217                               subreg_lowpart_offset (outer_mode, inner_mode));
 218 }
 219
 220 static void
 221 check_iv_ref_table_size (void)
 222 {
 223   if (iv_ref_table_size < DF_DEFS_TABLE_SIZE ())
 224     {
 225       unsigned int new_size = DF_DEFS_TABLE_SIZE () + (DF_DEFS_TABLE_SIZE () / 4);
 226       iv_ref_table = XRESIZEVEC (struct rtx_iv *, iv_ref_table, new_size);
 227       memset (&iv_ref_table[iv_ref_table_size], 0,
 228               (new_size - iv_ref_table_size) * sizeof (struct rtx_iv *));
 229       iv_ref_table_size = new_size;
 230     }
 231 }
 232
 233
 234 /* Checks whether REG is a well-behaved register.  */
 235
 236 static bool
 237 simple_reg_p (rtx reg)
 238 {
 239   unsigned r;
 240
 241   if (GET_CODE (reg) == SUBREG)
 242     {
 243       if (!subreg_lowpart_p (reg))
 244         return false;
 245       reg = SUBREG_REG (reg);
 246     }
 247
 248   if (!REG_P (reg))
 249     return false;
 250
 251   r = REGNO (reg);
 252   if (HARD_REGISTER_NUM_P (r))
 253     return false;
 254
 255   if (GET_MODE_CLASS (GET_MODE (reg)) != MODE_INT)
 256     return false;
 257
 258   return true;
 259 }
 260
 261 /* Clears the information about ivs stored in df.  */
 262
 263 static void
 264 clear_iv_info (void)
 265 {
 266   unsigned i, n_defs = DF_DEFS_TABLE_SIZE ();
 267   struct rtx_iv *iv;
 268
 269   check_iv_ref_table_size ();
 270   for (i = 0; i < n_defs; i++)
 271     {
 272       iv = iv_ref_table[i];
 273       if (iv)
 274         {
 275           free (iv);
 276           iv_ref_table[i] = NULL;
 277         }
 278     }
 279
 280   bivs->empty ();
 281 }
 282
 283
 284 /* Prepare the data for an induction variable analysis of a LOOP.  */
 285
 286 void
 287 iv_analysis_loop_init (struct loop *loop)
 288 {
 289   current_loop = loop;
 290
 291   /* Clear the information from the analysis of the previous loop.  */
 292   if (clean_slate)
 293     {
 294       df_set_flags (DF_EQ_NOTES + DF_DEFER_INSN_RESCAN);
 295       bivs = new hash_table<biv_entry_hasher> (10);
 296       clean_slate = false;
 297     }
 298   else
 299     clear_iv_info ();
 300
 301   /* Get rid of the ud chains before processing the rescans.  Then add
 302      the problem back.  */
 303   df_remove_problem (df_chain);
 304   df_process_deferred_rescans ();
 305   df_set_flags (DF_RD_PRUNE_DEAD_DEFS);
 306   df_chain_add_problem (DF_UD_CHAIN);
 307   df_note_add_problem ();
 308   df_analyze_loop (loop);
 309   if (dump_file)
 310     df_dump_region (dump_file);
 311
 312   check_iv_ref_table_size ();
 313 }
 314
 315 /* Finds the definition of REG that dominates loop latch and stores
 316    it to DEF.  Returns false if there is not a single definition
 317    dominating the latch.  If REG has no definition in loop, DEF
 318    is set to NULL and true is returned.  */
 319
 320 static bool
 321 latch_dominating_def (rtx reg, df_ref *def)
 322 {
 323   df_ref single_rd = NULL, adef;
 324   unsigned regno = REGNO (reg);
 325   struct df_rd_bb_info *bb_info = DF_RD_BB_INFO (current_loop->latch);
 326
 327   for (adef = DF_REG_DEF_CHAIN (regno); adef; adef = DF_REF_NEXT_REG (adef))
 328     {
 329       if (!bitmap_bit_p (df->blocks_to_analyze, DF_REF_BBNO (adef))
 330           || !bitmap_bit_p (&bb_info->out, DF_REF_ID (adef)))
 331         continue;
 332
 333       /* More than one reaching definition.  */
 334       if (single_rd)
 335         return false;
 336
 337       if (!just_once_each_iteration_p (current_loop, DF_REF_BB (adef)))
 338         return false;
 339
 340       single_rd = adef;
 341     }
 342
 343   *def = single_rd;
 344   return true;
 345 }
 346
 347 /* Gets definition of REG reaching its use in INSN and stores it to DEF.  */
 348
 349 static enum iv_grd_result
 350 iv_get_reaching_def (rtx_insn *insn, rtx reg, df_ref *def)
 351 {
 352   df_ref use, adef;
 353   basic_block def_bb, use_bb;
 354   rtx_insn *def_insn;
 355   bool dom_p;
 356
 357   *def = NULL;
 358   if (!simple_reg_p (reg))
 359     return GRD_INVALID;
 360   if (GET_CODE (reg) == SUBREG)
 361     reg = SUBREG_REG (reg);
 362   gcc_assert (REG_P (reg));
 363
 364   use = df_find_use (insn, reg);
 365   gcc_assert (use != NULL);
 366
 367   if (!DF_REF_CHAIN (use))
 368     return GRD_INVARIANT;
 369
 370   /* More than one reaching def.  */
 371   if (DF_REF_CHAIN (use)->next)
 372     return GRD_INVALID;
 373
 374   adef = DF_REF_CHAIN (use)->ref;
 375
 376   /* We do not handle setting only part of the register.  */
 377   if (DF_REF_FLAGS (adef) & DF_REF_READ_WRITE)
 378     return GRD_INVALID;
 379
 380   def_insn = DF_REF_INSN (adef);
 381   def_bb = DF_REF_BB (adef);
 382   use_bb = BLOCK_FOR_INSN (insn);
 383
 384   if (use_bb == def_bb)
 385     dom_p = (DF_INSN_LUID (def_insn) < DF_INSN_LUID (insn));
 386   else
 387     dom_p = dominated_by_p (CDI_DOMINATORS, use_bb, def_bb);
 388
 389   if (dom_p)
 390     {
 391       *def = adef;
 392       return GRD_SINGLE_DOM;
 393     }
 394
 395   /* The definition does not dominate the use.  This is still OK if
 396      this may be a use of a biv, i.e. if the def_bb dominates loop
 397      latch.  */
 398   if (just_once_each_iteration_p (current_loop, def_bb))
 399     return GRD_MAYBE_BIV;
 400
 401   return GRD_INVALID;
 402 }
 403
 404 /* Sets IV to invariant CST in MODE.  Always returns true (just for
 405    consistency with other iv manipulation functions that may fail).  */
 406
 407 static bool
 408 iv_constant (struct rtx_iv *iv, rtx cst, machine_mode mode)
 409 {
 410   if (mode == VOIDmode)
 411     mode = GET_MODE (cst);
 412
 413   iv->mode = mode;
 414   iv->base = cst;
 415   iv->step = const0_rtx;
 416   iv->first_special = false;
 417   iv->extend = IV_UNKNOWN_EXTEND;
 418   iv->extend_mode = iv->mode;
 419   iv->delta = const0_rtx;
 420   iv->mult = const1_rtx;
 421
 422   return true;
 423 }
 424
 425 /* Evaluates application of subreg to MODE on IV.  */
 426
 427 static bool
 428 iv_subreg (struct rtx_iv *iv, machine_mode mode)
 429 {
 430   /* If iv is invariant, just calculate the new value.  */
 431   if (iv->step == const0_rtx
 432       && !iv->first_special)
 433     {
 434       rtx val = get_iv_value (iv, const0_rtx);
 435       val = lowpart_subreg (mode, val,
 436                             iv->extend == IV_UNKNOWN_EXTEND
 437                             ? iv->mode : iv->extend_mode);
 438
 439       iv->base = val;
 440       iv->extend = IV_UNKNOWN_EXTEND;
 441       iv->mode = iv->extend_mode = mode;
 442       iv->delta = const0_rtx;
 443       iv->mult = const1_rtx;
 444       return true;
 445     }
 446
 447   if (iv->extend_mode == mode)
 448     return true;
 449
 450   if (GET_MODE_BITSIZE (mode) > GET_MODE_BITSIZE (iv->mode))
 451     return false;
 452
 453   iv->extend = IV_UNKNOWN_EXTEND;
 454   iv->mode = mode;
 455
 456   iv->base = simplify_gen_binary (PLUS, iv->extend_mode, iv->delta,
 457                                   simplify_gen_binary (MULT, iv->extend_mode,
 458                                                        iv->base, iv->mult));
 459   iv->step = simplify_gen_binary (MULT, iv->extend_mode, iv->step, iv->mult);
 460   iv->mult = const1_rtx;
 461   iv->delta = const0_rtx;
 462   iv->first_special = false;
 463
 464   return true;
 465 }
 466
 467 /* Evaluates application of EXTEND to MODE on IV.  */
 468
 469 static bool
 470 iv_extend (struct rtx_iv *iv, enum iv_extend_code extend, machine_mode mode)
 471 {
 472   /* If iv is invariant, just calculate the new value.  */
 473   if (iv->step == const0_rtx
 474       && !iv->first_special)
 475     {
 476       rtx val = get_iv_value (iv, const0_rtx);
 477       if (iv->extend_mode != iv->mode
 478           && iv->extend != IV_UNKNOWN_EXTEND
 479           && iv->extend != extend)
 480         val = lowpart_subreg (iv->mode, val, iv->extend_mode);
 481       val = simplify_gen_unary (iv_extend_to_rtx_code (extend), mode,
 482                                 val,
 483                                 iv->extend == extend
 484                                 ? iv->extend_mode : iv->mode);
 485       iv->base = val;
 486       iv->extend = IV_UNKNOWN_EXTEND;
 487       iv->mode = iv->extend_mode = mode;
 488       iv->delta = const0_rtx;
 489       iv->mult = const1_rtx;
 490       return true;
 491     }
 492
 493   if (mode != iv->extend_mode)
 494     return false;
 495
 496   if (iv->extend != IV_UNKNOWN_EXTEND
 497       && iv->extend != extend)
 498     return false;
 499
 500   iv->extend = extend;
 501
 502   return true;
 503 }
 504
 505 /* Evaluates negation of IV.  */
 506
 507 static bool
 508 iv_neg (struct rtx_iv *iv)
 509 {
 510   if (iv->extend == IV_UNKNOWN_EXTEND)
 511     {
 512       iv->base = simplify_gen_unary (NEG, iv->extend_mode,
 513                                      iv->base, iv->extend_mode);
 514       iv->step = simplify_gen_unary (NEG, iv->extend_mode,
 515                                      iv->step, iv->extend_mode);
 516     }
 517   else
 518     {
 519       iv->delta = simplify_gen_unary (NEG, iv->extend_mode,
 520                                       iv->delta, iv->extend_mode);
 521       iv->mult = simplify_gen_unary (NEG, iv->extend_mode,
 522                                      iv->mult, iv->extend_mode);
 523     }
 524
 525   return true;
 526 }
 527
 528 /* Evaluates addition or subtraction (according to OP) of IV1 to IV0.  */
 529
 530 static bool
 531 iv_add (struct rtx_iv *iv0, struct rtx_iv *iv1, enum rtx_code op)
 532 {
 533   machine_mode mode;
 534   rtx arg;
 535
 536   /* Extend the constant to extend_mode of the other operand if necessary.  */
 537   if (iv0->extend == IV_UNKNOWN_EXTEND
 538       && iv0->mode == iv0->extend_mode
 539       && iv0->step == const0_rtx
 540       && GET_MODE_SIZE (iv0->extend_mode) < GET_MODE_SIZE (iv1->extend_mode))
 541     {
 542       iv0->extend_mode = iv1->extend_mode;
 543       iv0->base = simplify_gen_unary (ZERO_EXTEND, iv0->extend_mode,
 544                                       iv0->base, iv0->mode);
 545     }
 546   if (iv1->extend == IV_UNKNOWN_EXTEND
 547       && iv1->mode == iv1->extend_mode
 548       && iv1->step == const0_rtx
 549       && GET_MODE_SIZE (iv1->extend_mode) < GET_MODE_SIZE (iv0->extend_mode))
 550     {
 551       iv1->extend_mode = iv0->extend_mode;
 552       iv1->base = simplify_gen_unary (ZERO_EXTEND, iv1->extend_mode,
 553                                       iv1->base, iv1->mode);
 554     }
 555
 556   mode = iv0->extend_mode;
 557   if (mode != iv1->extend_mode)
 558     return false;
 559
 560   if (iv0->extend == IV_UNKNOWN_EXTEND
 561       && iv1->extend == IV_UNKNOWN_EXTEND)
 562     {
 563       if (iv0->mode != iv1->mode)
 564         return false;
 565
 566       iv0->base = simplify_gen_binary (op, mode, iv0->base, iv1->base);
 567       iv0->step = simplify_gen_binary (op, mode, iv0->step, iv1->step);
 568
 569       return true;
 570     }
 571
 572   /* Handle addition of constant.  */
 573   if (iv1->extend == IV_UNKNOWN_EXTEND
 574       && iv1->mode == mode
 575       && iv1->step == const0_rtx)
 576     {
 577       iv0->delta = simplify_gen_binary (op, mode, iv0->delta, iv1->base);
 578       return true;
 579     }
 580
 581   if (iv0->extend == IV_UNKNOWN_EXTEND
 582       && iv0->mode == mode
 583       && iv0->step == const0_rtx)
 584     {
 585       arg = iv0->base;
 586       *iv0 = *iv1;
 587       if (op == MINUS
 588           && !iv_neg (iv0))
 589         return false;
 590
 591       iv0->delta = simplify_gen_binary (PLUS, mode, iv0->delta, arg);
 592       return true;
 593     }
 594
 595   return false;
 596 }
 597
 598 /* Evaluates multiplication of IV by constant CST.  */
 599
 600 static bool
 601 iv_mult (struct rtx_iv *iv, rtx mby)
 602 {
 603   machine_mode mode = iv->extend_mode;
 604
 605   if (GET_MODE (mby) != VOIDmode
 606       && GET_MODE (mby) != mode)
 607     return false;
 608
 609   if (iv->extend == IV_UNKNOWN_EXTEND)
 610     {
 611       iv->base = simplify_gen_binary (MULT, mode, iv->base, mby);
 612       iv->step = simplify_gen_binary (MULT, mode, iv->step, mby);
 613     }
 614   else
 615     {
 616       iv->delta = simplify_gen_binary (MULT, mode, iv->delta, mby);
 617       iv->mult = simplify_gen_binary (MULT, mode, iv->mult, mby);
 618     }
 619
 620   return true;
 621 }
 622
 623 /* Evaluates shift of IV by constant CST.  */
 624
 625 static bool
 626 iv_shift (struct rtx_iv *iv, rtx mby)
 627 {
 628   machine_mode mode = iv->extend_mode;
 629
 630   if (GET_MODE (mby) != VOIDmode
 631       && GET_MODE (mby) != mode)
 632     return false;
 633
 634   if (iv->extend == IV_UNKNOWN_EXTEND)
 635     {
 636       iv->base = simplify_gen_binary (ASHIFT, mode, iv->base, mby);
 637       iv->step = simplify_gen_binary (ASHIFT, mode, iv->step, mby);
 638     }
 639   else
 640     {
 641       iv->delta = simplify_gen_binary (ASHIFT, mode, iv->delta, mby);
 642       iv->mult = simplify_gen_binary (ASHIFT, mode, iv->mult, mby);
 643     }
 644
 645   return true;
 646 }
 647
 648 /* The recursive part of get_biv_step.  Gets the value of the single value
 649    defined by DEF wrto initial value of REG inside loop, in shape described
 650    at get_biv_step.  */
 651
 652 static bool
 653 get_biv_step_1 (df_ref def, rtx reg,
 654                 rtx *inner_step, machine_mode *inner_mode,
 655                 enum iv_extend_code *extend, machine_mode outer_mode,
 656                 rtx *outer_step)
 657 {
 658   rtx set, rhs, op0 = NULL_RTX, op1 = NULL_RTX;
 659   rtx next, nextr;
 660   enum rtx_code code;
 661   rtx_insn *insn = DF_REF_INSN (def);
 662   df_ref next_def;
 663   enum iv_grd_result res;
 664
 665   set = single_set (insn);
 666   if (!set)
 667     return false;
 668
 669   rhs = find_reg_equal_equiv_note (insn);
 670   if (rhs)
 671     rhs = XEXP (rhs, 0);
 672   else
 673     rhs = SET_SRC (set);
 674
 675   code = GET_CODE (rhs);
 676   switch (code)
 677     {
 678     case SUBREG:
 679     case REG:
 680       next = rhs;
 681       break;
 682
 683     case PLUS:
 684     case MINUS:
 685       op0 = XEXP (rhs, 0);
 686       op1 = XEXP (rhs, 1);
 687
 688       if (code == PLUS && CONSTANT_P (op0))
 689         std::swap (op0, op1);
 690
 691       if (!simple_reg_p (op0)
 692           || !CONSTANT_P (op1))
 693         return false;
 694
 695       if (GET_MODE (rhs) != outer_mode)
 696         {
 697           /* ppc64 uses expressions like
 698
 699              (set x:SI (plus:SI (subreg:SI y:DI) 1)).
 700
 701              this is equivalent to
 702
 703              (set x':DI (plus:DI y:DI 1))
 704              (set x:SI (subreg:SI (x':DI)).  */
 705           if (GET_CODE (op0) != SUBREG)
 706             return false;
 707           if (GET_MODE (SUBREG_REG (op0)) != outer_mode)
 708             return false;
 709         }
 710
 711       next = op0;
 712       break;
 713
 714     case SIGN_EXTEND:
 715     case ZERO_EXTEND:
 716       if (GET_MODE (rhs) != outer_mode)
 717         return false;
 718
 719       op0 = XEXP (rhs, 0);
 720       if (!simple_reg_p (op0))
 721         return false;
 722
 723       next = op0;
 724       break;
 725
 726     default:
 727       return false;
 728     }
 729
 730   if (GET_CODE (next) == SUBREG)
 731     {
 732       if (!subreg_lowpart_p (next))
 733         return false;
 734
 735       nextr = SUBREG_REG (next);
 736       if (GET_MODE (nextr) != outer_mode)
 737         return false;
 738     }
 739   else
 740     nextr = next;
 741
 742   res = iv_get_reaching_def (insn, nextr, &next_def);
 743
 744   if (res == GRD_INVALID || res == GRD_INVARIANT)
 745     return false;
 746
 747   if (res == GRD_MAYBE_BIV)
 748     {
 749       if (!rtx_equal_p (nextr, reg))
 750         return false;
 751
 752       *inner_step = const0_rtx;
 753       *extend = IV_UNKNOWN_EXTEND;
 754       *inner_mode = outer_mode;
 755       *outer_step = const0_rtx;
 756     }
 757   else if (!get_biv_step_1 (next_def, reg,
 758                             inner_step, inner_mode, extend, outer_mode,
 759                             outer_step))
 760     return false;
 761
 762   if (GET_CODE (next) == SUBREG)
 763     {
 764       machine_mode amode = GET_MODE (next);
 765
 766       if (GET_MODE_SIZE (amode) > GET_MODE_SIZE (*inner_mode))
 767         return false;
 768
 769       *inner_mode = amode;
 770       *inner_step = simplify_gen_binary (PLUS, outer_mode,
 771                                          *inner_step, *outer_step);
 772       *outer_step = const0_rtx;
 773       *extend = IV_UNKNOWN_EXTEND;
 774     }
 775
 776   switch (code)
 777     {
 778     case REG:
 779     case SUBREG:
 780       break;
 781
 782     case PLUS:
 783     case MINUS:
 784       if (*inner_mode == outer_mode
 785           /* See comment in previous switch.  */
 786           || GET_MODE (rhs) != outer_mode)
 787         *inner_step = simplify_gen_binary (code, outer_mode,
 788                                            *inner_step, op1);
 789       else
 790         *outer_step = simplify_gen_binary (code, outer_mode,
 791                                            *outer_step, op1);
 792       break;
 793
 794     case SIGN_EXTEND:
 795     case ZERO_EXTEND:
 796       gcc_assert (GET_MODE (op0) == *inner_mode
 797                   && *extend == IV_UNKNOWN_EXTEND
 798                   && *outer_step == const0_rtx);
 799
 800       *extend = (code == SIGN_EXTEND) ? IV_SIGN_EXTEND : IV_ZERO_EXTEND;
 801       break;
 802
 803     default:
 804       return false;
 805     }
 806
 807   return true;
 808 }
 809
 810 /* Gets the operation on register REG inside loop, in shape
 811
 812    OUTER_STEP + EXTEND_{OUTER_MODE} (SUBREG_{INNER_MODE} (REG + INNER_STEP))
 813
 814    If the operation cannot be described in this shape, return false.
 815    LAST_DEF is the definition of REG that dominates loop latch.  */
 816
 817 static bool
 818 get_biv_step (df_ref last_def, rtx reg, rtx *inner_step,
 819               machine_mode *inner_mode, enum iv_extend_code *extend,
 820               machine_mode *outer_mode, rtx *outer_step)
 821 {
 822   *outer_mode = GET_MODE (reg);
 823
 824   if (!get_biv_step_1 (last_def, reg,
 825                        inner_step, inner_mode, extend, *outer_mode,
 826                        outer_step))
 827     return false;
 828
 829   gcc_assert ((*inner_mode == *outer_mode) != (*extend != IV_UNKNOWN_EXTEND));
 830   gcc_assert (*inner_mode != *outer_mode || *outer_step == const0_rtx);
 831
 832   return true;
 833 }
 834
 835 /* Records information that DEF is induction variable IV.  */
 836
 837 static void
 838 record_iv (df_ref def, struct rtx_iv *iv)
 839 {
 840   struct rtx_iv *recorded_iv = XNEW (struct rtx_iv);
 841
 842   *recorded_iv = *iv;
 843   check_iv_ref_table_size ();
 844   DF_REF_IV_SET (def, recorded_iv);
 845 }
 846
 847 /* If DEF was already analyzed for bivness, store the description of the biv to
 848    IV and return true.  Otherwise return false.  */
 849
 850 static bool
 851 analyzed_for_bivness_p (rtx def, struct rtx_iv *iv)
 852 {
 853   struct biv_entry *biv = bivs->find_with_hash (def, REGNO (def));
 854
 855   if (!biv)
 856     return false;
 857
 858   *iv = biv->iv;
 859   return true;
 860 }
 861
 862 static void
 863 record_biv (rtx def, struct rtx_iv *iv)
 864 {
 865   struct biv_entry *biv = XNEW (struct biv_entry);
 866   biv_entry **slot = bivs->find_slot_with_hash (def, REGNO (def), INSERT);
 867
 868   biv->regno = REGNO (def);
 869   biv->iv = *iv;
 870   gcc_assert (!*slot);
 871   *slot = biv;
 872 }
 873
 874 /* Determines whether DEF is a biv and if so, stores its description
 875    to *IV.  */
 876
 877 static bool
 878 iv_analyze_biv (rtx def, struct rtx_iv *iv)
 879 {
 880   rtx inner_step, outer_step;
 881   machine_mode inner_mode, outer_mode;
 882   enum iv_extend_code extend;
 883   df_ref last_def;
 884
 885   if (dump_file)
 886     {
 887       fprintf (dump_file, "Analyzing ");
 888       print_rtl (dump_file, def);
 889       fprintf (dump_file, " for bivness.\n");
 890     }
 891
 892   if (!REG_P (def))
 893     {
 894       if (!CONSTANT_P (def))
 895         return false;
 896
 897       return iv_constant (iv, def, VOIDmode);
 898     }
 899
 900   if (!latch_dominating_def (def, &last_def))
 901     {
 902       if (dump_file)
 903         fprintf (dump_file, "  not simple.\n");
 904       return false;
 905     }
 906
 907   if (!last_def)
 908     return iv_constant (iv, def, VOIDmode);
 909
 910   if (analyzed_for_bivness_p (def, iv))
 911     {
 912       if (dump_file)
 913         fprintf (dump_file, "  already analysed.\n");
 914       return iv->base != NULL_RTX;
 915     }
 916
 917   if (!get_biv_step (last_def, def, &inner_step, &inner_mode, &extend,
 918                      &outer_mode, &outer_step))
 919     {
 920       iv->base = NULL_RTX;
 921       goto end;
 922     }
 923
 924   /* Loop transforms base to es (base + inner_step) + outer_step,
 925      where es means extend of subreg between inner_mode and outer_mode.
 926      The corresponding induction variable is
 927
 928      es ((base - outer_step) + i * (inner_step + outer_step)) + outer_step  */
 929
 930   iv->base = simplify_gen_binary (MINUS, outer_mode, def, outer_step);
 931   iv->step = simplify_gen_binary (PLUS, outer_mode, inner_step, outer_step);
 932   iv->mode = inner_mode;
 933   iv->extend_mode = outer_mode;
 934   iv->extend = extend;
 935   iv->mult = const1_rtx;
 936   iv->delta = outer_step;
 937   iv->first_special = inner_mode != outer_mode;
 938
 939  end:
 940   if (dump_file)
 941     {
 942       fprintf (dump_file, "  ");
 943       dump_iv_info (dump_file, iv);
 944       fprintf (dump_file, "\n");
 945     }
 946
 947   record_biv (def, iv);
 948   return iv->base != NULL_RTX;
 949 }
 950
 951 /* Analyzes expression RHS used at INSN and stores the result to *IV.
 952    The mode of the induction variable is MODE.  */
 953
 954 bool
 955 iv_analyze_expr (rtx_insn *insn, rtx rhs, machine_mode mode,
 956                  struct rtx_iv *iv)
 957 {
 958   rtx mby = NULL_RTX;
 959   rtx op0 = NULL_RTX, op1 = NULL_RTX;
 960   struct rtx_iv iv0, iv1;
 961   enum rtx_code code = GET_CODE (rhs);
 962   machine_mode omode = mode;
 963
 964   iv->mode = VOIDmode;
 965   iv->base = NULL_RTX;
 966   iv->step = NULL_RTX;
 967
 968   gcc_assert (GET_MODE (rhs) == mode || GET_MODE (rhs) == VOIDmode);
 969
 970   if (CONSTANT_P (rhs)
 971       || REG_P (rhs)
 972       || code == SUBREG)
 973     {
 974       if (!iv_analyze_op (insn, rhs, iv))
 975         return false;
 976
 977       if (iv->mode == VOIDmode)
 978         {
 979           iv->mode = mode;
 980           iv->extend_mode = mode;
 981         }
 982
 983       return true;
 984     }
 985
 986   switch (code)
 987     {
 988     case REG:
 989       op0 = rhs;
 990       break;
 991
 992     case SIGN_EXTEND:
 993     case ZERO_EXTEND:
 994     case NEG:
 995       op0 = XEXP (rhs, 0);
 996       omode = GET_MODE (op0);
 997       break;
 998
 999     case PLUS:
1000     case MINUS:
1001       op0 = XEXP (rhs, 0);
1002       op1 = XEXP (rhs, 1);
1003       break;
1004
1005     case MULT:
1006       op0 = XEXP (rhs, 0);
1007       mby = XEXP (rhs, 1);
1008       if (!CONSTANT_P (mby))
1009         std::swap (op0, mby);
1010       if (!CONSTANT_P (mby))
1011         return false;
1012       break;
1013
1014     case ASHIFT:
1015       op0 = XEXP (rhs, 0);
1016       mby = XEXP (rhs, 1);
1017       if (!CONSTANT_P (mby))
1018         return false;
1019       break;
1020
1021     default:
1022       return false;
1023     }
1024
1025   if (op0
1026       && !iv_analyze_expr (insn, op0, omode, &iv0))
1027     return false;
1028
1029   if (op1
1030       && !iv_analyze_expr (insn, op1, omode, &iv1))
1031     return false;
1032
1033   switch (code)
1034     {
1035     case SIGN_EXTEND:
1036       if (!iv_extend (&iv0, IV_SIGN_EXTEND, mode))
1037         return false;
1038       break;
1039
1040     case ZERO_EXTEND:
1041       if (!iv_extend (&iv0, IV_ZERO_EXTEND, mode))
1042         return false;
1043       break;
1044
1045     case NEG:
1046       if (!iv_neg (&iv0))
1047         return false;
1048       break;
1049
1050     case PLUS:
1051     case MINUS:
1052       if (!iv_add (&iv0, &iv1, code))
1053         return false;
1054       break;
1055
1056     case MULT:
1057       if (!iv_mult (&iv0, mby))
1058         return false;
1059       break;
1060
1061     case ASHIFT:
1062       if (!iv_shift (&iv0, mby))
1063         return false;
1064       break;
1065
1066     default:
1067       break;
1068     }
1069
1070   *iv = iv0;
1071   return iv->base != NULL_RTX;
1072 }
1073
1074 /* Analyzes iv DEF and stores the result to *IV.  */
1075
1076 static bool
1077 iv_analyze_def (df_ref def, struct rtx_iv *iv)
1078 {
1079   rtx_insn *insn = DF_REF_INSN (def);
1080   rtx reg = DF_REF_REG (def);
1081   rtx set, rhs;
1082
1083   if (dump_file)
1084     {
1085       fprintf (dump_file, "Analyzing def of ");
1086       print_rtl (dump_file, reg);
1087       fprintf (dump_file, " in insn ");
1088       print_rtl_single (dump_file, insn);
1089     }
1090
1091   check_iv_ref_table_size ();
1092   if (DF_REF_IV (def))
1093     {
1094       if (dump_file)
1095         fprintf (dump_file, "  already analysed.\n");
1096       *iv = *DF_REF_IV (def);
1097       return iv->base != NULL_RTX;
1098     }
1099
1100   iv->mode = VOIDmode;
1101   iv->base = NULL_RTX;
1102   iv->step = NULL_RTX;
1103
1104   if (!REG_P (reg))
1105     return false;
1106
1107   set = single_set (insn);
1108   if (!set)
1109     return false;
1110
1111   if (!REG_P (SET_DEST (set)))
1112     return false;
1113
1114   gcc_assert (SET_DEST (set) == reg);
1115   rhs = find_reg_equal_equiv_note (insn);
1116   if (rhs)
1117     rhs = XEXP (rhs, 0);
1118   else
1119     rhs = SET_SRC (set);
1120
1121   iv_analyze_expr (insn, rhs, GET_MODE (reg), iv);
1122   record_iv (def, iv);
1123
1124   if (dump_file)
1125     {
1126       print_rtl (dump_file, reg);
1127       fprintf (dump_file, " in insn ");
1128       print_rtl_single (dump_file, insn);
1129       fprintf (dump_file, "  is ");
1130       dump_iv_info (dump_file, iv);
1131       fprintf (dump_file, "\n");
1132     }
1133
1134   return iv->base != NULL_RTX;
1135 }
1136
1137 /* Analyzes operand OP of INSN and stores the result to *IV.  */
1138
1139 static bool
1140 iv_analyze_op (rtx_insn *insn, rtx op, struct rtx_iv *iv)
1141 {
1142   df_ref def = NULL;
1143   enum iv_grd_result res;
1144
1145   if (dump_file)
1146     {
1147       fprintf (dump_file, "Analyzing operand ");
1148       print_rtl (dump_file, op);
1149       fprintf (dump_file, " of insn ");
1150       print_rtl_single (dump_file, insn);
1151     }
1152
1153   if (function_invariant_p (op))
1154     res = GRD_INVARIANT;
1155   else if (GET_CODE (op) == SUBREG)
1156     {
1157       if (!subreg_lowpart_p (op))
1158         return false;
1159
1160       if (!iv_analyze_op (insn, SUBREG_REG (op), iv))
1161         return false;
1162
1163       return iv_subreg (iv, GET_MODE (op));
1164     }
1165   else
1166     {
1167       res = iv_get_reaching_def (insn, op, &def);
1168       if (res == GRD_INVALID)
1169         {
1170           if (dump_file)
1171             fprintf (dump_file, "  not simple.\n");
1172           return false;
1173         }
1174     }
1175
1176   if (res == GRD_INVARIANT)
1177     {
1178       iv_constant (iv, op, VOIDmode);
1179
1180       if (dump_file)
1181         {
1182           fprintf (dump_file, "  ");
1183           dump_iv_info (dump_file, iv);
1184           fprintf (dump_file, "\n");
1185         }
1186       return true;
1187     }
1188
1189   if (res == GRD_MAYBE_BIV)
1190     return iv_analyze_biv (op, iv);
1191
1192   return iv_analyze_def (def, iv);
1193 }
1194
1195 /* Analyzes value VAL at INSN and stores the result to *IV.  */
1196
1197 bool
1198 iv_analyze (rtx_insn *insn, rtx val, struct rtx_iv *iv)
1199 {
1200   rtx reg;
1201
1202   /* We must find the insn in that val is used, so that we get to UD chains.
1203      Since the function is sometimes called on result of get_condition,
1204      this does not necessarily have to be directly INSN; scan also the
1205      following insns.  */
1206   if (simple_reg_p (val))
1207     {
1208       if (GET_CODE (val) == SUBREG)
1209         reg = SUBREG_REG (val);
1210       else
1211         reg = val;
1212
1213       while (!df_find_use (insn, reg))
1214         insn = NEXT_INSN (insn);
1215     }
1216
1217   return iv_analyze_op (insn, val, iv);
1218 }
1219
1220 /* Analyzes definition of DEF in INSN and stores the result to IV.  */
1221
1222 bool
1223 iv_analyze_result (rtx_insn *insn, rtx def, struct rtx_iv *iv)
1224 {
1225   df_ref adef;
1226
1227   adef = df_find_def (insn, def);
1228   if (!adef)
1229     return false;
1230
1231   return iv_analyze_def (adef, iv);
1232 }
1233
1234 /* Checks whether definition of register REG in INSN is a basic induction
1235    variable.  IV analysis must have been initialized (via a call to
1236    iv_analysis_loop_init) for this function to produce a result.  */
1237
1238 bool
1239 biv_p (rtx_insn *insn, rtx reg)
1240 {
1241   struct rtx_iv iv;
1242   df_ref def, last_def;
1243
1244   if (!simple_reg_p (reg))
1245     return false;
1246
1247   def = df_find_def (insn, reg);
1248   gcc_assert (def != NULL);
1249   if (!latch_dominating_def (reg, &last_def))
1250     return false;
1251   if (last_def != def)
1252     return false;
1253
1254   if (!iv_analyze_biv (reg, &iv))
1255     return false;
1256
1257   return iv.step != const0_rtx;
1258 }
1259
1260 /* Calculates value of IV at ITERATION-th iteration.  */
1261
1262 rtx
1263 get_iv_value (struct rtx_iv *iv, rtx iteration)
1264 {
1265   rtx val;
1266
1267   /* We would need to generate some if_then_else patterns, and so far
1268      it is not needed anywhere.  */
1269   gcc_assert (!iv->first_special);
1270
1271   if (iv->step != const0_rtx && iteration != const0_rtx)
1272     val = simplify_gen_binary (PLUS, iv->extend_mode, iv->base,
1273                                simplify_gen_binary (MULT, iv->extend_mode,
1274                                                     iv->step, iteration));
1275   else
1276     val = iv->base;
1277
1278   if (iv->extend_mode == iv->mode)
1279     return val;
1280
1281   val = lowpart_subreg (iv->mode, val, iv->extend_mode);
1282
1283   if (iv->extend == IV_UNKNOWN_EXTEND)
1284     return val;
1285
1286   val = simplify_gen_unary (iv_extend_to_rtx_code (iv->extend),
1287                             iv->extend_mode, val, iv->mode);
1288   val = simplify_gen_binary (PLUS, iv->extend_mode, iv->delta,
1289                              simplify_gen_binary (MULT, iv->extend_mode,
1290                                                   iv->mult, val));
1291
1292   return val;
1293 }
1294
1295 /* Free the data for an induction variable analysis.  */
1296
1297 void
1298 iv_analysis_done (void)
1299 {
1300   if (!clean_slate)
1301     {
1302       clear_iv_info ();
1303       clean_slate = true;
1304       df_finish_pass (true);
1305       delete bivs;
1306       bivs = NULL;
1307       free (iv_ref_table);
1308       iv_ref_table = NULL;
1309       iv_ref_table_size = 0;
1310     }
1311 }
1312
1313 /* Computes inverse to X modulo (1 << MOD).  */
1314
1315 static uint64_t
1316 inverse (uint64_t x, int mod)
1317 {
1318   uint64_t mask =
1319           ((uint64_t) 1 << (mod - 1) << 1) - 1;
1320   uint64_t rslt = 1;
1321   int i;
1322
1323   for (i = 0; i < mod - 1; i++)
1324     {
1325       rslt = (rslt * x) & mask;
1326       x = (x * x) & mask;
1327     }
1328
1329   return rslt;
1330 }
1331
1332 /* Checks whether any register in X is in set ALT.  */
1333
1334 static bool
1335 altered_reg_used (const_rtx x, bitmap alt)
1336 {
1337   subrtx_iterator::array_type array;
1338   FOR_EACH_SUBRTX (iter, array, x, NONCONST)
1339     {
1340       const_rtx x = *iter;
1341       if (REG_P (x) && REGNO_REG_SET_P (alt, REGNO (x)))
1342         return true;
1343     }
1344   return false;
1345 }
1346
1347 /* Marks registers altered by EXPR in set ALT.  */
1348
1349 static void
1350 mark_altered (rtx expr, const_rtx by ATTRIBUTE_UNUSED, void *alt)
1351 {
1352   if (GET_CODE (expr) == SUBREG)
1353     expr = SUBREG_REG (expr);
1354   if (!REG_P (expr))
1355     return;
1356
1357   SET_REGNO_REG_SET ((bitmap) alt, REGNO (expr));
1358 }
1359
1360 /* Checks whether RHS is simple enough to process.  */
1361
1362 static bool
1363 simple_rhs_p (rtx rhs)
1364 {
1365   rtx op0, op1;
1366
1367   if (function_invariant_p (rhs)
1368       || (REG_P (rhs) && !HARD_REGISTER_P (rhs)))
1369     return true;
1370
1371   switch (GET_CODE (rhs))
1372     {
1373     case PLUS:
1374     case MINUS:
1375     case AND:
1376       op0 = XEXP (rhs, 0);
1377       op1 = XEXP (rhs, 1);
1378       /* Allow reg OP const and reg OP reg.  */
1379       if (!(REG_P (op0) && !HARD_REGISTER_P (op0))
1380           && !function_invariant_p (op0))
1381         return false;
1382       if (!(REG_P (op1) && !HARD_REGISTER_P (op1))
1383           && !function_invariant_p (op1))
1384         return false;
1385
1386       return true;
1387
1388     case ASHIFT:
1389     case ASHIFTRT:
1390     case LSHIFTRT:
1391     case MULT:
1392       op0 = XEXP (rhs, 0);
1393       op1 = XEXP (rhs, 1);
1394       /* Allow reg OP const.  */
1395       if (!(REG_P (op0) && !HARD_REGISTER_P (op0)))
1396         return false;
1397       if (!function_invariant_p (op1))
1398         return false;
1399
1400       return true;
1401
1402     default:
1403       return false;
1404     }
1405 }
1406
1407 /* If REGNO has a single definition, return its known value, otherwise return
1408    null.  */
1409
1410 static rtx
1411 find_single_def_src (unsigned int regno)
1412 {
1413   df_ref adef;
1414   rtx set, src;
1415
1416   for (;;)
1417     {
1418       rtx note;
1419       adef = DF_REG_DEF_CHAIN (regno);
1420       if (adef == NULL || DF_REF_NEXT_REG (adef) != NULL
1421           || DF_REF_IS_ARTIFICIAL (adef))
1422         return NULL_RTX;
1423
1424       set = single_set (DF_REF_INSN (adef));
1425       if (set == NULL || !REG_P (SET_DEST (set))
1426           || REGNO (SET_DEST (set)) != regno)
1427         return NULL_RTX;
1428
1429       note = find_reg_equal_equiv_note (DF_REF_INSN (adef));
1430
1431       if (note && function_invariant_p (XEXP (note, 0)))
1432         {
1433           src = XEXP (note, 0);
1434           break;
1435         }
1436       src = SET_SRC (set);
1437
1438       if (REG_P (src))
1439         {
1440           regno = REGNO (src);
1441           continue;
1442         }
1443       break;
1444     }
1445   if (!function_invariant_p (src))
1446     return NULL_RTX;
1447
1448   return src;
1449 }
1450
1451 /* If any registers in *EXPR that have a single definition, try to replace
1452    them with the known-equivalent values.  */
1453
1454 static void
1455 replace_single_def_regs (rtx *expr)
1456 {
1457   subrtx_var_iterator::array_type array;
1458  repeat:
1459   FOR_EACH_SUBRTX_VAR (iter, array, *expr, NONCONST)
1460     {
1461       rtx x = *iter;
1462       if (REG_P (x))
1463         if (rtx new_x = find_single_def_src (REGNO (x)))
1464           {
1465             *expr = simplify_replace_rtx (*expr, x, new_x);
1466             goto repeat;
1467           }
1468     }
1469 }
1470
1471 /* A subroutine of simplify_using_initial_values, this function examines INSN
1472    to see if it contains a suitable set that we can use to make a replacement.
1473    If it is suitable, return true and set DEST and SRC to the lhs and rhs of
1474    the set; return false otherwise.  */
1475
1476 static bool
1477 suitable_set_for_replacement (rtx_insn *insn, rtx *dest, rtx *src)
1478 {
1479   rtx set = single_set (insn);
1480   rtx lhs = NULL_RTX, rhs;
1481
1482   if (!set)
1483     return false;
1484
1485   lhs = SET_DEST (set);
1486   if (!REG_P (lhs))
1487     return false;
1488
1489   rhs = find_reg_equal_equiv_note (insn);
1490   if (rhs)
1491     rhs = XEXP (rhs, 0);
1492   else
1493     rhs = SET_SRC (set);
1494
1495   if (!simple_rhs_p (rhs))
1496     return false;
1497
1498   *dest = lhs;
1499   *src = rhs;
1500   return true;
1501 }
1502
1503 /* Using the data returned by suitable_set_for_replacement, replace DEST
1504    with SRC in *EXPR and return the new expression.  Also call
1505    replace_single_def_regs if the replacement changed something.  */
1506 static void
1507 replace_in_expr (rtx *expr, rtx dest, rtx src)
1508 {
1509   rtx old = *expr;
1510   *expr = simplify_replace_rtx (*expr, dest, src);
1511   if (old == *expr)
1512     return;
1513   replace_single_def_regs (expr);
1514 }
1515
1516 /* Checks whether A implies B.  */
1517
1518 static bool
1519 implies_p (rtx a, rtx b)
1520 {
1521   rtx op0, op1, opb0, opb1;
1522   machine_mode mode;
1523
1524   if (rtx_equal_p (a, b))
1525     return true;
1526
1527   if (GET_CODE (a) == EQ)
1528     {
1529       op0 = XEXP (a, 0);
1530       op1 = XEXP (a, 1);
1531
1532       if (REG_P (op0)
1533           || (GET_CODE (op0) == SUBREG
1534               && REG_P (SUBREG_REG (op0))))
1535         {
1536           rtx r = simplify_replace_rtx (b, op0, op1);
1537           if (r == const_true_rtx)
1538             return true;
1539         }
1540
1541       if (REG_P (op1)
1542           || (GET_CODE (op1) == SUBREG
1543               && REG_P (SUBREG_REG (op1))))
1544         {
1545           rtx r = simplify_replace_rtx (b, op1, op0);
1546           if (r == const_true_rtx)
1547             return true;
1548         }
1549     }
1550
1551   if (b == const_true_rtx)
1552     return true;
1553
1554   if ((GET_RTX_CLASS (GET_CODE (a)) != RTX_COMM_COMPARE
1555        && GET_RTX_CLASS (GET_CODE (a)) != RTX_COMPARE)
1556       || (GET_RTX_CLASS (GET_CODE (b)) != RTX_COMM_COMPARE
1557           && GET_RTX_CLASS (GET_CODE (b)) != RTX_COMPARE))
1558     return false;
1559
1560   op0 = XEXP (a, 0);
1561   op1 = XEXP (a, 1);
1562   opb0 = XEXP (b, 0);
1563   opb1 = XEXP (b, 1);
1564
1565   mode = GET_MODE (op0);
1566   if (mode != GET_MODE (opb0))
1567     mode = VOIDmode;
1568   else if (mode == VOIDmode)
1569     {
1570       mode = GET_MODE (op1);
1571       if (mode != GET_MODE (opb1))
1572         mode = VOIDmode;
1573     }
1574
1575   /* A < B implies A + 1 <= B.  */
1576   if ((GET_CODE (a) == GT || GET_CODE (a) == LT)
1577       && (GET_CODE (b) == GE || GET_CODE (b) == LE))
1578     {
1579
1580       if (GET_CODE (a) == GT)
1581         std::swap (op0, op1);
1582
1583       if (GET_CODE (b) == GE)
1584         std::swap (opb0, opb1);
1585
1586       if (SCALAR_INT_MODE_P (mode)
1587           && rtx_equal_p (op1, opb1)
1588           && simplify_gen_binary (MINUS, mode, opb0, op0) == const1_rtx)
1589         return true;
1590       return false;
1591     }
1592
1593   /* A < B or A > B imply A != B.  TODO: Likewise
1594      A + n < B implies A != B + n if neither wraps.  */
1595   if (GET_CODE (b) == NE
1596       && (GET_CODE (a) == GT || GET_CODE (a) == GTU
1597           || GET_CODE (a) == LT || GET_CODE (a) == LTU))
1598     {
1599       if (rtx_equal_p (op0, opb0)
1600           && rtx_equal_p (op1, opb1))
1601         return true;
1602     }
1603
1604   /* For unsigned comparisons, A != 0 implies A > 0 and A >= 1.  */
1605   if (GET_CODE (a) == NE
1606       && op1 == const0_rtx)
1607     {
1608       if ((GET_CODE (b) == GTU
1609            && opb1 == const0_rtx)
1610           || (GET_CODE (b) == GEU
1611               && opb1 == const1_rtx))
1612         return rtx_equal_p (op0, opb0);
1613     }
1614
1615   /* A != N is equivalent to A - (N + 1) <u -1.  */
1616   if (GET_CODE (a) == NE
1617       && CONST_INT_P (op1)
1618       && GET_CODE (b) == LTU
1619       && opb1 == constm1_rtx
1620       && GET_CODE (opb0) == PLUS
1621       && CONST_INT_P (XEXP (opb0, 1))
1622       /* Avoid overflows.  */
1623       && ((unsigned HOST_WIDE_INT) INTVAL (XEXP (opb0, 1))
1624           != ((unsigned HOST_WIDE_INT)1
1625               << (HOST_BITS_PER_WIDE_INT - 1)) - 1)
1626       && INTVAL (XEXP (opb0, 1)) + 1 == -INTVAL (op1))
1627     return rtx_equal_p (op0, XEXP (opb0, 0));
1628
1629   /* Likewise, A != N implies A - N > 0.  */
1630   if (GET_CODE (a) == NE
1631       && CONST_INT_P (op1))
1632     {
1633       if (GET_CODE (b) == GTU
1634           && GET_CODE (opb0) == PLUS
1635           && opb1 == const0_rtx
1636           && CONST_INT_P (XEXP (opb0, 1))
1637           /* Avoid overflows.  */
1638           && ((unsigned HOST_WIDE_INT) INTVAL (XEXP (opb0, 1))
1639               != ((unsigned HOST_WIDE_INT) 1 << (HOST_BITS_PER_WIDE_INT - 1)))
1640           && rtx_equal_p (XEXP (opb0, 0), op0))
1641         return INTVAL (op1) == -INTVAL (XEXP (opb0, 1));
1642       if (GET_CODE (b) == GEU
1643           && GET_CODE (opb0) == PLUS
1644           && opb1 == const1_rtx
1645           && CONST_INT_P (XEXP (opb0, 1))
1646           /* Avoid overflows.  */
1647           && ((unsigned HOST_WIDE_INT) INTVAL (XEXP (opb0, 1))
1648               != ((unsigned HOST_WIDE_INT) 1 << (HOST_BITS_PER_WIDE_INT - 1)))
1649           && rtx_equal_p (XEXP (opb0, 0), op0))
1650         return INTVAL (op1) == -INTVAL (XEXP (opb0, 1));
1651     }
1652
1653   /* A >s X, where X is positive, implies A <u Y, if Y is negative.  */
1654   if ((GET_CODE (a) == GT || GET_CODE (a) == GE)
1655       && CONST_INT_P (op1)
1656       && ((GET_CODE (a) == GT && op1 == constm1_rtx)
1657           || INTVAL (op1) >= 0)
1658       && GET_CODE (b) == LTU
1659       && CONST_INT_P (opb1)
1660       && rtx_equal_p (op0, opb0))
1661     return INTVAL (opb1) < 0;
1662
1663   return false;
1664 }
1665
1666 /* Canonicalizes COND so that
1667
1668    (1) Ensure that operands are ordered according to
1669        swap_commutative_operands_p.
1670    (2) (LE x const) will be replaced with (LT x <const+1>) and similarly
1671        for GE, GEU, and LEU.  */
1672
1673 rtx
1674 canon_condition (rtx cond)
1675 {
1676   rtx op0, op1;
1677   enum rtx_code code;
1678   machine_mode mode;
1679
1680   code = GET_CODE (cond);
1681   op0 = XEXP (cond, 0);
1682   op1 = XEXP (cond, 1);
1683
1684   if (swap_commutative_operands_p (op0, op1))
1685     {
1686       code = swap_condition (code);
1687       std::swap (op0, op1);
1688     }
1689
1690   mode = GET_MODE (op0);
1691   if (mode == VOIDmode)
1692     mode = GET_MODE (op1);
1693   gcc_assert (mode != VOIDmode);
1694
1695   if (CONST_SCALAR_INT_P (op1) && GET_MODE_CLASS (mode) != MODE_CC)
1696     {
1697       rtx_mode_t const_val (op1, mode);
1698
1699       switch (code)
1700         {
1701         case LE:
1702           if (wi::ne_p (const_val, wi::max_value (mode, SIGNED)))
1703             {
1704               code = LT;
1705               op1 = immed_wide_int_const (wi::add (const_val, 1),  mode);
1706             }
1707           break;
1708
1709         case GE:
1710           if (wi::ne_p (const_val, wi::min_value (mode, SIGNED)))
1711             {
1712               code = GT;
1713               op1 = immed_wide_int_const (wi::sub (const_val, 1), mode);
1714             }
1715           break;
1716
1717         case LEU:
1718           if (wi::ne_p (const_val, -1))
1719             {
1720               code = LTU;
1721               op1 = immed_wide_int_const (wi::add (const_val, 1), mode);
1722             }
1723           break;
1724
1725         case GEU:
1726           if (wi::ne_p (const_val, 0))
1727             {
1728               code = GTU;
1729               op1 = immed_wide_int_const (wi::sub (const_val, 1), mode);
1730             }
1731           break;
1732
1733         default:
1734           break;
1735         }
1736     }
1737
1738   if (op0 != XEXP (cond, 0)
1739       || op1 != XEXP (cond, 1)
1740       || code != GET_CODE (cond)
1741       || GET_MODE (cond) != SImode)
1742     cond = gen_rtx_fmt_ee (code, SImode, op0, op1);
1743
1744   return cond;
1745 }
1746
1747 /* Reverses CONDition; returns NULL if we cannot.  */
1748
1749 static rtx
1750 reversed_condition (rtx cond)
1751 {
1752   enum rtx_code reversed;
1753   reversed = reversed_comparison_code (cond, NULL);
1754   if (reversed == UNKNOWN)
1755     return NULL_RTX;
1756   else
1757     return gen_rtx_fmt_ee (reversed,
1758                            GET_MODE (cond), XEXP (cond, 0),
1759                            XEXP (cond, 1));
1760 }
1761
1762 /* Tries to use the fact that COND holds to simplify EXPR.  ALTERED is the
1763    set of altered regs.  */
1764
1765 void
1766 simplify_using_condition (rtx cond, rtx *expr, regset altered)
1767 {
1768   rtx rev, reve, exp = *expr;
1769
1770   /* If some register gets altered later, we do not really speak about its
1771      value at the time of comparison.  */
1772   if (altered && altered_reg_used (cond, altered))
1773     return;
1774
1775   if (GET_CODE (cond) == EQ
1776       && REG_P (XEXP (cond, 0)) && CONSTANT_P (XEXP (cond, 1)))
1777     {
1778       *expr = simplify_replace_rtx (*expr, XEXP (cond, 0), XEXP (cond, 1));
1779       return;
1780     }
1781
1782   if (!COMPARISON_P (exp))
1783     return;
1784
1785   rev = reversed_condition (cond);
1786   reve = reversed_condition (exp);
1787
1788   cond = canon_condition (cond);
1789   exp = canon_condition (exp);
1790   if (rev)
1791     rev = canon_condition (rev);
1792   if (reve)
1793     reve = canon_condition (reve);
1794
1795   if (rtx_equal_p (exp, cond))
1796     {
1797       *expr = const_true_rtx;
1798       return;
1799     }
1800
1801   if (rev && rtx_equal_p (exp, rev))
1802     {
1803       *expr = const0_rtx;
1804       return;
1805     }
1806
1807   if (implies_p (cond, exp))
1808     {
1809       *expr = const_true_rtx;
1810       return;
1811     }
1812
1813   if (reve && implies_p (cond, reve))
1814     {
1815       *expr = const0_rtx;
1816       return;
1817     }
1818
1819   /* A proof by contradiction.  If *EXPR implies (not cond), *EXPR must
1820      be false.  */
1821   if (rev && implies_p (exp, rev))
1822     {
1823       *expr = const0_rtx;
1824       return;
1825     }
1826
1827   /* Similarly, If (not *EXPR) implies (not cond), *EXPR must be true.  */
1828   if (rev && reve && implies_p (reve, rev))
1829     {
1830       *expr = const_true_rtx;
1831       return;
1832     }
1833
1834   /* We would like to have some other tests here.  TODO.  */
1835
1836   return;
1837 }
1838
1839 /* Use relationship between A and *B to eventually eliminate *B.
1840    OP is the operation we consider.  */
1841
1842 static void
1843 eliminate_implied_condition (enum rtx_code op, rtx a, rtx *b)
1844 {
1845   switch (op)
1846     {
1847     case AND:
1848       /* If A implies *B, we may replace *B by true.  */
1849       if (implies_p (a, *b))
1850         *b = const_true_rtx;
1851       break;
1852
1853     case IOR:
1854       /* If *B implies A, we may replace *B by false.  */
1855       if (implies_p (*b, a))
1856         *b = const0_rtx;
1857       break;
1858
1859     default:
1860       gcc_unreachable ();
1861     }
1862 }
1863
1864 /* Eliminates the conditions in TAIL that are implied by HEAD.  OP is the
1865    operation we consider.  */
1866
1867 static void
1868 eliminate_implied_conditions (enum rtx_code op, rtx *head, rtx tail)
1869 {
1870   rtx elt;
1871
1872   for (elt = tail; elt; elt = XEXP (elt, 1))
1873     eliminate_implied_condition (op, *head, &XEXP (elt, 0));
1874   for (elt = tail; elt; elt = XEXP (elt, 1))
1875     eliminate_implied_condition (op, XEXP (elt, 0), head);
1876 }
1877
1878 /* Simplifies *EXPR using initial values at the start of the LOOP.  If *EXPR
1879    is a list, its elements are assumed to be combined using OP.  */
1880
1881 static void
1882 simplify_using_initial_values (struct loop *loop, enum rtx_code op, rtx *expr)
1883 {
1884   bool expression_valid;
1885   rtx head, tail, last_valid_expr;
1886   rtx_expr_list *cond_list;
1887   rtx_insn *insn;
1888   rtx neutral, aggr;
1889   regset altered, this_altered;
1890   edge e;
1891
1892   if (!*expr)
1893     return;
1894
1895   if (CONSTANT_P (*expr))
1896     return;
1897
1898   if (GET_CODE (*expr) == EXPR_LIST)
1899     {
1900       head = XEXP (*expr, 0);
1901       tail = XEXP (*expr, 1);
1902
1903       eliminate_implied_conditions (op, &head, tail);
1904
1905       switch (op)
1906         {
1907         case AND:
1908           neutral = const_true_rtx;
1909           aggr = const0_rtx;
1910           break;
1911
1912         case IOR:
1913           neutral = const0_rtx;
1914           aggr = const_true_rtx;
1915           break;
1916
1917         default:
1918           gcc_unreachable ();
1919         }
1920
1921       simplify_using_initial_values (loop, UNKNOWN, &head);
1922       if (head == aggr)
1923         {
1924           XEXP (*expr, 0) = aggr;
1925           XEXP (*expr, 1) = NULL_RTX;
1926           return;
1927         }
1928       else if (head == neutral)
1929         {
1930           *expr = tail;
1931           simplify_using_initial_values (loop, op, expr);
1932           return;
1933         }
1934       simplify_using_initial_values (loop, op, &tail);
1935
1936       if (tail && XEXP (tail, 0) == aggr)
1937         {
1938           *expr = tail;
1939           return;
1940         }
1941
1942       XEXP (*expr, 0) = head;
1943       XEXP (*expr, 1) = tail;
1944       return;
1945     }
1946
1947   gcc_assert (op == UNKNOWN);
1948
1949   replace_single_def_regs (expr);
1950   if (CONSTANT_P (*expr))
1951     return;
1952
1953   e = loop_preheader_edge (loop);
1954   if (e->src == ENTRY_BLOCK_PTR_FOR_FN (cfun))
1955     return;
1956
1957   altered = ALLOC_REG_SET (&reg_obstack);
1958   this_altered = ALLOC_REG_SET (&reg_obstack);
1959
1960   expression_valid = true;
1961   last_valid_expr = *expr;
1962   cond_list = NULL;
1963   while (1)
1964     {
1965       insn = BB_END (e->src);
1966       if (any_condjump_p (insn))
1967         {
1968           rtx cond = get_condition (BB_END (e->src), NULL, false, true);
1969
1970           if (cond && (e->flags & EDGE_FALLTHRU))
1971             cond = reversed_condition (cond);
1972           if (cond)
1973             {
1974               rtx old = *expr;
1975               simplify_using_condition (cond, expr, altered);
1976               if (old != *expr)
1977                 {
1978                   rtx note;
1979                   if (CONSTANT_P (*expr))
1980                     goto out;
1981                   for (note = cond_list; note; note = XEXP (note, 1))
1982                     {
1983                       simplify_using_condition (XEXP (note, 0), expr, altered);
1984                       if (CONSTANT_P (*expr))
1985                         goto out;
1986                     }
1987                 }
1988               cond_list = alloc_EXPR_LIST (0, cond, cond_list);
1989             }
1990         }
1991
1992       FOR_BB_INSNS_REVERSE (e->src, insn)
1993         {
1994           rtx src, dest;
1995           rtx old = *expr;
1996
1997           if (!INSN_P (insn))
1998             continue;
1999
2000           CLEAR_REG_SET (this_altered);
2001           note_stores (PATTERN (insn), mark_altered, this_altered);
2002           if (CALL_P (insn))
2003             {
2004               /* Kill all call clobbered registers.  */
2005               unsigned int i;
2006               hard_reg_set_iterator hrsi;
2007               EXECUTE_IF_SET_IN_HARD_REG_SET (regs_invalidated_by_call,
2008                                               0, i, hrsi)
2009                 SET_REGNO_REG_SET (this_altered, i);
2010             }
2011
2012           if (suitable_set_for_replacement (insn, &dest, &src))
2013             {
2014               rtx_expr_list **pnote, **pnote_next;
2015
2016               replace_in_expr (expr, dest, src);
2017               if (CONSTANT_P (*expr))
2018                 goto out;
2019
2020               for (pnote = &cond_list; *pnote; pnote = pnote_next)
2021                 {
2022                   rtx_expr_list *note = *pnote;
2023                   rtx old_cond = XEXP (note, 0);
2024
2025                   pnote_next = (rtx_expr_list **)&XEXP (note, 1);
2026                   replace_in_expr (&XEXP (note, 0), dest, src);
2027
2028                   /* We can no longer use a condition that has been simplified
2029                      to a constant, and simplify_using_condition will abort if
2030                      we try.  */
2031                   if (CONSTANT_P (XEXP (note, 0)))
2032                     {
2033                       *pnote = *pnote_next;
2034                       pnote_next = pnote;
2035                       free_EXPR_LIST_node (note);
2036                     }
2037                   /* Retry simplifications with this condition if either the
2038                      expression or the condition changed.  */
2039                   else if (old_cond != XEXP (note, 0) || old != *expr)
2040                     simplify_using_condition (XEXP (note, 0), expr, altered);
2041                 }
2042             }
2043           else
2044             {
2045               rtx_expr_list **pnote, **pnote_next;
2046
2047               /* If we did not use this insn to make a replacement, any overlap
2048                  between stores in this insn and our expression will cause the
2049                  expression to become invalid.  */
2050               if (altered_reg_used (*expr, this_altered))
2051                 goto out;
2052
2053               /* Likewise for the conditions.  */
2054               for (pnote = &cond_list; *pnote; pnote = pnote_next)
2055                 {
2056                   rtx_expr_list *note = *pnote;
2057                   rtx old_cond = XEXP (note, 0);
2058
2059                   pnote_next = (rtx_expr_list **)&XEXP (note, 1);
2060                   if (altered_reg_used (old_cond, this_altered))
2061                     {
2062                       *pnote = *pnote_next;
2063                       pnote_next = pnote;
2064                       free_EXPR_LIST_node (note);
2065                     }
2066                 }
2067             }
2068
2069           if (CONSTANT_P (*expr))
2070             goto out;
2071
2072           IOR_REG_SET (altered, this_altered);
2073
2074           /* If the expression now contains regs that have been altered, we
2075              can't return it to the caller.  However, it is still valid for
2076              further simplification, so keep searching to see if we can
2077              eventually turn it into a constant.  */
2078           if (altered_reg_used (*expr, altered))
2079             expression_valid = false;
2080           if (expression_valid)
2081             last_valid_expr = *expr;
2082         }
2083
2084       if (!single_pred_p (e->src)
2085           || single_pred (e->src) == ENTRY_BLOCK_PTR_FOR_FN (cfun))
2086         break;
2087       e = single_pred_edge (e->src);
2088     }
2089
2090  out:
2091   free_EXPR_LIST_list (&cond_list);
2092   if (!CONSTANT_P (*expr))
2093     *expr = last_valid_expr;
2094   FREE_REG_SET (altered);
2095   FREE_REG_SET (this_altered);
2096 }
2097
2098 /* Transforms invariant IV into MODE.  Adds assumptions based on the fact
2099    that IV occurs as left operands of comparison COND and its signedness
2100    is SIGNED_P to DESC.  */
2101
2102 static void
2103 shorten_into_mode (struct rtx_iv *iv, machine_mode mode,
2104                    enum rtx_code cond, bool signed_p, struct niter_desc *desc)
2105 {
2106   rtx mmin, mmax, cond_over, cond_under;
2107
2108   get_mode_bounds (mode, signed_p, iv->extend_mode, &mmin, &mmax);
2109   cond_under = simplify_gen_relational (LT, SImode, iv->extend_mode,
2110                                         iv->base, mmin);
2111   cond_over = simplify_gen_relational (GT, SImode, iv->extend_mode,
2112                                        iv->base, mmax);
2113
2114   switch (cond)
2115     {
2116       case LE:
2117       case LT:
2118       case LEU:
2119       case LTU:
2120         if (cond_under != const0_rtx)
2121           desc->infinite =
2122                   alloc_EXPR_LIST (0, cond_under, desc->infinite);
2123         if (cond_over != const0_rtx)
2124           desc->noloop_assumptions =
2125                   alloc_EXPR_LIST (0, cond_over, desc->noloop_assumptions);
2126         break;
2127
2128       case GE:
2129       case GT:
2130       case GEU:
2131       case GTU:
2132         if (cond_over != const0_rtx)
2133           desc->infinite =
2134                   alloc_EXPR_LIST (0, cond_over, desc->infinite);
2135         if (cond_under != const0_rtx)
2136           desc->noloop_assumptions =
2137                   alloc_EXPR_LIST (0, cond_under, desc->noloop_assumptions);
2138         break;
2139
2140       case NE:
2141         if (cond_over != const0_rtx)
2142           desc->infinite =
2143                   alloc_EXPR_LIST (0, cond_over, desc->infinite);
2144         if (cond_under != const0_rtx)
2145           desc->infinite =
2146                   alloc_EXPR_LIST (0, cond_under, desc->infinite);
2147         break;
2148
2149       default:
2150         gcc_unreachable ();
2151     }
2152
2153   iv->mode = mode;
2154   iv->extend = signed_p ? IV_SIGN_EXTEND : IV_ZERO_EXTEND;
2155 }
2156
2157 /* Transforms IV0 and IV1 compared by COND so that they are both compared as
2158    subregs of the same mode if possible (sometimes it is necessary to add
2159    some assumptions to DESC).  */
2160
2161 static bool
2162 canonicalize_iv_subregs (struct rtx_iv *iv0, struct rtx_iv *iv1,
2163                          enum rtx_code cond, struct niter_desc *desc)
2164 {
2165   machine_mode comp_mode;
2166   bool signed_p;
2167
2168   /* If the ivs behave specially in the first iteration, or are
2169      added/multiplied after extending, we ignore them.  */
2170   if (iv0->first_special || iv0->mult != const1_rtx || iv0->delta != const0_rtx)
2171     return false;
2172   if (iv1->first_special || iv1->mult != const1_rtx || iv1->delta != const0_rtx)
2173     return false;
2174
2175   /* If there is some extend, it must match signedness of the comparison.  */
2176   switch (cond)
2177     {
2178       case LE:
2179       case LT:
2180         if (iv0->extend == IV_ZERO_EXTEND
2181             || iv1->extend == IV_ZERO_EXTEND)
2182           return false;
2183         signed_p = true;
2184         break;
2185
2186       case LEU:
2187       case LTU:
2188         if (iv0->extend == IV_SIGN_EXTEND
2189             || iv1->extend == IV_SIGN_EXTEND)
2190           return false;
2191         signed_p = false;
2192         break;
2193
2194       case NE:
2195         if (iv0->extend != IV_UNKNOWN_EXTEND
2196             && iv1->extend != IV_UNKNOWN_EXTEND
2197             && iv0->extend != iv1->extend)
2198           return false;
2199
2200         signed_p = false;
2201         if (iv0->extend != IV_UNKNOWN_EXTEND)
2202           signed_p = iv0->extend == IV_SIGN_EXTEND;
2203         if (iv1->extend != IV_UNKNOWN_EXTEND)
2204           signed_p = iv1->extend == IV_SIGN_EXTEND;
2205         break;
2206
2207       default:
2208         gcc_unreachable ();
2209     }
2210
2211   /* Values of both variables should be computed in the same mode.  These
2212      might indeed be different, if we have comparison like
2213
2214      (compare (subreg:SI (iv0)) (subreg:SI (iv1)))
2215
2216      and iv0 and iv1 are both ivs iterating in SI mode, but calculated
2217      in different modes.  This does not seem impossible to handle, but
2218      it hardly ever occurs in practice.
2219
2220      The only exception is the case when one of operands is invariant.
2221      For example pentium 3 generates comparisons like
2222      (lt (subreg:HI (reg:SI)) 100).  Here we assign HImode to 100, but we
2223      definitely do not want this prevent the optimization.  */
2224   comp_mode = iv0->extend_mode;
2225   if (GET_MODE_BITSIZE (comp_mode) < GET_MODE_BITSIZE (iv1->extend_mode))
2226     comp_mode = iv1->extend_mode;
2227
2228   if (iv0->extend_mode != comp_mode)
2229     {
2230       if (iv0->mode != iv0->extend_mode
2231           || iv0->step != const0_rtx)
2232         return false;
2233
2234       iv0->base = simplify_gen_unary (signed_p ? SIGN_EXTEND : ZERO_EXTEND,
2235                                       comp_mode, iv0->base, iv0->mode);
2236       iv0->extend_mode = comp_mode;
2237     }
2238
2239   if (iv1->extend_mode != comp_mode)
2240     {
2241       if (iv1->mode != iv1->extend_mode
2242           || iv1->step != const0_rtx)
2243         return false;
2244
2245       iv1->base = simplify_gen_unary (signed_p ? SIGN_EXTEND : ZERO_EXTEND,
2246                                       comp_mode, iv1->base, iv1->mode);
2247       iv1->extend_mode = comp_mode;
2248     }
2249
2250   /* Check that both ivs belong to a range of a single mode.  If one of the
2251      operands is an invariant, we may need to shorten it into the common
2252      mode.  */
2253   if (iv0->mode == iv0->extend_mode
2254       && iv0->step == const0_rtx
2255       && iv0->mode != iv1->mode)
2256     shorten_into_mode (iv0, iv1->mode, cond, signed_p, desc);
2257
2258   if (iv1->mode == iv1->extend_mode
2259       && iv1->step == const0_rtx
2260       && iv0->mode != iv1->mode)
2261     shorten_into_mode (iv1, iv0->mode, swap_condition (cond), signed_p, desc);
2262
2263   if (iv0->mode != iv1->mode)
2264     return false;
2265
2266   desc->mode = iv0->mode;
2267   desc->signed_p = signed_p;
2268
2269   return true;
2270 }
2271
2272 /* Tries to estimate the maximum number of iterations in LOOP, and return the
2273    result.  This function is called from iv_number_of_iterations with
2274    a number of fields in DESC already filled in.  OLD_NITER is the original
2275    expression for the number of iterations, before we tried to simplify it.  */
2276
2277 static uint64_t
2278 determine_max_iter (struct loop *loop, struct niter_desc *desc, rtx old_niter)
2279 {
2280   rtx niter = desc->niter_expr;
2281   rtx mmin, mmax, cmp;
2282   uint64_t nmax, inc;
2283   uint64_t andmax = 0;
2284
2285   /* We used to look for constant operand 0 of AND,
2286      but canonicalization should always make this impossible.  */
2287   gcc_checking_assert (GET_CODE (niter) != AND
2288                        || !CONST_INT_P (XEXP (niter, 0)));
2289
2290   if (GET_CODE (niter) == AND
2291       && CONST_INT_P (XEXP (niter, 1)))
2292     {
2293       andmax = UINTVAL (XEXP (niter, 1));
2294       niter = XEXP (niter, 0);
2295     }
2296
2297   get_mode_bounds (desc->mode, desc->signed_p, desc->mode, &mmin, &mmax);
2298   nmax = UINTVAL (mmax) - UINTVAL (mmin);
2299
2300   if (GET_CODE (niter) == UDIV)
2301     {
2302       if (!CONST_INT_P (XEXP (niter, 1)))
2303         return nmax;
2304       inc = INTVAL (XEXP (niter, 1));
2305       niter = XEXP (niter, 0);
2306     }
2307   else
2308     inc = 1;
2309
2310   /* We could use a binary search here, but for now improving the upper
2311      bound by just one eliminates one important corner case.  */
2312   cmp = simplify_gen_relational (desc->signed_p ? LT : LTU, VOIDmode,
2313                                  desc->mode, old_niter, mmax);
2314   simplify_using_initial_values (loop, UNKNOWN, &cmp);
2315   if (cmp == const_true_rtx)
2316     {
2317       nmax--;
2318
2319       if (dump_file)
2320         fprintf (dump_file, ";; improved upper bound by one.\n");
2321     }
2322   nmax /= inc;
2323   if (andmax)
2324     nmax = MIN (nmax, andmax);
2325   if (dump_file)
2326     fprintf (dump_file, ";; Determined upper bound %" PRId64".\n",
2327              nmax);
2328   return nmax;
2329 }
2330
2331 /* Computes number of iterations of the CONDITION in INSN in LOOP and stores
2332    the result into DESC.  Very similar to determine_number_of_iterations
2333    (basically its rtl version), complicated by things like subregs.  */
2334
2335 static void
2336 iv_number_of_iterations (struct loop *loop, rtx_insn *insn, rtx condition,
2337                          struct niter_desc *desc)
2338 {
2339   rtx op0, op1, delta, step, bound, may_xform, tmp, tmp0, tmp1;
2340   struct rtx_iv iv0, iv1;
2341   rtx assumption, may_not_xform;
2342   enum rtx_code cond;
2343   machine_mode mode, comp_mode;
2344   rtx mmin, mmax, mode_mmin, mode_mmax;
2345   uint64_t s, size, d, inv, max;
2346   int64_t up, down, inc, step_val;
2347   int was_sharp = false;
2348   rtx old_niter;
2349   bool step_is_pow2;
2350
2351   /* The meaning of these assumptions is this:
2352      if !assumptions
2353        then the rest of information does not have to be valid
2354      if noloop_assumptions then the loop does not roll
2355      if infinite then this exit is never used */
2356
2357   desc->assumptions = NULL_RTX;
2358   desc->noloop_assumptions = NULL_RTX;
2359   desc->infinite = NULL_RTX;
2360   desc->simple_p = true;
2361
2362   desc->const_iter = false;
2363   desc->niter_expr = NULL_RTX;
2364
2365   cond = GET_CODE (condition);
2366   gcc_assert (COMPARISON_P (condition));
2367
2368   mode = GET_MODE (XEXP (condition, 0));
2369   if (mode == VOIDmode)
2370     mode = GET_MODE (XEXP (condition, 1));
2371   /* The constant comparisons should be folded.  */
2372   gcc_assert (mode != VOIDmode);
2373
2374   /* We only handle integers or pointers.  */
2375   if (GET_MODE_CLASS (mode) != MODE_INT
2376       && GET_MODE_CLASS (mode) != MODE_PARTIAL_INT)
2377     goto fail;
2378
2379   op0 = XEXP (condition, 0);
2380   if (!iv_analyze (insn, op0, &iv0))
2381     goto fail;
2382   if (iv0.extend_mode == VOIDmode)
2383     iv0.mode = iv0.extend_mode = mode;
2384
2385   op1 = XEXP (condition, 1);
2386   if (!iv_analyze (insn, op1, &iv1))
2387     goto fail;
2388   if (iv1.extend_mode == VOIDmode)
2389     iv1.mode = iv1.extend_mode = mode;
2390
2391   if (GET_MODE_BITSIZE (iv0.extend_mode) > HOST_BITS_PER_WIDE_INT
2392       || GET_MODE_BITSIZE (iv1.extend_mode) > HOST_BITS_PER_WIDE_INT)
2393     goto fail;
2394
2395   /* Check condition and normalize it.  */
2396
2397   switch (cond)
2398     {
2399       case GE:
2400       case GT:
2401       case GEU:
2402       case GTU:
2403         std::swap (iv0, iv1);
2404         cond = swap_condition (cond);
2405         break;
2406       case NE:
2407       case LE:
2408       case LEU:
2409       case LT:
2410       case LTU:
2411         break;
2412       default:
2413         goto fail;
2414     }
2415
2416   /* Handle extends.  This is relatively nontrivial, so we only try in some
2417      easy cases, when we can canonicalize the ivs (possibly by adding some
2418      assumptions) to shape subreg (base + i * step).  This function also fills
2419      in desc->mode and desc->signed_p.  */
2420
2421   if (!canonicalize_iv_subregs (&iv0, &iv1, cond, desc))
2422     goto fail;
2423
2424   comp_mode = iv0.extend_mode;
2425   mode = iv0.mode;
2426   size = GET_MODE_PRECISION (mode);
2427   get_mode_bounds (mode, (cond == LE || cond == LT), comp_mode, &mmin, &mmax);
2428   mode_mmin = lowpart_subreg (mode, mmin, comp_mode);
2429   mode_mmax = lowpart_subreg (mode, mmax, comp_mode);
2430
2431   if (!CONST_INT_P (iv0.step) || !CONST_INT_P (iv1.step))
2432     goto fail;
2433
2434   /* We can take care of the case of two induction variables chasing each other
2435      if the test is NE. I have never seen a loop using it, but still it is
2436      cool.  */
2437   if (iv0.step != const0_rtx && iv1.step != const0_rtx)
2438     {
2439       if (cond != NE)
2440         goto fail;
2441
2442       iv0.step = simplify_gen_binary (MINUS, comp_mode, iv0.step, iv1.step);
2443       iv1.step = const0_rtx;
2444     }
2445
2446   iv0.step = lowpart_subreg (mode, iv0.step, comp_mode);
2447   iv1.step = lowpart_subreg (mode, iv1.step, comp_mode);
2448
2449   /* This is either infinite loop or the one that ends immediately, depending
2450      on initial values.  Unswitching should remove this kind of conditions.  */
2451   if (iv0.step == const0_rtx && iv1.step == const0_rtx)
2452     goto fail;
2453
2454   if (cond != NE)
2455     {
2456       if (iv0.step == const0_rtx)
2457         step_val = -INTVAL (iv1.step);
2458       else
2459         step_val = INTVAL (iv0.step);
2460
2461       /* Ignore loops of while (i-- < 10) type.  */
2462       if (step_val < 0)
2463         goto fail;
2464
2465       step_is_pow2 = !(step_val & (step_val - 1));
2466     }
2467   else
2468     {
2469       /* We do not care about whether the step is power of two in this
2470          case.  */
2471       step_is_pow2 = false;
2472       step_val = 0;
2473     }
2474
2475   /* Some more condition normalization.  We must record some assumptions
2476      due to overflows.  */
2477   switch (cond)
2478     {
2479       case LT:
2480       case LTU:
2481         /* We want to take care only of non-sharp relationals; this is easy,
2482            as in cases the overflow would make the transformation unsafe
2483            the loop does not roll.  Seemingly it would make more sense to want
2484            to take care of sharp relationals instead, as NE is more similar to
2485            them, but the problem is that here the transformation would be more
2486            difficult due to possibly infinite loops.  */
2487         if (iv0.step == const0_rtx)
2488           {
2489             tmp = lowpart_subreg (mode, iv0.base, comp_mode);
2490             assumption = simplify_gen_relational (EQ, SImode, mode, tmp,
2491                                                   mode_mmax);
2492             if (assumption == const_true_rtx)
2493               goto zero_iter_simplify;
2494             iv0.base = simplify_gen_binary (PLUS, comp_mode,
2495                                             iv0.base, const1_rtx);
2496           }
2497         else
2498           {
2499             tmp = lowpart_subreg (mode, iv1.base, comp_mode);
2500             assumption = simplify_gen_relational (EQ, SImode, mode, tmp,
2501                                                   mode_mmin);
2502             if (assumption == const_true_rtx)
2503               goto zero_iter_simplify;
2504             iv1.base = simplify_gen_binary (PLUS, comp_mode,
2505                                             iv1.base, constm1_rtx);
2506           }
2507
2508         if (assumption != const0_rtx)
2509           desc->noloop_assumptions =
2510                   alloc_EXPR_LIST (0, assumption, desc->noloop_assumptions);
2511         cond = (cond == LT) ? LE : LEU;
2512
2513         /* It will be useful to be able to tell the difference once more in
2514            LE -> NE reduction.  */
2515         was_sharp = true;
2516         break;
2517       default: ;
2518     }
2519
2520   /* Take care of trivially infinite loops.  */
2521   if (cond != NE)
2522     {
2523       if (iv0.step == const0_rtx)
2524         {
2525           tmp = lowpart_subreg (mode, iv0.base, comp_mode);
2526           if (rtx_equal_p (tmp, mode_mmin))
2527             {
2528               desc->infinite =
2529                       alloc_EXPR_LIST (0, const_true_rtx, NULL_RTX);
2530               /* Fill in the remaining fields somehow.  */
2531               goto zero_iter_simplify;
2532             }
2533         }
2534       else
2535         {
2536           tmp = lowpart_subreg (mode, iv1.base, comp_mode);
2537           if (rtx_equal_p (tmp, mode_mmax))
2538             {
2539               desc->infinite =
2540                       alloc_EXPR_LIST (0, const_true_rtx, NULL_RTX);
2541               /* Fill in the remaining fields somehow.  */
2542               goto zero_iter_simplify;
2543             }
2544         }
2545     }
2546
2547   /* If we can we want to take care of NE conditions instead of size
2548      comparisons, as they are much more friendly (most importantly
2549      this takes care of special handling of loops with step 1).  We can
2550      do it if we first check that upper bound is greater or equal to
2551      lower bound, their difference is constant c modulo step and that
2552      there is not an overflow.  */
2553   if (cond != NE)
2554     {
2555       if (iv0.step == const0_rtx)
2556         step = simplify_gen_unary (NEG, comp_mode, iv1.step, comp_mode);
2557       else
2558         step = iv0.step;
2559       step = lowpart_subreg (mode, step, comp_mode);
2560       delta = simplify_gen_binary (MINUS, comp_mode, iv1.base, iv0.base);
2561       delta = lowpart_subreg (mode, delta, comp_mode);
2562       delta = simplify_gen_binary (UMOD, mode, delta, step);
2563       may_xform = const0_rtx;
2564       may_not_xform = const_true_rtx;
2565
2566       if (CONST_INT_P (delta))
2567         {
2568           if (was_sharp && INTVAL (delta) == INTVAL (step) - 1)
2569             {
2570               /* A special case.  We have transformed condition of type
2571                  for (i = 0; i < 4; i += 4)
2572                  into
2573                  for (i = 0; i <= 3; i += 4)
2574                  obviously if the test for overflow during that transformation
2575                  passed, we cannot overflow here.  Most importantly any
2576                  loop with sharp end condition and step 1 falls into this
2577                  category, so handling this case specially is definitely
2578                  worth the troubles.  */
2579               may_xform = const_true_rtx;
2580             }
2581           else if (iv0.step == const0_rtx)
2582             {
2583               bound = simplify_gen_binary (PLUS, comp_mode, mmin, step);
2584               bound = simplify_gen_binary (MINUS, comp_mode, bound, delta);
2585               bound = lowpart_subreg (mode, bound, comp_mode);
2586               tmp = lowpart_subreg (mode, iv0.base, comp_mode);
2587               may_xform = simplify_gen_relational (cond, SImode, mode,
2588                                                    bound, tmp);
2589               may_not_xform = simplify_gen_relational (reverse_condition (cond),
2590                                                        SImode, mode,
2591                                                        bound, tmp);
2592             }
2593           else
2594             {
2595               bound = simplify_gen_binary (MINUS, comp_mode, mmax, step);
2596               bound = simplify_gen_binary (PLUS, comp_mode, bound, delta);
2597               bound = lowpart_subreg (mode, bound, comp_mode);
2598               tmp = lowpart_subreg (mode, iv1.base, comp_mode);
2599               may_xform = simplify_gen_relational (cond, SImode, mode,
2600                                                    tmp, bound);
2601               may_not_xform = simplify_gen_relational (reverse_condition (cond),
2602                                                        SImode, mode,
2603                                                        tmp, bound);
2604             }
2605         }
2606
2607       if (may_xform != const0_rtx)
2608         {
2609           /* We perform the transformation always provided that it is not
2610              completely senseless.  This is OK, as we would need this assumption
2611              to determine the number of iterations anyway.  */
2612           if (may_xform != const_true_rtx)
2613             {
2614               /* If the step is a power of two and the final value we have
2615                  computed overflows, the cycle is infinite.  Otherwise it
2616                  is nontrivial to compute the number of iterations.  */
2617               if (step_is_pow2)
2618                 desc->infinite = alloc_EXPR_LIST (0, may_not_xform,
2619                                                   desc->infinite);
2620               else
2621                 desc->assumptions = alloc_EXPR_LIST (0, may_xform,
2622                                                      desc->assumptions);
2623             }
2624
2625           /* We are going to lose some information about upper bound on
2626              number of iterations in this step, so record the information
2627              here.  */
2628           inc = INTVAL (iv0.step) - INTVAL (iv1.step);
2629           if (CONST_INT_P (iv1.base))
2630             up = INTVAL (iv1.base);
2631           else
2632             up = INTVAL (mode_mmax) - inc;
2633           down = INTVAL (CONST_INT_P (iv0.base)
2634                          ? iv0.base
2635                          : mode_mmin);
2636           max = (uint64_t) (up - down) / inc + 1;
2637           if (!desc->infinite
2638               && !desc->assumptions)
2639             record_niter_bound (loop, max, false, true);
2640
2641           if (iv0.step == const0_rtx)
2642             {
2643               iv0.base = simplify_gen_binary (PLUS, comp_mode, iv0.base, delta);
2644               iv0.base = simplify_gen_binary (MINUS, comp_mode, iv0.base, step);
2645             }
2646           else
2647             {
2648               iv1.base = simplify_gen_binary (MINUS, comp_mode, iv1.base, delta);
2649               iv1.base = simplify_gen_binary (PLUS, comp_mode, iv1.base, step);
2650             }
2651
2652           tmp0 = lowpart_subreg (mode, iv0.base, comp_mode);
2653           tmp1 = lowpart_subreg (mode, iv1.base, comp_mode);
2654           assumption = simplify_gen_relational (reverse_condition (cond),
2655                                                 SImode, mode, tmp0, tmp1);
2656           if (assumption == const_true_rtx)
2657             goto zero_iter_simplify;
2658           else if (assumption != const0_rtx)
2659             desc->noloop_assumptions =
2660                     alloc_EXPR_LIST (0, assumption, desc->noloop_assumptions);
2661           cond = NE;
2662         }
2663     }
2664
2665   /* Count the number of iterations.  */
2666   if (cond == NE)
2667     {
2668       /* Everything we do here is just arithmetics modulo size of mode.  This
2669          makes us able to do more involved computations of number of iterations
2670          than in other cases.  First transform the condition into shape
2671          s * i <> c, with s positive.  */
2672       iv1.base = simplify_gen_binary (MINUS, comp_mode, iv1.base, iv0.base);
2673       iv0.base = const0_rtx;
2674       iv0.step = simplify_gen_binary (MINUS, comp_mode, iv0.step, iv1.step);
2675       iv1.step = const0_rtx;
2676       if (INTVAL (iv0.step) < 0)
2677         {
2678           iv0.step = simplify_gen_unary (NEG, comp_mode, iv0.step, comp_mode);
2679           iv1.base = simplify_gen_unary (NEG, comp_mode, iv1.base, comp_mode);
2680         }
2681       iv0.step = lowpart_subreg (mode, iv0.step, comp_mode);
2682
2683       /* Let nsd (s, size of mode) = d.  If d does not divide c, the loop
2684          is infinite.  Otherwise, the number of iterations is
2685          (inverse(s/d) * (c/d)) mod (size of mode/d).  */
2686       s = INTVAL (iv0.step); d = 1;
2687       while (s % 2 != 1)
2688         {
2689           s /= 2;
2690           d *= 2;
2691           size--;
2692         }
2693       bound = GEN_INT (((uint64_t) 1 << (size - 1 ) << 1) - 1);
2694
2695       tmp1 = lowpart_subreg (mode, iv1.base, comp_mode);
2696       tmp = simplify_gen_binary (UMOD, mode, tmp1, gen_int_mode (d, mode));
2697       assumption = simplify_gen_relational (NE, SImode, mode, tmp, const0_rtx);
2698       desc->infinite = alloc_EXPR_LIST (0, assumption, desc->infinite);
2699
2700       tmp = simplify_gen_binary (UDIV, mode, tmp1, gen_int_mode (d, mode));
2701       inv = inverse (s, size);
2702       tmp = simplify_gen_binary (MULT, mode, tmp, gen_int_mode (inv, mode));
2703       desc->niter_expr = simplify_gen_binary (AND, mode, tmp, bound);
2704     }
2705   else
2706     {
2707       if (iv1.step == const0_rtx)
2708         /* Condition in shape a + s * i <= b
2709            We must know that b + s does not overflow and a <= b + s and then we
2710            can compute number of iterations as (b + s - a) / s.  (It might
2711            seem that we in fact could be more clever about testing the b + s
2712            overflow condition using some information about b - a mod s,
2713            but it was already taken into account during LE -> NE transform).  */
2714         {
2715           step = iv0.step;
2716           tmp0 = lowpart_subreg (mode, iv0.base, comp_mode);
2717           tmp1 = lowpart_subreg (mode, iv1.base, comp_mode);
2718
2719           bound = simplify_gen_binary (MINUS, mode, mode_mmax,
2720                                        lowpart_subreg (mode, step,
2721                                                        comp_mode));
2722           if (step_is_pow2)
2723             {
2724               rtx t0, t1;
2725
2726               /* If s is power of 2, we know that the loop is infinite if
2727                  a % s <= b % s and b + s overflows.  */
2728               assumption = simplify_gen_relational (reverse_condition (cond),
2729                                                     SImode, mode,
2730                                                     tmp1, bound);
2731
2732               t0 = simplify_gen_binary (UMOD, mode, copy_rtx (tmp0), step);
2733               t1 = simplify_gen_binary (UMOD, mode, copy_rtx (tmp1), step);
2734               tmp = simplify_gen_relational (cond, SImode, mode, t0, t1);
2735               assumption = simplify_gen_binary (AND, SImode, assumption, tmp);
2736               desc->infinite =
2737                       alloc_EXPR_LIST (0, assumption, desc->infinite);
2738             }
2739           else
2740             {
2741               assumption = simplify_gen_relational (cond, SImode, mode,
2742                                                     tmp1, bound);
2743               desc->assumptions =
2744                       alloc_EXPR_LIST (0, assumption, desc->assumptions);
2745             }
2746
2747           tmp = simplify_gen_binary (PLUS, comp_mode, iv1.base, iv0.step);
2748           tmp = lowpart_subreg (mode, tmp, comp_mode);
2749           assumption = simplify_gen_relational (reverse_condition (cond),
2750                                                 SImode, mode, tmp0, tmp);
2751
2752           delta = simplify_gen_binary (PLUS, mode, tmp1, step);
2753           delta = simplify_gen_binary (MINUS, mode, delta, tmp0);
2754         }
2755       else
2756         {
2757           /* Condition in shape a <= b - s * i
2758              We must know that a - s does not overflow and a - s <= b and then
2759              we can again compute number of iterations as (b - (a - s)) / s.  */
2760           step = simplify_gen_unary (NEG, mode, iv1.step, mode);
2761           tmp0 = lowpart_subreg (mode, iv0.base, comp_mode);
2762           tmp1 = lowpart_subreg (mode, iv1.base, comp_mode);
2763
2764           bound = simplify_gen_binary (PLUS, mode, mode_mmin,
2765                                        lowpart_subreg (mode, step, comp_mode));
2766           if (step_is_pow2)
2767             {
2768               rtx t0, t1;
2769
2770               /* If s is power of 2, we know that the loop is infinite if
2771                  a % s <= b % s and a - s overflows.  */
2772               assumption = simplify_gen_relational (reverse_condition (cond),
2773                                                     SImode, mode,
2774                                                     bound, tmp0);
2775
2776               t0 = simplify_gen_binary (UMOD, mode, copy_rtx (tmp0), step);
2777               t1 = simplify_gen_binary (UMOD, mode, copy_rtx (tmp1), step);
2778               tmp = simplify_gen_relational (cond, SImode, mode, t0, t1);
2779               assumption = simplify_gen_binary (AND, SImode, assumption, tmp);
2780               desc->infinite =
2781                       alloc_EXPR_LIST (0, assumption, desc->infinite);
2782             }
2783           else
2784             {
2785               assumption = simplify_gen_relational (cond, SImode, mode,
2786                                                     bound, tmp0);
2787               desc->assumptions =
2788                       alloc_EXPR_LIST (0, assumption, desc->assumptions);
2789             }
2790
2791           tmp = simplify_gen_binary (PLUS, comp_mode, iv0.base, iv1.step);
2792           tmp = lowpart_subreg (mode, tmp, comp_mode);
2793           assumption = simplify_gen_relational (reverse_condition (cond),
2794                                                 SImode, mode,
2795                                                 tmp, tmp1);
2796           delta = simplify_gen_binary (MINUS, mode, tmp0, step);
2797           delta = simplify_gen_binary (MINUS, mode, tmp1, delta);
2798         }
2799       if (assumption == const_true_rtx)
2800         goto zero_iter_simplify;
2801       else if (assumption != const0_rtx)
2802         desc->noloop_assumptions =
2803                 alloc_EXPR_LIST (0, assumption, desc->noloop_assumptions);
2804       delta = simplify_gen_binary (UDIV, mode, delta, step);
2805       desc->niter_expr = delta;
2806     }
2807
2808   old_niter = desc->niter_expr;
2809
2810   simplify_using_initial_values (loop, AND, &desc->assumptions);
2811   if (desc->assumptions
2812       && XEXP (desc->assumptions, 0) == const0_rtx)
2813     goto fail;
2814   simplify_using_initial_values (loop, IOR, &desc->noloop_assumptions);
2815   simplify_using_initial_values (loop, IOR, &desc->infinite);
2816   simplify_using_initial_values (loop, UNKNOWN, &desc->niter_expr);
2817
2818   /* Rerun the simplification.  Consider code (created by copying loop headers)
2819
2820      i = 0;
2821
2822      if (0 < n)
2823        {
2824          do
2825            {
2826              i++;
2827            } while (i < n);
2828        }
2829
2830     The first pass determines that i = 0, the second pass uses it to eliminate
2831     noloop assumption.  */
2832
2833   simplify_using_initial_values (loop, AND, &desc->assumptions);
2834   if (desc->assumptions
2835       && XEXP (desc->assumptions, 0) == const0_rtx)
2836     goto fail;
2837   simplify_using_initial_values (loop, IOR, &desc->noloop_assumptions);
2838   simplify_using_initial_values (loop, IOR, &desc->infinite);
2839   simplify_using_initial_values (loop, UNKNOWN, &desc->niter_expr);
2840
2841   if (desc->noloop_assumptions
2842       && XEXP (desc->noloop_assumptions, 0) == const_true_rtx)
2843     goto zero_iter;
2844
2845   if (CONST_INT_P (desc->niter_expr))
2846     {
2847       uint64_t val = INTVAL (desc->niter_expr);
2848
2849       desc->const_iter = true;
2850       desc->niter = val & GET_MODE_MASK (desc->mode);
2851       if (!desc->infinite
2852           && !desc->assumptions)
2853         record_niter_bound (loop, desc->niter, false, true);
2854     }
2855   else
2856     {
2857       max = determine_max_iter (loop, desc, old_niter);
2858       if (!max)
2859         goto zero_iter_simplify;
2860       if (!desc->infinite
2861           && !desc->assumptions)
2862         record_niter_bound (loop, max, false, true);
2863
2864       /* simplify_using_initial_values does a copy propagation on the registers
2865          in the expression for the number of iterations.  This prolongs life
2866          ranges of registers and increases register pressure, and usually
2867          brings no gain (and if it happens to do, the cse pass will take care
2868          of it anyway).  So prevent this behavior, unless it enabled us to
2869          derive that the number of iterations is a constant.  */
2870       desc->niter_expr = old_niter;
2871     }
2872
2873   return;
2874
2875 zero_iter_simplify:
2876   /* Simplify the assumptions.  */
2877   simplify_using_initial_values (loop, AND, &desc->assumptions);
2878   if (desc->assumptions
2879       && XEXP (desc->assumptions, 0) == const0_rtx)
2880     goto fail;
2881   simplify_using_initial_values (loop, IOR, &desc->infinite);
2882
2883   /* Fallthru.  */
2884 zero_iter:
2885   desc->const_iter = true;
2886   desc->niter = 0;
2887   record_niter_bound (loop, 0, true, true);
2888   desc->noloop_assumptions = NULL_RTX;
2889   desc->niter_expr = const0_rtx;
2890   return;
2891
2892 fail:
2893   desc->simple_p = false;
2894   return;
2895 }
2896
2897 /* Checks whether E is a simple exit from LOOP and stores its description
2898    into DESC.  */
2899
2900 static void
2901 check_simple_exit (struct loop *loop, edge e, struct niter_desc *desc)
2902 {
2903   basic_block exit_bb;
2904   rtx condition;
2905   rtx_insn *at;
2906   edge ein;
2907
2908   exit_bb = e->src;
2909   desc->simple_p = false;
2910
2911   /* It must belong directly to the loop.  */
2912   if (exit_bb->loop_father != loop)
2913     return;
2914
2915   /* It must be tested (at least) once during any iteration.  */
2916   if (!dominated_by_p (CDI_DOMINATORS, loop->latch, exit_bb))
2917     return;
2918
2919   /* It must end in a simple conditional jump.  */
2920   if (!any_condjump_p (BB_END (exit_bb)))
2921     return;
2922
2923   ein = EDGE_SUCC (exit_bb, 0);
2924   if (ein == e)
2925     ein = EDGE_SUCC (exit_bb, 1);
2926
2927   desc->out_edge = e;
2928   desc->in_edge = ein;
2929
2930   /* Test whether the condition is suitable.  */
2931   if (!(condition = get_condition (BB_END (ein->src), &at, false, false)))
2932     return;
2933
2934   if (ein->flags & EDGE_FALLTHRU)
2935     {
2936       condition = reversed_condition (condition);
2937       if (!condition)
2938         return;
2939     }
2940
2941   /* Check that we are able to determine number of iterations and fill
2942      in information about it.  */
2943   iv_number_of_iterations (loop, at, condition, desc);
2944 }
2945
2946 /* Finds a simple exit of LOOP and stores its description into DESC.  */
2947
2948 void
2949 find_simple_exit (struct loop *loop, struct niter_desc *desc)
2950 {
2951   unsigned i;
2952   basic_block *body;
2953   edge e;
2954   struct niter_desc act;
2955   bool any = false;
2956   edge_iterator ei;
2957
2958   desc->simple_p = false;
2959   body = get_loop_body (loop);
2960
2961   for (i = 0; i < loop->num_nodes; i++)
2962     {
2963       FOR_EACH_EDGE (e, ei, body[i]->succs)
2964         {
2965           if (flow_bb_inside_loop_p (loop, e->dest))
2966             continue;
2967
2968           check_simple_exit (loop, e, &act);
2969           if (!act.simple_p)
2970             continue;
2971
2972           if (!any)
2973             any = true;
2974           else
2975             {
2976               /* Prefer constant iterations; the less the better.  */
2977               if (!act.const_iter
2978                   || (desc->const_iter && act.niter >= desc->niter))
2979                 continue;
2980
2981               /* Also if the actual exit may be infinite, while the old one
2982                  not, prefer the old one.  */
2983               if (act.infinite && !desc->infinite)
2984                 continue;
2985             }
2986
2987           *desc = act;
2988         }
2989     }
2990
2991   if (dump_file)
2992     {
2993       if (desc->simple_p)
2994         {
2995           fprintf (dump_file, "Loop %d is simple:\n", loop->num);
2996           fprintf (dump_file, "  simple exit %d -> %d\n",
2997                    desc->out_edge->src->index,
2998                    desc->out_edge->dest->index);
2999           if (desc->assumptions)
3000             {
3001               fprintf (dump_file, "  assumptions: ");
3002               print_rtl (dump_file, desc->assumptions);
3003               fprintf (dump_file, "\n");
3004             }
3005           if (desc->noloop_assumptions)
3006             {
3007               fprintf (dump_file, "  does not roll if: ");
3008               print_rtl (dump_file, desc->noloop_assumptions);
3009               fprintf (dump_file, "\n");
3010             }
3011           if (desc->infinite)
3012             {
3013               fprintf (dump_file, "  infinite if: ");
3014               print_rtl (dump_file, desc->infinite);
3015               fprintf (dump_file, "\n");
3016             }
3017
3018           fprintf (dump_file, "  number of iterations: ");
3019           print_rtl (dump_file, desc->niter_expr);
3020           fprintf (dump_file, "\n");
3021
3022           fprintf (dump_file, "  upper bound: %li\n",
3023                    (long)get_max_loop_iterations_int (loop));
3024           fprintf (dump_file, "  realistic bound: %li\n",
3025                    (long)get_estimated_loop_iterations_int (loop));
3026         }
3027       else
3028         fprintf (dump_file, "Loop %d is not simple.\n", loop->num);
3029     }
3030
3031   free (body);
3032 }
3033
3034 /* Creates a simple loop description of LOOP if it was not computed
3035    already.  */
3036
3037 struct niter_desc *
3038 get_simple_loop_desc (struct loop *loop)
3039 {
3040   struct niter_desc *desc = simple_loop_desc (loop);
3041
3042   if (desc)
3043     return desc;
3044
3045   /* At least desc->infinite is not always initialized by
3046      find_simple_loop_exit.  */
3047   desc = ggc_cleared_alloc<niter_desc> ();
3048   iv_analysis_loop_init (loop);
3049   find_simple_exit (loop, desc);
3050   loop->simple_loop_desc = desc;
3051
3052   if (desc->simple_p && (desc->assumptions || desc->infinite))
3053     {
3054       const char *wording;
3055
3056       /* Assume that no overflow happens and that the loop is finite.
3057          We already warned at the tree level if we ran optimizations there.  */
3058       if (!flag_tree_loop_optimize && warn_unsafe_loop_optimizations)
3059         {
3060           if (desc->infinite)
3061             {
3062               wording =
3063                 flag_unsafe_loop_optimizations
3064                 ? N_("assuming that the loop is not infinite")
3065                 : N_("cannot optimize possibly infinite loops");
3066               warning (OPT_Wunsafe_loop_optimizations, "%s",
3067                        gettext (wording));
3068             }
3069           if (desc->assumptions)
3070             {
3071               wording =
3072                 flag_unsafe_loop_optimizations
3073                 ? N_("assuming that the loop counter does not overflow")
3074                 : N_("cannot optimize loop, the loop counter may overflow");
3075               warning (OPT_Wunsafe_loop_optimizations, "%s",
3076                        gettext (wording));
3077             }
3078         }
3079
3080       if (flag_unsafe_loop_optimizations)
3081         {
3082           desc->assumptions = NULL_RTX;
3083           desc->infinite = NULL_RTX;
3084         }
3085     }
3086
3087   return desc;
3088 }
3089
3090 /* Releases simple loop description for LOOP.  */
3091
3092 void
3093 free_simple_loop_desc (struct loop *loop)
3094 {
3095   struct niter_desc *desc = simple_loop_desc (loop);
3096
3097   if (!desc)
3098     return;
3099
3100   ggc_free (desc);
3101   loop->simple_loop_desc = NULL;
3102 }