gcc/loop-iv.c

   1 /* Rtl-level induction variable analysis.
   2    Copyright (C) 2004, 2005 Free Software Foundation, Inc.
   3
   4 This file is part of GCC.
   5
   6 GCC is free software; you can redistribute it and/or modify it
   7 under the terms of the GNU General Public License as published by the
   8 Free Software Foundation; either version 2, or (at your option) any
   9 later version.
  10
  11 GCC is distributed in the hope that it will be useful, but WITHOUT
  12 ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  13 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  14 for more details.
  15
  16 You should have received a copy of the GNU General Public License
  17 along with GCC; see the file COPYING.  If not, write to the Free
  18 Software Foundation, 51 Franklin Street, Fifth Floor, Boston, MA
  19 02110-1301, USA.  */
  20
  21 /* This is a simple analysis of induction variables of the loop.  The major use
  22    is for determining the number of iterations of a loop for loop unrolling,
  23    doloop optimization and branch prediction.  The iv information is computed
  24    on demand.
  25
  26    Induction variable is analyzed by walking the use-def chains.  When a biv
  27    is found, it is cached in the bivs hash table.  When register is proved
  28    to be a giv, its description is stored to DF_REF_DATA of the def reference.
  29
  30    The analysis works always with one loop -- you must call
  31    iv_analysis_loop_init (loop) for it.  All the other functions then work with
  32    this loop.   When you need to work with another loop, just call
  33    iv_analysis_loop_init for it.  When you no longer need iv analysis, call
  34    iv_analysis_done () to clean up the memory.
  35
  36    The available functions are:
  37
  38    iv_analyze (insn, reg, iv): Stores the description of the induction variable
  39      corresponding to the use of register REG in INSN to IV.  Returns true if
  40      REG is an induction variable in INSN. false otherwise.
  41      If use of REG is not found in INSN, following insns are scanned (so that
  42      we may call this function on insn returned by get_condition).
  43    iv_analyze_result (insn, def, iv):  Stores to IV the description of the iv
  44      corresponding to DEF, which is a register defined in INSN.
  45    iv_analyze_expr (insn, rhs, mode, iv):  Stores to IV the description of iv
  46      corresponding to expression EXPR evaluated at INSN.  All registers used bu
  47      EXPR must also be used in INSN.
  48    iv_current_loop_df (): Returns the dataflow object for the current loop used
  49      by iv analysis.  */
  50
  51 #include "config.h"
  52 #include "system.h"
  53 #include "coretypes.h"
  54 #include "tm.h"
  55 #include "rtl.h"
  56 #include "hard-reg-set.h"
  57 #include "obstack.h"
  58 #include "basic-block.h"
  59 #include "cfgloop.h"
  60 #include "expr.h"
  61 #include "intl.h"
  62 #include "output.h"
  63 #include "toplev.h"
  64 #include "df.h"
  65 #include "hashtab.h"
  66
  67 /* Possible return values of iv_get_reaching_def.  */
  68
  69 enum iv_grd_result
  70 {
  71   /* More than one reaching def, or reaching def that does not
  72      dominate the use.  */
  73   GRD_INVALID,
  74
  75   /* The use is trivial invariant of the loop, i.e. is not changed
  76      inside the loop.  */
  77   GRD_INVARIANT,
  78
  79   /* The use is reached by initial value and a value from the
  80      previous iteration.  */
  81   GRD_MAYBE_BIV,
  82
  83   /* The use has single dominating def.  */
  84   GRD_SINGLE_DOM
  85 };
  86
  87 /* Information about a biv.  */
  88
  89 struct biv_entry
  90 {
  91   unsigned regno;       /* The register of the biv.  */
  92   struct rtx_iv iv;     /* Value of the biv.  */
  93 };
  94
  95 /* Induction variable stored at the reference.  */
  96 #define DF_REF_IV(REF) ((struct rtx_iv *) DF_REF_DATA (REF))
  97 #define DF_REF_IV_SET(REF, IV) DF_REF_DATA (REF) = (IV)
  98
  99 /* The current loop.  */
 100
 101 static struct loop *current_loop;
 102
 103 /* Dataflow information for the current loop.  */
 104
 105 static struct df *df = NULL;
 106
 107 /* Bivs of the current loop.  */
 108
 109 static htab_t bivs;
 110
 111 /* Return the dataflow object for the current loop.  */
 112 struct df *
 113 iv_current_loop_df (void)
 114 {
 115   return df;
 116 }
 117
 118 static bool iv_analyze_op (rtx, rtx, struct rtx_iv *);
 119
 120 /* Dumps information about IV to FILE.  */
 121
 122 extern void dump_iv_info (FILE *, struct rtx_iv *);
 123 void
 124 dump_iv_info (FILE *file, struct rtx_iv *iv)
 125 {
 126   if (!iv->base)
 127     {
 128       fprintf (file, "not simple");
 129       return;
 130     }
 131
 132   if (iv->step == const0_rtx
 133       && !iv->first_special)
 134     fprintf (file, "invariant ");
 135
 136   print_rtl (file, iv->base);
 137   if (iv->step != const0_rtx)
 138     {
 139       fprintf (file, " + ");
 140       print_rtl (file, iv->step);
 141       fprintf (file, " * iteration");
 142     }
 143   fprintf (file, " (in %s)", GET_MODE_NAME (iv->mode));
 144
 145   if (iv->mode != iv->extend_mode)
 146     fprintf (file, " %s to %s",
 147              rtx_name[iv->extend],
 148              GET_MODE_NAME (iv->extend_mode));
 149
 150   if (iv->mult != const1_rtx)
 151     {
 152       fprintf (file, " * ");
 153       print_rtl (file, iv->mult);
 154     }
 155   if (iv->delta != const0_rtx)
 156     {
 157       fprintf (file, " + ");
 158       print_rtl (file, iv->delta);
 159     }
 160   if (iv->first_special)
 161     fprintf (file, " (first special)");
 162 }
 163
 164 /* Generates a subreg to get the least significant part of EXPR (in mode
 165    INNER_MODE) to OUTER_MODE.  */
 166
 167 rtx
 168 lowpart_subreg (enum machine_mode outer_mode, rtx expr,
 169                 enum machine_mode inner_mode)
 170 {
 171   return simplify_gen_subreg (outer_mode, expr, inner_mode,
 172                               subreg_lowpart_offset (outer_mode, inner_mode));
 173 }
 174
 175 /* Checks whether REG is a well-behaved register.  */
 176
 177 static bool
 178 simple_reg_p (rtx reg)
 179 {
 180   unsigned r;
 181
 182   if (GET_CODE (reg) == SUBREG)
 183     {
 184       if (!subreg_lowpart_p (reg))
 185         return false;
 186       reg = SUBREG_REG (reg);
 187     }
 188
 189   if (!REG_P (reg))
 190     return false;
 191
 192   r = REGNO (reg);
 193   if (HARD_REGISTER_NUM_P (r))
 194     return false;
 195
 196   if (GET_MODE_CLASS (GET_MODE (reg)) != MODE_INT)
 197     return false;
 198
 199   return true;
 200 }
 201
 202 /* Clears the information about ivs stored in df.  */
 203
 204 static void
 205 clear_iv_info (void)
 206 {
 207   unsigned i, n_defs = DF_DEFS_SIZE (df);
 208   struct rtx_iv *iv;
 209   struct df_ref *def;
 210
 211   for (i = 0; i < n_defs; i++)
 212     {
 213       def = DF_DEFS_GET (df, i);
 214       iv = DF_REF_IV (def);
 215       if (!iv)
 216         continue;
 217       free (iv);
 218       DF_REF_IV_SET (def, NULL);
 219     }
 220
 221   htab_empty (bivs);
 222 }
 223
 224 /* Returns hash value for biv B.  */
 225
 226 static hashval_t
 227 biv_hash (const void *b)
 228 {
 229   return ((const struct biv_entry *) b)->regno;
 230 }
 231
 232 /* Compares biv B and register R.  */
 233
 234 static int
 235 biv_eq (const void *b, const void *r)
 236 {
 237   return ((const struct biv_entry *) b)->regno == REGNO ((rtx) r);
 238 }
 239
 240 /* Prepare the data for an induction variable analysis of a LOOP.  */
 241
 242 void
 243 iv_analysis_loop_init (struct loop *loop)
 244 {
 245   basic_block *body = get_loop_body_in_dom_order (loop), bb;
 246   bitmap blocks = BITMAP_ALLOC (NULL);
 247   unsigned i;
 248   bool first_time = (df == NULL);
 249
 250   current_loop = loop;
 251
 252   /* Clear the information from the analysis of the previous loop.  */
 253   if (first_time)
 254     {
 255       df = df_init (DF_HARD_REGS | DF_EQUIV_NOTES);
 256       df_chain_add_problem (df, DF_UD_CHAIN);
 257       bivs = htab_create (10, biv_hash, biv_eq, free);
 258     }
 259   else
 260     clear_iv_info ();
 261
 262   for (i = 0; i < loop->num_nodes; i++)
 263     {
 264       bb = body[i];
 265       bitmap_set_bit (blocks, bb->index);
 266     }
 267   df_set_blocks (df, blocks);
 268   df_analyze (df);
 269   BITMAP_FREE (blocks);
 270   free (body);
 271 }
 272
 273 /* Finds the definition of REG that dominates loop latch and stores
 274    it to DEF.  Returns false if there is not a single definition
 275    dominating the latch.  If REG has no definition in loop, DEF
 276    is set to NULL and true is returned.  */
 277
 278 static bool
 279 latch_dominating_def (rtx reg, struct df_ref **def)
 280 {
 281   struct df_ref *single_rd = NULL, *adef;
 282   unsigned regno = REGNO (reg);
 283   struct df_reg_info *reg_info = DF_REG_DEF_GET (df, regno);
 284   struct df_rd_bb_info *bb_info = DF_RD_BB_INFO (df, current_loop->latch);
 285
 286   for (adef = reg_info->reg_chain; adef; adef = adef->next_reg)
 287     {
 288       if (!bitmap_bit_p (bb_info->out, DF_REF_ID (adef)))
 289         continue;
 290
 291       /* More than one reaching definition.  */
 292       if (single_rd)
 293         return false;
 294
 295       if (!just_once_each_iteration_p (current_loop, DF_REF_BB (adef)))
 296         return false;
 297
 298       single_rd = adef;
 299     }
 300
 301   *def = single_rd;
 302   return true;
 303 }
 304
 305 /* Gets definition of REG reaching its use in INSN and stores it to DEF.  */
 306
 307 static enum iv_grd_result
 308 iv_get_reaching_def (rtx insn, rtx reg, struct df_ref **def)
 309 {
 310   struct df_ref *use, *adef;
 311   basic_block def_bb, use_bb;
 312   rtx def_insn;
 313   bool dom_p;
 314
 315   *def = NULL;
 316   if (!simple_reg_p (reg))
 317     return GRD_INVALID;
 318   if (GET_CODE (reg) == SUBREG)
 319     reg = SUBREG_REG (reg);
 320   gcc_assert (REG_P (reg));
 321
 322   use = df_find_use (df, insn, reg);
 323   gcc_assert (use != NULL);
 324
 325   if (!DF_REF_CHAIN (use))
 326     return GRD_INVARIANT;
 327
 328   /* More than one reaching def.  */
 329   if (DF_REF_CHAIN (use)->next)
 330     return GRD_INVALID;
 331
 332   adef = DF_REF_CHAIN (use)->ref;
 333   def_insn = DF_REF_INSN (adef);
 334   def_bb = DF_REF_BB (adef);
 335   use_bb = BLOCK_FOR_INSN (insn);
 336
 337   if (use_bb == def_bb)
 338     dom_p = (DF_INSN_LUID (df, def_insn) < DF_INSN_LUID (df, insn));
 339   else
 340     dom_p = dominated_by_p (CDI_DOMINATORS, use_bb, def_bb);
 341
 342   if (dom_p)
 343     {
 344       *def = adef;
 345       return GRD_SINGLE_DOM;
 346     }
 347
 348   /* The definition does not dominate the use.  This is still OK if
 349      this may be a use of a biv, i.e. if the def_bb dominates loop
 350      latch.  */
 351   if (just_once_each_iteration_p (current_loop, def_bb))
 352     return GRD_MAYBE_BIV;
 353
 354   return GRD_INVALID;
 355 }
 356
 357 /* Sets IV to invariant CST in MODE.  Always returns true (just for
 358    consistency with other iv manipulation functions that may fail).  */
 359
 360 static bool
 361 iv_constant (struct rtx_iv *iv, rtx cst, enum machine_mode mode)
 362 {
 363   if (mode == VOIDmode)
 364     mode = GET_MODE (cst);
 365
 366   iv->mode = mode;
 367   iv->base = cst;
 368   iv->step = const0_rtx;
 369   iv->first_special = false;
 370   iv->extend = UNKNOWN;
 371   iv->extend_mode = iv->mode;
 372   iv->delta = const0_rtx;
 373   iv->mult = const1_rtx;
 374
 375   return true;
 376 }
 377
 378 /* Evaluates application of subreg to MODE on IV.  */
 379
 380 static bool
 381 iv_subreg (struct rtx_iv *iv, enum machine_mode mode)
 382 {
 383   /* If iv is invariant, just calculate the new value.  */
 384   if (iv->step == const0_rtx
 385       && !iv->first_special)
 386     {
 387       rtx val = get_iv_value (iv, const0_rtx);
 388       val = lowpart_subreg (mode, val, iv->extend_mode);
 389
 390       iv->base = val;
 391       iv->extend = UNKNOWN;
 392       iv->mode = iv->extend_mode = mode;
 393       iv->delta = const0_rtx;
 394       iv->mult = const1_rtx;
 395       return true;
 396     }
 397
 398   if (iv->extend_mode == mode)
 399     return true;
 400
 401   if (GET_MODE_BITSIZE (mode) > GET_MODE_BITSIZE (iv->mode))
 402     return false;
 403
 404   iv->extend = UNKNOWN;
 405   iv->mode = mode;
 406
 407   iv->base = simplify_gen_binary (PLUS, iv->extend_mode, iv->delta,
 408                                   simplify_gen_binary (MULT, iv->extend_mode,
 409                                                        iv->base, iv->mult));
 410   iv->step = simplify_gen_binary (MULT, iv->extend_mode, iv->step, iv->mult);
 411   iv->mult = const1_rtx;
 412   iv->delta = const0_rtx;
 413   iv->first_special = false;
 414
 415   return true;
 416 }
 417
 418 /* Evaluates application of EXTEND to MODE on IV.  */
 419
 420 static bool
 421 iv_extend (struct rtx_iv *iv, enum rtx_code extend, enum machine_mode mode)
 422 {
 423   /* If iv is invariant, just calculate the new value.  */
 424   if (iv->step == const0_rtx
 425       && !iv->first_special)
 426     {
 427       rtx val = get_iv_value (iv, const0_rtx);
 428       val = simplify_gen_unary (extend, mode, val, iv->extend_mode);
 429
 430       iv->base = val;
 431       iv->extend = UNKNOWN;
 432       iv->mode = iv->extend_mode = mode;
 433       iv->delta = const0_rtx;
 434       iv->mult = const1_rtx;
 435       return true;
 436     }
 437
 438   if (mode != iv->extend_mode)
 439     return false;
 440
 441   if (iv->extend != UNKNOWN
 442       && iv->extend != extend)
 443     return false;
 444
 445   iv->extend = extend;
 446
 447   return true;
 448 }
 449
 450 /* Evaluates negation of IV.  */
 451
 452 static bool
 453 iv_neg (struct rtx_iv *iv)
 454 {
 455   if (iv->extend == UNKNOWN)
 456     {
 457       iv->base = simplify_gen_unary (NEG, iv->extend_mode,
 458                                      iv->base, iv->extend_mode);
 459       iv->step = simplify_gen_unary (NEG, iv->extend_mode,
 460                                      iv->step, iv->extend_mode);
 461     }
 462   else
 463     {
 464       iv->delta = simplify_gen_unary (NEG, iv->extend_mode,
 465                                       iv->delta, iv->extend_mode);
 466       iv->mult = simplify_gen_unary (NEG, iv->extend_mode,
 467                                      iv->mult, iv->extend_mode);
 468     }
 469
 470   return true;
 471 }
 472
 473 /* Evaluates addition or subtraction (according to OP) of IV1 to IV0.  */
 474
 475 static bool
 476 iv_add (struct rtx_iv *iv0, struct rtx_iv *iv1, enum rtx_code op)
 477 {
 478   enum machine_mode mode;
 479   rtx arg;
 480
 481   /* Extend the constant to extend_mode of the other operand if necessary.  */
 482   if (iv0->extend == UNKNOWN
 483       && iv0->mode == iv0->extend_mode
 484       && iv0->step == const0_rtx
 485       && GET_MODE_SIZE (iv0->extend_mode) < GET_MODE_SIZE (iv1->extend_mode))
 486     {
 487       iv0->extend_mode = iv1->extend_mode;
 488       iv0->base = simplify_gen_unary (ZERO_EXTEND, iv0->extend_mode,
 489                                       iv0->base, iv0->mode);
 490     }
 491   if (iv1->extend == UNKNOWN
 492       && iv1->mode == iv1->extend_mode
 493       && iv1->step == const0_rtx
 494       && GET_MODE_SIZE (iv1->extend_mode) < GET_MODE_SIZE (iv0->extend_mode))
 495     {
 496       iv1->extend_mode = iv0->extend_mode;
 497       iv1->base = simplify_gen_unary (ZERO_EXTEND, iv1->extend_mode,
 498                                       iv1->base, iv1->mode);
 499     }
 500
 501   mode = iv0->extend_mode;
 502   if (mode != iv1->extend_mode)
 503     return false;
 504
 505   if (iv0->extend == UNKNOWN && iv1->extend == UNKNOWN)
 506     {
 507       if (iv0->mode != iv1->mode)
 508         return false;
 509
 510       iv0->base = simplify_gen_binary (op, mode, iv0->base, iv1->base);
 511       iv0->step = simplify_gen_binary (op, mode, iv0->step, iv1->step);
 512
 513       return true;
 514     }
 515
 516   /* Handle addition of constant.  */
 517   if (iv1->extend == UNKNOWN
 518       && iv1->mode == mode
 519       && iv1->step == const0_rtx)
 520     {
 521       iv0->delta = simplify_gen_binary (op, mode, iv0->delta, iv1->base);
 522       return true;
 523     }
 524
 525   if (iv0->extend == UNKNOWN
 526       && iv0->mode == mode
 527       && iv0->step == const0_rtx)
 528     {
 529       arg = iv0->base;
 530       *iv0 = *iv1;
 531       if (op == MINUS
 532           && !iv_neg (iv0))
 533         return false;
 534
 535       iv0->delta = simplify_gen_binary (PLUS, mode, iv0->delta, arg);
 536       return true;
 537     }
 538
 539   return false;
 540 }
 541
 542 /* Evaluates multiplication of IV by constant CST.  */
 543
 544 static bool
 545 iv_mult (struct rtx_iv *iv, rtx mby)
 546 {
 547   enum machine_mode mode = iv->extend_mode;
 548
 549   if (GET_MODE (mby) != VOIDmode
 550       && GET_MODE (mby) != mode)
 551     return false;
 552
 553   if (iv->extend == UNKNOWN)
 554     {
 555       iv->base = simplify_gen_binary (MULT, mode, iv->base, mby);
 556       iv->step = simplify_gen_binary (MULT, mode, iv->step, mby);
 557     }
 558   else
 559     {
 560       iv->delta = simplify_gen_binary (MULT, mode, iv->delta, mby);
 561       iv->mult = simplify_gen_binary (MULT, mode, iv->mult, mby);
 562     }
 563
 564   return true;
 565 }
 566
 567 /* Evaluates shift of IV by constant CST.  */
 568
 569 static bool
 570 iv_shift (struct rtx_iv *iv, rtx mby)
 571 {
 572   enum machine_mode mode = iv->extend_mode;
 573
 574   if (GET_MODE (mby) != VOIDmode
 575       && GET_MODE (mby) != mode)
 576     return false;
 577
 578   if (iv->extend == UNKNOWN)
 579     {
 580       iv->base = simplify_gen_binary (ASHIFT, mode, iv->base, mby);
 581       iv->step = simplify_gen_binary (ASHIFT, mode, iv->step, mby);
 582     }
 583   else
 584     {
 585       iv->delta = simplify_gen_binary (ASHIFT, mode, iv->delta, mby);
 586       iv->mult = simplify_gen_binary (ASHIFT, mode, iv->mult, mby);
 587     }
 588
 589   return true;
 590 }
 591
 592 /* The recursive part of get_biv_step.  Gets the value of the single value
 593    defined by DEF wrto initial value of REG inside loop, in shape described
 594    at get_biv_step.  */
 595
 596 static bool
 597 get_biv_step_1 (struct df_ref *def, rtx reg,
 598                 rtx *inner_step, enum machine_mode *inner_mode,
 599                 enum rtx_code *extend, enum machine_mode outer_mode,
 600                 rtx *outer_step)
 601 {
 602   rtx set, rhs, op0 = NULL_RTX, op1 = NULL_RTX;
 603   rtx next, nextr, tmp;
 604   enum rtx_code code;
 605   rtx insn = DF_REF_INSN (def);
 606   struct df_ref *next_def;
 607   enum iv_grd_result res;
 608
 609   set = single_set (insn);
 610   if (!set)
 611     return false;
 612
 613   rhs = find_reg_equal_equiv_note (insn);
 614   if (rhs)
 615     rhs = XEXP (rhs, 0);
 616   else
 617     rhs = SET_SRC (set);
 618
 619   code = GET_CODE (rhs);
 620   switch (code)
 621     {
 622     case SUBREG:
 623     case REG:
 624       next = rhs;
 625       break;
 626
 627     case PLUS:
 628     case MINUS:
 629       op0 = XEXP (rhs, 0);
 630       op1 = XEXP (rhs, 1);
 631
 632       if (code == PLUS && CONSTANT_P (op0))
 633         {
 634           tmp = op0; op0 = op1; op1 = tmp;
 635         }
 636
 637       if (!simple_reg_p (op0)
 638           || !CONSTANT_P (op1))
 639         return false;
 640
 641       if (GET_MODE (rhs) != outer_mode)
 642         {
 643           /* ppc64 uses expressions like
 644
 645              (set x:SI (plus:SI (subreg:SI y:DI) 1)).
 646
 647              this is equivalent to
 648
 649              (set x':DI (plus:DI y:DI 1))
 650              (set x:SI (subreg:SI (x':DI)).  */
 651           if (GET_CODE (op0) != SUBREG)
 652             return false;
 653           if (GET_MODE (SUBREG_REG (op0)) != outer_mode)
 654             return false;
 655         }
 656
 657       next = op0;
 658       break;
 659
 660     case SIGN_EXTEND:
 661     case ZERO_EXTEND:
 662       if (GET_MODE (rhs) != outer_mode)
 663         return false;
 664
 665       op0 = XEXP (rhs, 0);
 666       if (!simple_reg_p (op0))
 667         return false;
 668
 669       next = op0;
 670       break;
 671
 672     default:
 673       return false;
 674     }
 675
 676   if (GET_CODE (next) == SUBREG)
 677     {
 678       if (!subreg_lowpart_p (next))
 679         return false;
 680
 681       nextr = SUBREG_REG (next);
 682       if (GET_MODE (nextr) != outer_mode)
 683         return false;
 684     }
 685   else
 686     nextr = next;
 687
 688   res = iv_get_reaching_def (insn, nextr, &next_def);
 689
 690   if (res == GRD_INVALID || res == GRD_INVARIANT)
 691     return false;
 692
 693   if (res == GRD_MAYBE_BIV)
 694     {
 695       if (!rtx_equal_p (nextr, reg))
 696         return false;
 697
 698       *inner_step = const0_rtx;
 699       *extend = UNKNOWN;
 700       *inner_mode = outer_mode;
 701       *outer_step = const0_rtx;
 702     }
 703   else if (!get_biv_step_1 (next_def, reg,
 704                             inner_step, inner_mode, extend, outer_mode,
 705                             outer_step))
 706     return false;
 707
 708   if (GET_CODE (next) == SUBREG)
 709     {
 710       enum machine_mode amode = GET_MODE (next);
 711
 712       if (GET_MODE_SIZE (amode) > GET_MODE_SIZE (*inner_mode))
 713         return false;
 714
 715       *inner_mode = amode;
 716       *inner_step = simplify_gen_binary (PLUS, outer_mode,
 717                                          *inner_step, *outer_step);
 718       *outer_step = const0_rtx;
 719       *extend = UNKNOWN;
 720     }
 721
 722   switch (code)
 723     {
 724     case REG:
 725     case SUBREG:
 726       break;
 727
 728     case PLUS:
 729     case MINUS:
 730       if (*inner_mode == outer_mode
 731           /* See comment in previous switch.  */
 732           || GET_MODE (rhs) != outer_mode)
 733         *inner_step = simplify_gen_binary (code, outer_mode,
 734                                            *inner_step, op1);
 735       else
 736         *outer_step = simplify_gen_binary (code, outer_mode,
 737                                            *outer_step, op1);
 738       break;
 739
 740     case SIGN_EXTEND:
 741     case ZERO_EXTEND:
 742       gcc_assert (GET_MODE (op0) == *inner_mode
 743                   && *extend == UNKNOWN
 744                   && *outer_step == const0_rtx);
 745
 746       *extend = code;
 747       break;
 748
 749     default:
 750       return false;
 751     }
 752
 753   return true;
 754 }
 755
 756 /* Gets the operation on register REG inside loop, in shape
 757
 758    OUTER_STEP + EXTEND_{OUTER_MODE} (SUBREG_{INNER_MODE} (REG + INNER_STEP))
 759
 760    If the operation cannot be described in this shape, return false.
 761    LAST_DEF is the definition of REG that dominates loop latch.  */
 762
 763 static bool
 764 get_biv_step (struct df_ref *last_def, rtx reg, rtx *inner_step,
 765               enum machine_mode *inner_mode, enum rtx_code *extend,
 766               enum machine_mode *outer_mode, rtx *outer_step)
 767 {
 768   *outer_mode = GET_MODE (reg);
 769
 770   if (!get_biv_step_1 (last_def, reg,
 771                        inner_step, inner_mode, extend, *outer_mode,
 772                        outer_step))
 773     return false;
 774
 775   gcc_assert ((*inner_mode == *outer_mode) != (*extend != UNKNOWN));
 776   gcc_assert (*inner_mode != *outer_mode || *outer_step == const0_rtx);
 777
 778   return true;
 779 }
 780
 781 /* Records information that DEF is induction variable IV.  */
 782
 783 static void
 784 record_iv (struct df_ref *def, struct rtx_iv *iv)
 785 {
 786   struct rtx_iv *recorded_iv = XNEW (struct rtx_iv);
 787
 788   *recorded_iv = *iv;
 789   DF_REF_IV_SET (def, recorded_iv);
 790 }
 791
 792 /* If DEF was already analyzed for bivness, store the description of the biv to
 793    IV and return true.  Otherwise return false.  */
 794
 795 static bool
 796 analyzed_for_bivness_p (rtx def, struct rtx_iv *iv)
 797 {
 798   struct biv_entry *biv = htab_find_with_hash (bivs, def, REGNO (def));
 799
 800   if (!biv)
 801     return false;
 802
 803   *iv = biv->iv;
 804   return true;
 805 }
 806
 807 static void
 808 record_biv (rtx def, struct rtx_iv *iv)
 809 {
 810   struct biv_entry *biv = XNEW (struct biv_entry);
 811   void **slot = htab_find_slot_with_hash (bivs, def, REGNO (def), INSERT);
 812
 813   biv->regno = REGNO (def);
 814   biv->iv = *iv;
 815   gcc_assert (!*slot);
 816   *slot = biv;
 817 }
 818
 819 /* Determines whether DEF is a biv and if so, stores its description
 820    to *IV.  */
 821
 822 static bool
 823 iv_analyze_biv (rtx def, struct rtx_iv *iv)
 824 {
 825   rtx inner_step, outer_step;
 826   enum machine_mode inner_mode, outer_mode;
 827   enum rtx_code extend;
 828   struct df_ref *last_def;
 829
 830   if (dump_file)
 831     {
 832       fprintf (dump_file, "Analyzing ");
 833       print_rtl (dump_file, def);
 834       fprintf (dump_file, " for bivness.\n");
 835     }
 836
 837   if (!REG_P (def))
 838     {
 839       if (!CONSTANT_P (def))
 840         return false;
 841
 842       return iv_constant (iv, def, VOIDmode);
 843     }
 844
 845   if (!latch_dominating_def (def, &last_def))
 846     {
 847       if (dump_file)
 848         fprintf (dump_file, "  not simple.\n");
 849       return false;
 850     }
 851
 852   if (!last_def)
 853     return iv_constant (iv, def, VOIDmode);
 854
 855   if (analyzed_for_bivness_p (def, iv))
 856     {
 857       if (dump_file)
 858         fprintf (dump_file, "  already analysed.\n");
 859       return iv->base != NULL_RTX;
 860     }
 861
 862   if (!get_biv_step (last_def, def, &inner_step, &inner_mode, &extend,
 863                      &outer_mode, &outer_step))
 864     {
 865       iv->base = NULL_RTX;
 866       goto end;
 867     }
 868
 869   /* Loop transforms base to es (base + inner_step) + outer_step,
 870      where es means extend of subreg between inner_mode and outer_mode.
 871      The corresponding induction variable is
 872
 873      es ((base - outer_step) + i * (inner_step + outer_step)) + outer_step  */
 874
 875   iv->base = simplify_gen_binary (MINUS, outer_mode, def, outer_step);
 876   iv->step = simplify_gen_binary (PLUS, outer_mode, inner_step, outer_step);
 877   iv->mode = inner_mode;
 878   iv->extend_mode = outer_mode;
 879   iv->extend = extend;
 880   iv->mult = const1_rtx;
 881   iv->delta = outer_step;
 882   iv->first_special = inner_mode != outer_mode;
 883
 884  end:
 885   if (dump_file)
 886     {
 887       fprintf (dump_file, "  ");
 888       dump_iv_info (dump_file, iv);
 889       fprintf (dump_file, "\n");
 890     }
 891
 892   record_biv (def, iv);
 893   return iv->base != NULL_RTX;
 894 }
 895
 896 /* Analyzes expression RHS used at INSN and stores the result to *IV.
 897    The mode of the induction variable is MODE.  */
 898
 899 bool
 900 iv_analyze_expr (rtx insn, rtx rhs, enum machine_mode mode, struct rtx_iv *iv)
 901 {
 902   rtx mby = NULL_RTX, tmp;
 903   rtx op0 = NULL_RTX, op1 = NULL_RTX;
 904   struct rtx_iv iv0, iv1;
 905   enum rtx_code code = GET_CODE (rhs);
 906   enum machine_mode omode = mode;
 907
 908   iv->mode = VOIDmode;
 909   iv->base = NULL_RTX;
 910   iv->step = NULL_RTX;
 911
 912   gcc_assert (GET_MODE (rhs) == mode || GET_MODE (rhs) == VOIDmode);
 913
 914   if (CONSTANT_P (rhs)
 915       || REG_P (rhs)
 916       || code == SUBREG)
 917     {
 918       if (!iv_analyze_op (insn, rhs, iv))
 919         return false;
 920
 921       if (iv->mode == VOIDmode)
 922         {
 923           iv->mode = mode;
 924           iv->extend_mode = mode;
 925         }
 926
 927       return true;
 928     }
 929
 930   switch (code)
 931     {
 932     case REG:
 933       op0 = rhs;
 934       break;
 935
 936     case SIGN_EXTEND:
 937     case ZERO_EXTEND:
 938     case NEG:
 939       op0 = XEXP (rhs, 0);
 940       omode = GET_MODE (op0);
 941       break;
 942
 943     case PLUS:
 944     case MINUS:
 945       op0 = XEXP (rhs, 0);
 946       op1 = XEXP (rhs, 1);
 947       break;
 948
 949     case MULT:
 950       op0 = XEXP (rhs, 0);
 951       mby = XEXP (rhs, 1);
 952       if (!CONSTANT_P (mby))
 953         {
 954           tmp = op0;
 955           op0 = mby;
 956           mby = tmp;
 957         }
 958       if (!CONSTANT_P (mby))
 959         return false;
 960       break;
 961
 962     case ASHIFT:
 963       op0 = XEXP (rhs, 0);
 964       mby = XEXP (rhs, 1);
 965       if (!CONSTANT_P (mby))
 966         return false;
 967       break;
 968
 969     default:
 970       return false;
 971     }
 972
 973   if (op0
 974       && !iv_analyze_expr (insn, op0, omode, &iv0))
 975     return false;
 976
 977   if (op1
 978       && !iv_analyze_expr (insn, op1, omode, &iv1))
 979     return false;
 980
 981   switch (code)
 982     {
 983     case SIGN_EXTEND:
 984     case ZERO_EXTEND:
 985       if (!iv_extend (&iv0, code, mode))
 986         return false;
 987       break;
 988
 989     case NEG:
 990       if (!iv_neg (&iv0))
 991         return false;
 992       break;
 993
 994     case PLUS:
 995     case MINUS:
 996       if (!iv_add (&iv0, &iv1, code))
 997         return false;
 998       break;
 999
1000     case MULT:
1001       if (!iv_mult (&iv0, mby))
1002         return false;
1003       break;
1004
1005     case ASHIFT:
1006       if (!iv_shift (&iv0, mby))
1007         return false;
1008       break;
1009
1010     default:
1011       break;
1012     }
1013
1014   *iv = iv0;
1015   return iv->base != NULL_RTX;
1016 }
1017
1018 /* Analyzes iv DEF and stores the result to *IV.  */
1019
1020 static bool
1021 iv_analyze_def (struct df_ref *def, struct rtx_iv *iv)
1022 {
1023   rtx insn = DF_REF_INSN (def);
1024   rtx reg = DF_REF_REG (def);
1025   rtx set, rhs;
1026
1027   if (dump_file)
1028     {
1029       fprintf (dump_file, "Analysing def of ");
1030       print_rtl (dump_file, reg);
1031       fprintf (dump_file, " in insn ");
1032       print_rtl_single (dump_file, insn);
1033     }
1034
1035   if (DF_REF_IV (def))
1036     {
1037       if (dump_file)
1038         fprintf (dump_file, "  already analysed.\n");
1039       *iv = *DF_REF_IV (def);
1040       return iv->base != NULL_RTX;
1041     }
1042
1043   iv->mode = VOIDmode;
1044   iv->base = NULL_RTX;
1045   iv->step = NULL_RTX;
1046
1047   set = single_set (insn);
1048   if (!set || SET_DEST (set) != reg)
1049     return false;
1050
1051   rhs = find_reg_equal_equiv_note (insn);
1052   if (rhs)
1053     rhs = XEXP (rhs, 0);
1054   else
1055     rhs = SET_SRC (set);
1056
1057   iv_analyze_expr (insn, rhs, GET_MODE (reg), iv);
1058   record_iv (def, iv);
1059
1060   if (dump_file)
1061     {
1062       print_rtl (dump_file, reg);
1063       fprintf (dump_file, " in insn ");
1064       print_rtl_single (dump_file, insn);
1065       fprintf (dump_file, "  is ");
1066       dump_iv_info (dump_file, iv);
1067       fprintf (dump_file, "\n");
1068     }
1069
1070   return iv->base != NULL_RTX;
1071 }
1072
1073 /* Analyzes operand OP of INSN and stores the result to *IV.  */
1074
1075 static bool
1076 iv_analyze_op (rtx insn, rtx op, struct rtx_iv *iv)
1077 {
1078   struct df_ref *def = NULL;
1079   enum iv_grd_result res;
1080
1081   if (dump_file)
1082     {
1083       fprintf (dump_file, "Analysing operand ");
1084       print_rtl (dump_file, op);
1085       fprintf (dump_file, " of insn ");
1086       print_rtl_single (dump_file, insn);
1087     }
1088
1089   if (CONSTANT_P (op))
1090     res = GRD_INVARIANT;
1091   else if (GET_CODE (op) == SUBREG)
1092     {
1093       if (!subreg_lowpart_p (op))
1094         return false;
1095
1096       if (!iv_analyze_op (insn, SUBREG_REG (op), iv))
1097         return false;
1098
1099       return iv_subreg (iv, GET_MODE (op));
1100     }
1101   else
1102     {
1103       res = iv_get_reaching_def (insn, op, &def);
1104       if (res == GRD_INVALID)
1105         {
1106           if (dump_file)
1107             fprintf (dump_file, "  not simple.\n");
1108           return false;
1109         }
1110     }
1111
1112   if (res == GRD_INVARIANT)
1113     {
1114       iv_constant (iv, op, VOIDmode);
1115
1116       if (dump_file)
1117         {
1118           fprintf (dump_file, "  ");
1119           dump_iv_info (dump_file, iv);
1120           fprintf (dump_file, "\n");
1121         }
1122       return true;
1123     }
1124
1125   if (res == GRD_MAYBE_BIV)
1126     return iv_analyze_biv (op, iv);
1127
1128   return iv_analyze_def (def, iv);
1129 }
1130
1131 /* Analyzes value VAL at INSN and stores the result to *IV.  */
1132
1133 bool
1134 iv_analyze (rtx insn, rtx val, struct rtx_iv *iv)
1135 {
1136   rtx reg;
1137
1138   /* We must find the insn in that val is used, so that we get to UD chains.
1139      Since the function is sometimes called on result of get_condition,
1140      this does not necessarily have to be directly INSN; scan also the
1141      following insns.  */
1142   if (simple_reg_p (val))
1143     {
1144       if (GET_CODE (val) == SUBREG)
1145         reg = SUBREG_REG (val);
1146       else
1147         reg = val;
1148
1149       while (!df_find_use (df, insn, reg))
1150         insn = NEXT_INSN (insn);
1151     }
1152
1153   return iv_analyze_op (insn, val, iv);
1154 }
1155
1156 /* Analyzes definition of DEF in INSN and stores the result to IV.  */
1157
1158 bool
1159 iv_analyze_result (rtx insn, rtx def, struct rtx_iv *iv)
1160 {
1161   struct df_ref *adef;
1162
1163   adef = df_find_def (df, insn, def);
1164   if (!adef)
1165     return false;
1166
1167   return iv_analyze_def (adef, iv);
1168 }
1169
1170 /* Checks whether definition of register REG in INSN is a basic induction
1171    variable.  IV analysis must have been initialized (via a call to
1172    iv_analysis_loop_init) for this function to produce a result.  */
1173
1174 bool
1175 biv_p (rtx insn, rtx reg)
1176 {
1177   struct rtx_iv iv;
1178   struct df_ref *def, *last_def;
1179
1180   if (!simple_reg_p (reg))
1181     return false;
1182
1183   def = df_find_def (df, insn, reg);
1184   gcc_assert (def != NULL);
1185   if (!latch_dominating_def (reg, &last_def))
1186     return false;
1187   if (last_def != def)
1188     return false;
1189
1190   if (!iv_analyze_biv (reg, &iv))
1191     return false;
1192
1193   return iv.step != const0_rtx;
1194 }
1195
1196 /* Calculates value of IV at ITERATION-th iteration.  */
1197
1198 rtx
1199 get_iv_value (struct rtx_iv *iv, rtx iteration)
1200 {
1201   rtx val;
1202
1203   /* We would need to generate some if_then_else patterns, and so far
1204      it is not needed anywhere.  */
1205   gcc_assert (!iv->first_special);
1206
1207   if (iv->step != const0_rtx && iteration != const0_rtx)
1208     val = simplify_gen_binary (PLUS, iv->extend_mode, iv->base,
1209                                simplify_gen_binary (MULT, iv->extend_mode,
1210                                                     iv->step, iteration));
1211   else
1212     val = iv->base;
1213
1214   if (iv->extend_mode == iv->mode)
1215     return val;
1216
1217   val = lowpart_subreg (iv->mode, val, iv->extend_mode);
1218
1219   if (iv->extend == UNKNOWN)
1220     return val;
1221
1222   val = simplify_gen_unary (iv->extend, iv->extend_mode, val, iv->mode);
1223   val = simplify_gen_binary (PLUS, iv->extend_mode, iv->delta,
1224                              simplify_gen_binary (MULT, iv->extend_mode,
1225                                                   iv->mult, val));
1226
1227   return val;
1228 }
1229
1230 /* Free the data for an induction variable analysis.  */
1231
1232 void
1233 iv_analysis_done (void)
1234 {
1235   if (df)
1236     {
1237       clear_iv_info ();
1238       df_finish (df);
1239       df = NULL;
1240       htab_delete (bivs);
1241       bivs = NULL;
1242     }
1243 }
1244
1245 /* Computes inverse to X modulo (1 << MOD).  */
1246
1247 static unsigned HOST_WIDEST_INT
1248 inverse (unsigned HOST_WIDEST_INT x, int mod)
1249 {
1250   unsigned HOST_WIDEST_INT mask =
1251           ((unsigned HOST_WIDEST_INT) 1 << (mod - 1) << 1) - 1;
1252   unsigned HOST_WIDEST_INT rslt = 1;
1253   int i;
1254
1255   for (i = 0; i < mod - 1; i++)
1256     {
1257       rslt = (rslt * x) & mask;
1258       x = (x * x) & mask;
1259     }
1260
1261   return rslt;
1262 }
1263
1264 /* Tries to estimate the maximum number of iterations.  */
1265
1266 static unsigned HOST_WIDEST_INT
1267 determine_max_iter (struct niter_desc *desc)
1268 {
1269   rtx niter = desc->niter_expr;
1270   rtx mmin, mmax, left, right;
1271   unsigned HOST_WIDEST_INT nmax, inc;
1272
1273   if (GET_CODE (niter) == AND
1274       && GET_CODE (XEXP (niter, 0)) == CONST_INT)
1275     {
1276       nmax = INTVAL (XEXP (niter, 0));
1277       if (!(nmax & (nmax + 1)))
1278         {
1279           desc->niter_max = nmax;
1280           return nmax;
1281         }
1282     }
1283
1284   get_mode_bounds (desc->mode, desc->signed_p, desc->mode, &mmin, &mmax);
1285   nmax = INTVAL (mmax) - INTVAL (mmin);
1286
1287   if (GET_CODE (niter) == UDIV)
1288     {
1289       if (GET_CODE (XEXP (niter, 1)) != CONST_INT)
1290         {
1291           desc->niter_max = nmax;
1292           return nmax;
1293         }
1294       inc = INTVAL (XEXP (niter, 1));
1295       niter = XEXP (niter, 0);
1296     }
1297   else
1298     inc = 1;
1299
1300   if (GET_CODE (niter) == PLUS)
1301     {
1302       left = XEXP (niter, 0);
1303       right = XEXP (niter, 0);
1304
1305       if (GET_CODE (right) == CONST_INT)
1306         right = GEN_INT (-INTVAL (right));
1307     }
1308   else if (GET_CODE (niter) == MINUS)
1309     {
1310       left = XEXP (niter, 0);
1311       right = XEXP (niter, 0);
1312     }
1313   else
1314     {
1315       left = niter;
1316       right = mmin;
1317     }
1318
1319   if (GET_CODE (left) == CONST_INT)
1320     mmax = left;
1321   if (GET_CODE (right) == CONST_INT)
1322     mmin = right;
1323   nmax = INTVAL (mmax) - INTVAL (mmin);
1324
1325   desc->niter_max = nmax / inc;
1326   return nmax / inc;
1327 }
1328
1329 /* Checks whether register *REG is in set ALT.  Callback for for_each_rtx.  */
1330
1331 static int
1332 altered_reg_used (rtx *reg, void *alt)
1333 {
1334   if (!REG_P (*reg))
1335     return 0;
1336
1337   return REGNO_REG_SET_P (alt, REGNO (*reg));
1338 }
1339
1340 /* Marks registers altered by EXPR in set ALT.  */
1341
1342 static void
1343 mark_altered (rtx expr, rtx by ATTRIBUTE_UNUSED, void *alt)
1344 {
1345   if (GET_CODE (expr) == SUBREG)
1346     expr = SUBREG_REG (expr);
1347   if (!REG_P (expr))
1348     return;
1349
1350   SET_REGNO_REG_SET (alt, REGNO (expr));
1351 }
1352
1353 /* Checks whether RHS is simple enough to process.  */
1354
1355 static bool
1356 simple_rhs_p (rtx rhs)
1357 {
1358   rtx op0, op1;
1359
1360   if (CONSTANT_P (rhs)
1361       || REG_P (rhs))
1362     return true;
1363
1364   switch (GET_CODE (rhs))
1365     {
1366     case PLUS:
1367     case MINUS:
1368       op0 = XEXP (rhs, 0);
1369       op1 = XEXP (rhs, 1);
1370       /* Allow reg + const sets only.  */
1371       if (REG_P (op0) && CONSTANT_P (op1))
1372         return true;
1373       if (REG_P (op1) && CONSTANT_P (op0))
1374         return true;
1375
1376       return false;
1377
1378     default:
1379       return false;
1380     }
1381 }
1382
1383 /* Simplifies *EXPR using assignment in INSN.  ALTERED is the set of registers
1384    altered so far.  */
1385
1386 static void
1387 simplify_using_assignment (rtx insn, rtx *expr, regset altered)
1388 {
1389   rtx set = single_set (insn);
1390   rtx lhs = NULL_RTX, rhs;
1391   bool ret = false;
1392
1393   if (set)
1394     {
1395       lhs = SET_DEST (set);
1396       if (!REG_P (lhs)
1397           || altered_reg_used (&lhs, altered))
1398         ret = true;
1399     }
1400   else
1401     ret = true;
1402
1403   note_stores (PATTERN (insn), mark_altered, altered);
1404   if (CALL_P (insn))
1405     {
1406       int i;
1407       HARD_REG_SET clobbered_regs;
1408
1409       /* Kill all call clobbered registers.  */
1410       get_call_invalidated_used_regs (insn, &clobbered_regs, true);
1411       for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
1412         if (TEST_HARD_REG_BIT (clobbered_regs, i))
1413           SET_REGNO_REG_SET (altered, i);
1414     }
1415
1416   if (ret)
1417     return;
1418
1419   rhs = find_reg_equal_equiv_note (insn);
1420   if (rhs)
1421     rhs = XEXP (rhs, 0);
1422   else
1423     rhs = SET_SRC (set);
1424
1425   if (!simple_rhs_p (rhs))
1426     return;
1427
1428   if (for_each_rtx (&rhs, altered_reg_used, altered))
1429     return;
1430
1431   *expr = simplify_replace_rtx (*expr, lhs, rhs);
1432 }
1433
1434 /* Checks whether A implies B.  */
1435
1436 static bool
1437 implies_p (rtx a, rtx b)
1438 {
1439   rtx op0, op1, opb0, opb1, r;
1440   enum machine_mode mode;
1441
1442   if (GET_CODE (a) == EQ)
1443     {
1444       op0 = XEXP (a, 0);
1445       op1 = XEXP (a, 1);
1446
1447       if (REG_P (op0))
1448         {
1449           r = simplify_replace_rtx (b, op0, op1);
1450           if (r == const_true_rtx)
1451             return true;
1452         }
1453
1454       if (REG_P (op1))
1455         {
1456           r = simplify_replace_rtx (b, op1, op0);
1457           if (r == const_true_rtx)
1458             return true;
1459         }
1460     }
1461
1462   /* A < B implies A + 1 <= B.  */
1463   if ((GET_CODE (a) == GT || GET_CODE (a) == LT)
1464       && (GET_CODE (b) == GE || GET_CODE (b) == LE))
1465     {
1466       op0 = XEXP (a, 0);
1467       op1 = XEXP (a, 1);
1468       opb0 = XEXP (b, 0);
1469       opb1 = XEXP (b, 1);
1470
1471       if (GET_CODE (a) == GT)
1472         {
1473           r = op0;
1474           op0 = op1;
1475           op1 = r;
1476         }
1477
1478       if (GET_CODE (b) == GE)
1479         {
1480           r = opb0;
1481           opb0 = opb1;
1482           opb1 = r;
1483         }
1484
1485       mode = GET_MODE (op0);
1486       if (mode != GET_MODE (opb0))
1487         mode = VOIDmode;
1488       else if (mode == VOIDmode)
1489         {
1490           mode = GET_MODE (op1);
1491           if (mode != GET_MODE (opb1))
1492             mode = VOIDmode;
1493         }
1494
1495       if (SCALAR_INT_MODE_P (mode)
1496           && rtx_equal_p (op1, opb1)
1497           && simplify_gen_binary (MINUS, mode, opb0, op0) == const1_rtx)
1498         return true;
1499     }
1500
1501   return false;
1502 }
1503
1504 /* Canonicalizes COND so that
1505
1506    (1) Ensure that operands are ordered according to
1507        swap_commutative_operands_p.
1508    (2) (LE x const) will be replaced with (LT x <const+1>) and similarly
1509        for GE, GEU, and LEU.  */
1510
1511 rtx
1512 canon_condition (rtx cond)
1513 {
1514   rtx tem;
1515   rtx op0, op1;
1516   enum rtx_code code;
1517   enum machine_mode mode;
1518
1519   code = GET_CODE (cond);
1520   op0 = XEXP (cond, 0);
1521   op1 = XEXP (cond, 1);
1522
1523   if (swap_commutative_operands_p (op0, op1))
1524     {
1525       code = swap_condition (code);
1526       tem = op0;
1527       op0 = op1;
1528       op1 = tem;
1529     }
1530
1531   mode = GET_MODE (op0);
1532   if (mode == VOIDmode)
1533     mode = GET_MODE (op1);
1534   gcc_assert (mode != VOIDmode);
1535
1536   if (GET_CODE (op1) == CONST_INT
1537       && GET_MODE_CLASS (mode) != MODE_CC
1538       && GET_MODE_BITSIZE (mode) <= HOST_BITS_PER_WIDE_INT)
1539     {
1540       HOST_WIDE_INT const_val = INTVAL (op1);
1541       unsigned HOST_WIDE_INT uconst_val = const_val;
1542       unsigned HOST_WIDE_INT max_val
1543         = (unsigned HOST_WIDE_INT) GET_MODE_MASK (mode);
1544
1545       switch (code)
1546         {
1547         case LE:
1548           if ((unsigned HOST_WIDE_INT) const_val != max_val >> 1)
1549             code = LT, op1 = gen_int_mode (const_val + 1, GET_MODE (op0));
1550           break;
1551
1552         /* When cross-compiling, const_val might be sign-extended from
1553            BITS_PER_WORD to HOST_BITS_PER_WIDE_INT */
1554         case GE:
1555           if ((HOST_WIDE_INT) (const_val & max_val)
1556               != (((HOST_WIDE_INT) 1
1557                    << (GET_MODE_BITSIZE (GET_MODE (op0)) - 1))))
1558             code = GT, op1 = gen_int_mode (const_val - 1, mode);
1559           break;
1560
1561         case LEU:
1562           if (uconst_val < max_val)
1563             code = LTU, op1 = gen_int_mode (uconst_val + 1, mode);
1564           break;
1565
1566         case GEU:
1567           if (uconst_val != 0)
1568             code = GTU, op1 = gen_int_mode (uconst_val - 1, mode);
1569           break;
1570
1571         default:
1572           break;
1573         }
1574     }
1575
1576   if (op0 != XEXP (cond, 0)
1577       || op1 != XEXP (cond, 1)
1578       || code != GET_CODE (cond)
1579       || GET_MODE (cond) != SImode)
1580     cond = gen_rtx_fmt_ee (code, SImode, op0, op1);
1581
1582   return cond;
1583 }
1584
1585 /* Tries to use the fact that COND holds to simplify EXPR.  ALTERED is the
1586    set of altered regs.  */
1587
1588 void
1589 simplify_using_condition (rtx cond, rtx *expr, regset altered)
1590 {
1591   rtx rev, reve, exp = *expr;
1592
1593   if (!COMPARISON_P (exp))
1594     return;
1595
1596   /* If some register gets altered later, we do not really speak about its
1597      value at the time of comparison.  */
1598   if (altered
1599       && for_each_rtx (&cond, altered_reg_used, altered))
1600     return;
1601
1602   rev = reversed_condition (cond);
1603   reve = reversed_condition (exp);
1604
1605   cond = canon_condition (cond);
1606   exp = canon_condition (exp);
1607   if (rev)
1608     rev = canon_condition (rev);
1609   if (reve)
1610     reve = canon_condition (reve);
1611
1612   if (rtx_equal_p (exp, cond))
1613     {
1614       *expr = const_true_rtx;
1615       return;
1616     }
1617
1618
1619   if (rev && rtx_equal_p (exp, rev))
1620     {
1621       *expr = const0_rtx;
1622       return;
1623     }
1624
1625   if (implies_p (cond, exp))
1626     {
1627       *expr = const_true_rtx;
1628       return;
1629     }
1630
1631   if (reve && implies_p (cond, reve))
1632     {
1633       *expr = const0_rtx;
1634       return;
1635     }
1636
1637   /* A proof by contradiction.  If *EXPR implies (not cond), *EXPR must
1638      be false.  */
1639   if (rev && implies_p (exp, rev))
1640     {
1641       *expr = const0_rtx;
1642       return;
1643     }
1644
1645   /* Similarly, If (not *EXPR) implies (not cond), *EXPR must be true.  */
1646   if (rev && reve && implies_p (reve, rev))
1647     {
1648       *expr = const_true_rtx;
1649       return;
1650     }
1651
1652   /* We would like to have some other tests here.  TODO.  */
1653
1654   return;
1655 }
1656
1657 /* Use relationship between A and *B to eventually eliminate *B.
1658    OP is the operation we consider.  */
1659
1660 static void
1661 eliminate_implied_condition (enum rtx_code op, rtx a, rtx *b)
1662 {
1663   switch (op)
1664     {
1665     case AND:
1666       /* If A implies *B, we may replace *B by true.  */
1667       if (implies_p (a, *b))
1668         *b = const_true_rtx;
1669       break;
1670
1671     case IOR:
1672       /* If *B implies A, we may replace *B by false.  */
1673       if (implies_p (*b, a))
1674         *b = const0_rtx;
1675       break;
1676
1677     default:
1678       gcc_unreachable ();
1679     }
1680 }
1681
1682 /* Eliminates the conditions in TAIL that are implied by HEAD.  OP is the
1683    operation we consider.  */
1684
1685 static void
1686 eliminate_implied_conditions (enum rtx_code op, rtx *head, rtx tail)
1687 {
1688   rtx elt;
1689
1690   for (elt = tail; elt; elt = XEXP (elt, 1))
1691     eliminate_implied_condition (op, *head, &XEXP (elt, 0));
1692   for (elt = tail; elt; elt = XEXP (elt, 1))
1693     eliminate_implied_condition (op, XEXP (elt, 0), head);
1694 }
1695
1696 /* Simplifies *EXPR using initial values at the start of the LOOP.  If *EXPR
1697    is a list, its elements are assumed to be combined using OP.  */
1698
1699 static void
1700 simplify_using_initial_values (struct loop *loop, enum rtx_code op, rtx *expr)
1701 {
1702   rtx head, tail, insn;
1703   rtx neutral, aggr;
1704   regset altered;
1705   edge e;
1706
1707   if (!*expr)
1708     return;
1709
1710   if (CONSTANT_P (*expr))
1711     return;
1712
1713   if (GET_CODE (*expr) == EXPR_LIST)
1714     {
1715       head = XEXP (*expr, 0);
1716       tail = XEXP (*expr, 1);
1717
1718       eliminate_implied_conditions (op, &head, tail);
1719
1720       switch (op)
1721         {
1722         case AND:
1723           neutral = const_true_rtx;
1724           aggr = const0_rtx;
1725           break;
1726
1727         case IOR:
1728           neutral = const0_rtx;
1729           aggr = const_true_rtx;
1730           break;
1731
1732         default:
1733           gcc_unreachable ();
1734         }
1735
1736       simplify_using_initial_values (loop, UNKNOWN, &head);
1737       if (head == aggr)
1738         {
1739           XEXP (*expr, 0) = aggr;
1740           XEXP (*expr, 1) = NULL_RTX;
1741           return;
1742         }
1743       else if (head == neutral)
1744         {
1745           *expr = tail;
1746           simplify_using_initial_values (loop, op, expr);
1747           return;
1748         }
1749       simplify_using_initial_values (loop, op, &tail);
1750
1751       if (tail && XEXP (tail, 0) == aggr)
1752         {
1753           *expr = tail;
1754           return;
1755         }
1756
1757       XEXP (*expr, 0) = head;
1758       XEXP (*expr, 1) = tail;
1759       return;
1760     }
1761
1762   gcc_assert (op == UNKNOWN);
1763
1764   e = loop_preheader_edge (loop);
1765   if (e->src == ENTRY_BLOCK_PTR)
1766     return;
1767
1768   altered = ALLOC_REG_SET (&reg_obstack);
1769
1770   while (1)
1771     {
1772       insn = BB_END (e->src);
1773       if (any_condjump_p (insn))
1774         {
1775           rtx cond = get_condition (BB_END (e->src), NULL, false, true);
1776
1777           if (cond && (e->flags & EDGE_FALLTHRU))
1778             cond = reversed_condition (cond);
1779           if (cond)
1780             {
1781               simplify_using_condition (cond, expr, altered);
1782               if (CONSTANT_P (*expr))
1783                 {
1784                   FREE_REG_SET (altered);
1785                   return;
1786                 }
1787             }
1788         }
1789
1790       FOR_BB_INSNS_REVERSE (e->src, insn)
1791         {
1792           if (!INSN_P (insn))
1793             continue;
1794
1795           simplify_using_assignment (insn, expr, altered);
1796           if (CONSTANT_P (*expr))
1797             {
1798               FREE_REG_SET (altered);
1799               return;
1800             }
1801         }
1802
1803       if (!single_pred_p (e->src)
1804           || single_pred (e->src) == ENTRY_BLOCK_PTR)
1805         break;
1806       e = single_pred_edge (e->src);
1807     }
1808
1809   FREE_REG_SET (altered);
1810 }
1811
1812 /* Transforms invariant IV into MODE.  Adds assumptions based on the fact
1813    that IV occurs as left operands of comparison COND and its signedness
1814    is SIGNED_P to DESC.  */
1815
1816 static void
1817 shorten_into_mode (struct rtx_iv *iv, enum machine_mode mode,
1818                    enum rtx_code cond, bool signed_p, struct niter_desc *desc)
1819 {
1820   rtx mmin, mmax, cond_over, cond_under;
1821
1822   get_mode_bounds (mode, signed_p, iv->extend_mode, &mmin, &mmax);
1823   cond_under = simplify_gen_relational (LT, SImode, iv->extend_mode,
1824                                         iv->base, mmin);
1825   cond_over = simplify_gen_relational (GT, SImode, iv->extend_mode,
1826                                        iv->base, mmax);
1827
1828   switch (cond)
1829     {
1830       case LE:
1831       case LT:
1832       case LEU:
1833       case LTU:
1834         if (cond_under != const0_rtx)
1835           desc->infinite =
1836                   alloc_EXPR_LIST (0, cond_under, desc->infinite);
1837         if (cond_over != const0_rtx)
1838           desc->noloop_assumptions =
1839                   alloc_EXPR_LIST (0, cond_over, desc->noloop_assumptions);
1840         break;
1841
1842       case GE:
1843       case GT:
1844       case GEU:
1845       case GTU:
1846         if (cond_over != const0_rtx)
1847           desc->infinite =
1848                   alloc_EXPR_LIST (0, cond_over, desc->infinite);
1849         if (cond_under != const0_rtx)
1850           desc->noloop_assumptions =
1851                   alloc_EXPR_LIST (0, cond_under, desc->noloop_assumptions);
1852         break;
1853
1854       case NE:
1855         if (cond_over != const0_rtx)
1856           desc->infinite =
1857                   alloc_EXPR_LIST (0, cond_over, desc->infinite);
1858         if (cond_under != const0_rtx)
1859           desc->infinite =
1860                   alloc_EXPR_LIST (0, cond_under, desc->infinite);
1861         break;
1862
1863       default:
1864         gcc_unreachable ();
1865     }
1866
1867   iv->mode = mode;
1868   iv->extend = signed_p ? SIGN_EXTEND : ZERO_EXTEND;
1869 }
1870
1871 /* Transforms IV0 and IV1 compared by COND so that they are both compared as
1872    subregs of the same mode if possible (sometimes it is necessary to add
1873    some assumptions to DESC).  */
1874
1875 static bool
1876 canonicalize_iv_subregs (struct rtx_iv *iv0, struct rtx_iv *iv1,
1877                          enum rtx_code cond, struct niter_desc *desc)
1878 {
1879   enum machine_mode comp_mode;
1880   bool signed_p;
1881
1882   /* If the ivs behave specially in the first iteration, or are
1883      added/multiplied after extending, we ignore them.  */
1884   if (iv0->first_special || iv0->mult != const1_rtx || iv0->delta != const0_rtx)
1885     return false;
1886   if (iv1->first_special || iv1->mult != const1_rtx || iv1->delta != const0_rtx)
1887     return false;
1888
1889   /* If there is some extend, it must match signedness of the comparison.  */
1890   switch (cond)
1891     {
1892       case LE:
1893       case LT:
1894         if (iv0->extend == ZERO_EXTEND
1895             || iv1->extend == ZERO_EXTEND)
1896           return false;
1897         signed_p = true;
1898         break;
1899
1900       case LEU:
1901       case LTU:
1902         if (iv0->extend == SIGN_EXTEND
1903             || iv1->extend == SIGN_EXTEND)
1904           return false;
1905         signed_p = false;
1906         break;
1907
1908       case NE:
1909         if (iv0->extend != UNKNOWN
1910             && iv1->extend != UNKNOWN
1911             && iv0->extend != iv1->extend)
1912           return false;
1913
1914         signed_p = false;
1915         if (iv0->extend != UNKNOWN)
1916           signed_p = iv0->extend == SIGN_EXTEND;
1917         if (iv1->extend != UNKNOWN)
1918           signed_p = iv1->extend == SIGN_EXTEND;
1919         break;
1920
1921       default:
1922         gcc_unreachable ();
1923     }
1924
1925   /* Values of both variables should be computed in the same mode.  These
1926      might indeed be different, if we have comparison like
1927
1928      (compare (subreg:SI (iv0)) (subreg:SI (iv1)))
1929
1930      and iv0 and iv1 are both ivs iterating in SI mode, but calculated
1931      in different modes.  This does not seem impossible to handle, but
1932      it hardly ever occurs in practice.
1933
1934      The only exception is the case when one of operands is invariant.
1935      For example pentium 3 generates comparisons like
1936      (lt (subreg:HI (reg:SI)) 100).  Here we assign HImode to 100, but we
1937      definitely do not want this prevent the optimization.  */
1938   comp_mode = iv0->extend_mode;
1939   if (GET_MODE_BITSIZE (comp_mode) < GET_MODE_BITSIZE (iv1->extend_mode))
1940     comp_mode = iv1->extend_mode;
1941
1942   if (iv0->extend_mode != comp_mode)
1943     {
1944       if (iv0->mode != iv0->extend_mode
1945           || iv0->step != const0_rtx)
1946         return false;
1947
1948       iv0->base = simplify_gen_unary (signed_p ? SIGN_EXTEND : ZERO_EXTEND,
1949                                       comp_mode, iv0->base, iv0->mode);
1950       iv0->extend_mode = comp_mode;
1951     }
1952
1953   if (iv1->extend_mode != comp_mode)
1954     {
1955       if (iv1->mode != iv1->extend_mode
1956           || iv1->step != const0_rtx)
1957         return false;
1958
1959       iv1->base = simplify_gen_unary (signed_p ? SIGN_EXTEND : ZERO_EXTEND,
1960                                       comp_mode, iv1->base, iv1->mode);
1961       iv1->extend_mode = comp_mode;
1962     }
1963
1964   /* Check that both ivs belong to a range of a single mode.  If one of the
1965      operands is an invariant, we may need to shorten it into the common
1966      mode.  */
1967   if (iv0->mode == iv0->extend_mode
1968       && iv0->step == const0_rtx
1969       && iv0->mode != iv1->mode)
1970     shorten_into_mode (iv0, iv1->mode, cond, signed_p, desc);
1971
1972   if (iv1->mode == iv1->extend_mode
1973       && iv1->step == const0_rtx
1974       && iv0->mode != iv1->mode)
1975     shorten_into_mode (iv1, iv0->mode, swap_condition (cond), signed_p, desc);
1976
1977   if (iv0->mode != iv1->mode)
1978     return false;
1979
1980   desc->mode = iv0->mode;
1981   desc->signed_p = signed_p;
1982
1983   return true;
1984 }
1985
1986 /* Computes number of iterations of the CONDITION in INSN in LOOP and stores
1987    the result into DESC.  Very similar to determine_number_of_iterations
1988    (basically its rtl version), complicated by things like subregs.  */
1989
1990 static void
1991 iv_number_of_iterations (struct loop *loop, rtx insn, rtx condition,
1992                          struct niter_desc *desc)
1993 {
1994   rtx op0, op1, delta, step, bound, may_xform, tmp, tmp0, tmp1;
1995   struct rtx_iv iv0, iv1, tmp_iv;
1996   rtx assumption, may_not_xform;
1997   enum rtx_code cond;
1998   enum machine_mode mode, comp_mode;
1999   rtx mmin, mmax, mode_mmin, mode_mmax;
2000   unsigned HOST_WIDEST_INT s, size, d, inv;
2001   HOST_WIDEST_INT up, down, inc, step_val;
2002   int was_sharp = false;
2003   rtx old_niter;
2004   bool step_is_pow2;
2005
2006   /* The meaning of these assumptions is this:
2007      if !assumptions
2008        then the rest of information does not have to be valid
2009      if noloop_assumptions then the loop does not roll
2010      if infinite then this exit is never used */
2011
2012   desc->assumptions = NULL_RTX;
2013   desc->noloop_assumptions = NULL_RTX;
2014   desc->infinite = NULL_RTX;
2015   desc->simple_p = true;
2016
2017   desc->const_iter = false;
2018   desc->niter_expr = NULL_RTX;
2019   desc->niter_max = 0;
2020
2021   cond = GET_CODE (condition);
2022   gcc_assert (COMPARISON_P (condition));
2023
2024   mode = GET_MODE (XEXP (condition, 0));
2025   if (mode == VOIDmode)
2026     mode = GET_MODE (XEXP (condition, 1));
2027   /* The constant comparisons should be folded.  */
2028   gcc_assert (mode != VOIDmode);
2029
2030   /* We only handle integers or pointers.  */
2031   if (GET_MODE_CLASS (mode) != MODE_INT
2032       && GET_MODE_CLASS (mode) != MODE_PARTIAL_INT)
2033     goto fail;
2034
2035   op0 = XEXP (condition, 0);
2036   if (!iv_analyze (insn, op0, &iv0))
2037     goto fail;
2038   if (iv0.extend_mode == VOIDmode)
2039     iv0.mode = iv0.extend_mode = mode;
2040
2041   op1 = XEXP (condition, 1);
2042   if (!iv_analyze (insn, op1, &iv1))
2043     goto fail;
2044   if (iv1.extend_mode == VOIDmode)
2045     iv1.mode = iv1.extend_mode = mode;
2046
2047   if (GET_MODE_BITSIZE (iv0.extend_mode) > HOST_BITS_PER_WIDE_INT
2048       || GET_MODE_BITSIZE (iv1.extend_mode) > HOST_BITS_PER_WIDE_INT)
2049     goto fail;
2050
2051   /* Check condition and normalize it.  */
2052
2053   switch (cond)
2054     {
2055       case GE:
2056       case GT:
2057       case GEU:
2058       case GTU:
2059         tmp_iv = iv0; iv0 = iv1; iv1 = tmp_iv;
2060         cond = swap_condition (cond);
2061         break;
2062       case NE:
2063       case LE:
2064       case LEU:
2065       case LT:
2066       case LTU:
2067         break;
2068       default:
2069         goto fail;
2070     }
2071
2072   /* Handle extends.  This is relatively nontrivial, so we only try in some
2073      easy cases, when we can canonicalize the ivs (possibly by adding some
2074      assumptions) to shape subreg (base + i * step).  This function also fills
2075      in desc->mode and desc->signed_p.  */
2076
2077   if (!canonicalize_iv_subregs (&iv0, &iv1, cond, desc))
2078     goto fail;
2079
2080   comp_mode = iv0.extend_mode;
2081   mode = iv0.mode;
2082   size = GET_MODE_BITSIZE (mode);
2083   get_mode_bounds (mode, (cond == LE || cond == LT), comp_mode, &mmin, &mmax);
2084   mode_mmin = lowpart_subreg (mode, mmin, comp_mode);
2085   mode_mmax = lowpart_subreg (mode, mmax, comp_mode);
2086
2087   if (GET_CODE (iv0.step) != CONST_INT || GET_CODE (iv1.step) != CONST_INT)
2088     goto fail;
2089
2090   /* We can take care of the case of two induction variables chasing each other
2091      if the test is NE. I have never seen a loop using it, but still it is
2092      cool.  */
2093   if (iv0.step != const0_rtx && iv1.step != const0_rtx)
2094     {
2095       if (cond != NE)
2096         goto fail;
2097
2098       iv0.step = simplify_gen_binary (MINUS, comp_mode, iv0.step, iv1.step);
2099       iv1.step = const0_rtx;
2100     }
2101
2102   /* This is either infinite loop or the one that ends immediately, depending
2103      on initial values.  Unswitching should remove this kind of conditions.  */
2104   if (iv0.step == const0_rtx && iv1.step == const0_rtx)
2105     goto fail;
2106
2107   if (cond != NE)
2108     {
2109       if (iv0.step == const0_rtx)
2110         step_val = -INTVAL (iv1.step);
2111       else
2112         step_val = INTVAL (iv0.step);
2113
2114       /* Ignore loops of while (i-- < 10) type.  */
2115       if (step_val < 0)
2116         goto fail;
2117
2118       step_is_pow2 = !(step_val & (step_val - 1));
2119     }
2120   else
2121     {
2122       /* We do not care about whether the step is power of two in this
2123          case.  */
2124       step_is_pow2 = false;
2125       step_val = 0;
2126     }
2127
2128   /* Some more condition normalization.  We must record some assumptions
2129      due to overflows.  */
2130   switch (cond)
2131     {
2132       case LT:
2133       case LTU:
2134         /* We want to take care only of non-sharp relationals; this is easy,
2135            as in cases the overflow would make the transformation unsafe
2136            the loop does not roll.  Seemingly it would make more sense to want
2137            to take care of sharp relationals instead, as NE is more similar to
2138            them, but the problem is that here the transformation would be more
2139            difficult due to possibly infinite loops.  */
2140         if (iv0.step == const0_rtx)
2141           {
2142             tmp = lowpart_subreg (mode, iv0.base, comp_mode);
2143             assumption = simplify_gen_relational (EQ, SImode, mode, tmp,
2144                                                   mode_mmax);
2145             if (assumption == const_true_rtx)
2146               goto zero_iter_simplify;
2147             iv0.base = simplify_gen_binary (PLUS, comp_mode,
2148                                             iv0.base, const1_rtx);
2149           }
2150         else
2151           {
2152             tmp = lowpart_subreg (mode, iv1.base, comp_mode);
2153             assumption = simplify_gen_relational (EQ, SImode, mode, tmp,
2154                                                   mode_mmin);
2155             if (assumption == const_true_rtx)
2156               goto zero_iter_simplify;
2157             iv1.base = simplify_gen_binary (PLUS, comp_mode,
2158                                             iv1.base, constm1_rtx);
2159           }
2160
2161         if (assumption != const0_rtx)
2162           desc->noloop_assumptions =
2163                   alloc_EXPR_LIST (0, assumption, desc->noloop_assumptions);
2164         cond = (cond == LT) ? LE : LEU;
2165
2166         /* It will be useful to be able to tell the difference once more in
2167            LE -> NE reduction.  */
2168         was_sharp = true;
2169         break;
2170       default: ;
2171     }
2172
2173   /* Take care of trivially infinite loops.  */
2174   if (cond != NE)
2175     {
2176       if (iv0.step == const0_rtx)
2177         {
2178           tmp = lowpart_subreg (mode, iv0.base, comp_mode);
2179           if (rtx_equal_p (tmp, mode_mmin))
2180             {
2181               desc->infinite =
2182                       alloc_EXPR_LIST (0, const_true_rtx, NULL_RTX);
2183               /* Fill in the remaining fields somehow.  */
2184               goto zero_iter_simplify;
2185             }
2186         }
2187       else
2188         {
2189           tmp = lowpart_subreg (mode, iv1.base, comp_mode);
2190           if (rtx_equal_p (tmp, mode_mmax))
2191             {
2192               desc->infinite =
2193                       alloc_EXPR_LIST (0, const_true_rtx, NULL_RTX);
2194               /* Fill in the remaining fields somehow.  */
2195               goto zero_iter_simplify;
2196             }
2197         }
2198     }
2199
2200   /* If we can we want to take care of NE conditions instead of size
2201      comparisons, as they are much more friendly (most importantly
2202      this takes care of special handling of loops with step 1).  We can
2203      do it if we first check that upper bound is greater or equal to
2204      lower bound, their difference is constant c modulo step and that
2205      there is not an overflow.  */
2206   if (cond != NE)
2207     {
2208       if (iv0.step == const0_rtx)
2209         step = simplify_gen_unary (NEG, comp_mode, iv1.step, comp_mode);
2210       else
2211         step = iv0.step;
2212       delta = simplify_gen_binary (MINUS, comp_mode, iv1.base, iv0.base);
2213       delta = lowpart_subreg (mode, delta, comp_mode);
2214       delta = simplify_gen_binary (UMOD, mode, delta, step);
2215       may_xform = const0_rtx;
2216       may_not_xform = const_true_rtx;
2217
2218       if (GET_CODE (delta) == CONST_INT)
2219         {
2220           if (was_sharp && INTVAL (delta) == INTVAL (step) - 1)
2221             {
2222               /* A special case.  We have transformed condition of type
2223                  for (i = 0; i < 4; i += 4)
2224                  into
2225                  for (i = 0; i <= 3; i += 4)
2226                  obviously if the test for overflow during that transformation
2227                  passed, we cannot overflow here.  Most importantly any
2228                  loop with sharp end condition and step 1 falls into this
2229                  category, so handling this case specially is definitely
2230                  worth the troubles.  */
2231               may_xform = const_true_rtx;
2232             }
2233           else if (iv0.step == const0_rtx)
2234             {
2235               bound = simplify_gen_binary (PLUS, comp_mode, mmin, step);
2236               bound = simplify_gen_binary (MINUS, comp_mode, bound, delta);
2237               bound = lowpart_subreg (mode, bound, comp_mode);
2238               tmp = lowpart_subreg (mode, iv0.base, comp_mode);
2239               may_xform = simplify_gen_relational (cond, SImode, mode,
2240                                                    bound, tmp);
2241               may_not_xform = simplify_gen_relational (reverse_condition (cond),
2242                                                        SImode, mode,
2243                                                        bound, tmp);
2244             }
2245           else
2246             {
2247               bound = simplify_gen_binary (MINUS, comp_mode, mmax, step);
2248               bound = simplify_gen_binary (PLUS, comp_mode, bound, delta);
2249               bound = lowpart_subreg (mode, bound, comp_mode);
2250               tmp = lowpart_subreg (mode, iv1.base, comp_mode);
2251               may_xform = simplify_gen_relational (cond, SImode, mode,
2252                                                    tmp, bound);
2253               may_not_xform = simplify_gen_relational (reverse_condition (cond),
2254                                                        SImode, mode,
2255                                                        tmp, bound);
2256             }
2257         }
2258
2259       if (may_xform != const0_rtx)
2260         {
2261           /* We perform the transformation always provided that it is not
2262              completely senseless.  This is OK, as we would need this assumption
2263              to determine the number of iterations anyway.  */
2264           if (may_xform != const_true_rtx)
2265             {
2266               /* If the step is a power of two and the final value we have
2267                  computed overflows, the cycle is infinite.  Otherwise it
2268                  is nontrivial to compute the number of iterations.  */
2269               if (step_is_pow2)
2270                 desc->infinite = alloc_EXPR_LIST (0, may_not_xform,
2271                                                   desc->infinite);
2272               else
2273                 desc->assumptions = alloc_EXPR_LIST (0, may_xform,
2274                                                      desc->assumptions);
2275             }
2276
2277           /* We are going to lose some information about upper bound on
2278              number of iterations in this step, so record the information
2279              here.  */
2280           inc = INTVAL (iv0.step) - INTVAL (iv1.step);
2281           if (GET_CODE (iv1.base) == CONST_INT)
2282             up = INTVAL (iv1.base);
2283           else
2284             up = INTVAL (mode_mmax) - inc;
2285           down = INTVAL (GET_CODE (iv0.base) == CONST_INT
2286                          ? iv0.base
2287                          : mode_mmin);
2288           desc->niter_max = (up - down) / inc + 1;
2289
2290           if (iv0.step == const0_rtx)
2291             {
2292               iv0.base = simplify_gen_binary (PLUS, comp_mode, iv0.base, delta);
2293               iv0.base = simplify_gen_binary (MINUS, comp_mode, iv0.base, step);
2294             }
2295           else
2296             {
2297               iv1.base = simplify_gen_binary (MINUS, comp_mode, iv1.base, delta);
2298               iv1.base = simplify_gen_binary (PLUS, comp_mode, iv1.base, step);
2299             }
2300
2301           tmp0 = lowpart_subreg (mode, iv0.base, comp_mode);
2302           tmp1 = lowpart_subreg (mode, iv1.base, comp_mode);
2303           assumption = simplify_gen_relational (reverse_condition (cond),
2304                                                 SImode, mode, tmp0, tmp1);
2305           if (assumption == const_true_rtx)
2306             goto zero_iter_simplify;
2307           else if (assumption != const0_rtx)
2308             desc->noloop_assumptions =
2309                     alloc_EXPR_LIST (0, assumption, desc->noloop_assumptions);
2310           cond = NE;
2311         }
2312     }
2313
2314   /* Count the number of iterations.  */
2315   if (cond == NE)
2316     {
2317       /* Everything we do here is just arithmetics modulo size of mode.  This
2318          makes us able to do more involved computations of number of iterations
2319          than in other cases.  First transform the condition into shape
2320          s * i <> c, with s positive.  */
2321       iv1.base = simplify_gen_binary (MINUS, comp_mode, iv1.base, iv0.base);
2322       iv0.base = const0_rtx;
2323       iv0.step = simplify_gen_binary (MINUS, comp_mode, iv0.step, iv1.step);
2324       iv1.step = const0_rtx;
2325       if (INTVAL (iv0.step) < 0)
2326         {
2327           iv0.step = simplify_gen_unary (NEG, comp_mode, iv0.step, mode);
2328           iv1.base = simplify_gen_unary (NEG, comp_mode, iv1.base, mode);
2329         }
2330       iv0.step = lowpart_subreg (mode, iv0.step, comp_mode);
2331
2332       /* Let nsd (s, size of mode) = d.  If d does not divide c, the loop
2333          is infinite.  Otherwise, the number of iterations is
2334          (inverse(s/d) * (c/d)) mod (size of mode/d).  */
2335       s = INTVAL (iv0.step); d = 1;
2336       while (s % 2 != 1)
2337         {
2338           s /= 2;
2339           d *= 2;
2340           size--;
2341         }
2342       bound = GEN_INT (((unsigned HOST_WIDEST_INT) 1 << (size - 1 ) << 1) - 1);
2343
2344       tmp1 = lowpart_subreg (mode, iv1.base, comp_mode);
2345       tmp = simplify_gen_binary (UMOD, mode, tmp1, GEN_INT (d));
2346       assumption = simplify_gen_relational (NE, SImode, mode, tmp, const0_rtx);
2347       desc->infinite = alloc_EXPR_LIST (0, assumption, desc->infinite);
2348
2349       tmp = simplify_gen_binary (UDIV, mode, tmp1, GEN_INT (d));
2350       inv = inverse (s, size);
2351       tmp = simplify_gen_binary (MULT, mode, tmp, gen_int_mode (inv, mode));
2352       desc->niter_expr = simplify_gen_binary (AND, mode, tmp, bound);
2353     }
2354   else
2355     {
2356       if (iv1.step == const0_rtx)
2357         /* Condition in shape a + s * i <= b
2358            We must know that b + s does not overflow and a <= b + s and then we
2359            can compute number of iterations as (b + s - a) / s.  (It might
2360            seem that we in fact could be more clever about testing the b + s
2361            overflow condition using some information about b - a mod s,
2362            but it was already taken into account during LE -> NE transform).  */
2363         {
2364           step = iv0.step;
2365           tmp0 = lowpart_subreg (mode, iv0.base, comp_mode);
2366           tmp1 = lowpart_subreg (mode, iv1.base, comp_mode);
2367
2368           bound = simplify_gen_binary (MINUS, mode, mode_mmax,
2369                                        lowpart_subreg (mode, step,
2370                                                        comp_mode));
2371           if (step_is_pow2)
2372             {
2373               rtx t0, t1;
2374
2375               /* If s is power of 2, we know that the loop is infinite if
2376                  a % s <= b % s and b + s overflows.  */
2377               assumption = simplify_gen_relational (reverse_condition (cond),
2378                                                     SImode, mode,
2379                                                     tmp1, bound);
2380
2381               t0 = simplify_gen_binary (UMOD, mode, copy_rtx (tmp0), step);
2382               t1 = simplify_gen_binary (UMOD, mode, copy_rtx (tmp1), step);
2383               tmp = simplify_gen_relational (cond, SImode, mode, t0, t1);
2384               assumption = simplify_gen_binary (AND, SImode, assumption, tmp);
2385               desc->infinite =
2386                       alloc_EXPR_LIST (0, assumption, desc->infinite);
2387             }
2388           else
2389             {
2390               assumption = simplify_gen_relational (cond, SImode, mode,
2391                                                     tmp1, bound);
2392               desc->assumptions =
2393                       alloc_EXPR_LIST (0, assumption, desc->assumptions);
2394             }
2395
2396           tmp = simplify_gen_binary (PLUS, comp_mode, iv1.base, iv0.step);
2397           tmp = lowpart_subreg (mode, tmp, comp_mode);
2398           assumption = simplify_gen_relational (reverse_condition (cond),
2399                                                 SImode, mode, tmp0, tmp);
2400
2401           delta = simplify_gen_binary (PLUS, mode, tmp1, step);
2402           delta = simplify_gen_binary (MINUS, mode, delta, tmp0);
2403         }
2404       else
2405         {
2406           /* Condition in shape a <= b - s * i
2407              We must know that a - s does not overflow and a - s <= b and then
2408              we can again compute number of iterations as (b - (a - s)) / s.  */
2409           step = simplify_gen_unary (NEG, mode, iv1.step, mode);
2410           tmp0 = lowpart_subreg (mode, iv0.base, comp_mode);
2411           tmp1 = lowpart_subreg (mode, iv1.base, comp_mode);
2412
2413           bound = simplify_gen_binary (PLUS, mode, mode_mmin,
2414                                        lowpart_subreg (mode, step, comp_mode));
2415           if (step_is_pow2)
2416             {
2417               rtx t0, t1;
2418
2419               /* If s is power of 2, we know that the loop is infinite if
2420                  a % s <= b % s and a - s overflows.  */
2421               assumption = simplify_gen_relational (reverse_condition (cond),
2422                                                     SImode, mode,
2423                                                     bound, tmp0);
2424
2425               t0 = simplify_gen_binary (UMOD, mode, copy_rtx (tmp0), step);
2426               t1 = simplify_gen_binary (UMOD, mode, copy_rtx (tmp1), step);
2427               tmp = simplify_gen_relational (cond, SImode, mode, t0, t1);
2428               assumption = simplify_gen_binary (AND, SImode, assumption, tmp);
2429               desc->infinite =
2430                       alloc_EXPR_LIST (0, assumption, desc->infinite);
2431             }
2432           else
2433             {
2434               assumption = simplify_gen_relational (cond, SImode, mode,
2435                                                     bound, tmp0);
2436               desc->assumptions =
2437                       alloc_EXPR_LIST (0, assumption, desc->assumptions);
2438             }
2439
2440           tmp = simplify_gen_binary (PLUS, comp_mode, iv0.base, iv1.step);
2441           tmp = lowpart_subreg (mode, tmp, comp_mode);
2442           assumption = simplify_gen_relational (reverse_condition (cond),
2443                                                 SImode, mode,
2444                                                 tmp, tmp1);
2445           delta = simplify_gen_binary (MINUS, mode, tmp0, step);
2446           delta = simplify_gen_binary (MINUS, mode, tmp1, delta);
2447         }
2448       if (assumption == const_true_rtx)
2449         goto zero_iter_simplify;
2450       else if (assumption != const0_rtx)
2451         desc->noloop_assumptions =
2452                 alloc_EXPR_LIST (0, assumption, desc->noloop_assumptions);
2453       delta = simplify_gen_binary (UDIV, mode, delta, step);
2454       desc->niter_expr = delta;
2455     }
2456
2457   old_niter = desc->niter_expr;
2458
2459   simplify_using_initial_values (loop, AND, &desc->assumptions);
2460   if (desc->assumptions
2461       && XEXP (desc->assumptions, 0) == const0_rtx)
2462     goto fail;
2463   simplify_using_initial_values (loop, IOR, &desc->noloop_assumptions);
2464   simplify_using_initial_values (loop, IOR, &desc->infinite);
2465   simplify_using_initial_values (loop, UNKNOWN, &desc->niter_expr);
2466
2467   /* Rerun the simplification.  Consider code (created by copying loop headers)
2468
2469      i = 0;
2470
2471      if (0 < n)
2472        {
2473          do
2474            {
2475              i++;
2476            } while (i < n);
2477        }
2478
2479     The first pass determines that i = 0, the second pass uses it to eliminate
2480     noloop assumption.  */
2481
2482   simplify_using_initial_values (loop, AND, &desc->assumptions);
2483   if (desc->assumptions
2484       && XEXP (desc->assumptions, 0) == const0_rtx)
2485     goto fail;
2486   simplify_using_initial_values (loop, IOR, &desc->noloop_assumptions);
2487   simplify_using_initial_values (loop, IOR, &desc->infinite);
2488   simplify_using_initial_values (loop, UNKNOWN, &desc->niter_expr);
2489
2490   if (desc->noloop_assumptions
2491       && XEXP (desc->noloop_assumptions, 0) == const_true_rtx)
2492     goto zero_iter;
2493
2494   if (GET_CODE (desc->niter_expr) == CONST_INT)
2495     {
2496       unsigned HOST_WIDEST_INT val = INTVAL (desc->niter_expr);
2497
2498       desc->const_iter = true;
2499       desc->niter_max = desc->niter = val & GET_MODE_MASK (desc->mode);
2500     }
2501   else
2502     {
2503       if (!desc->niter_max)
2504         desc->niter_max = determine_max_iter (desc);
2505
2506       /* simplify_using_initial_values does a copy propagation on the registers
2507          in the expression for the number of iterations.  This prolongs life
2508          ranges of registers and increases register pressure, and usually
2509          brings no gain (and if it happens to do, the cse pass will take care
2510          of it anyway).  So prevent this behavior, unless it enabled us to
2511          derive that the number of iterations is a constant.  */
2512       desc->niter_expr = old_niter;
2513     }
2514
2515   return;
2516
2517 zero_iter_simplify:
2518   /* Simplify the assumptions.  */
2519   simplify_using_initial_values (loop, AND, &desc->assumptions);
2520   if (desc->assumptions
2521       && XEXP (desc->assumptions, 0) == const0_rtx)
2522     goto fail;
2523   simplify_using_initial_values (loop, IOR, &desc->infinite);
2524
2525   /* Fallthru.  */
2526 zero_iter:
2527   desc->const_iter = true;
2528   desc->niter = 0;
2529   desc->niter_max = 0;
2530   desc->noloop_assumptions = NULL_RTX;
2531   desc->niter_expr = const0_rtx;
2532   return;
2533
2534 fail:
2535   desc->simple_p = false;
2536   return;
2537 }
2538
2539 /* Checks whether E is a simple exit from LOOP and stores its description
2540    into DESC.  */
2541
2542 static void
2543 check_simple_exit (struct loop *loop, edge e, struct niter_desc *desc)
2544 {
2545   basic_block exit_bb;
2546   rtx condition, at;
2547   edge ein;
2548
2549   exit_bb = e->src;
2550   desc->simple_p = false;
2551
2552   /* It must belong directly to the loop.  */
2553   if (exit_bb->loop_father != loop)
2554     return;
2555
2556   /* It must be tested (at least) once during any iteration.  */
2557   if (!dominated_by_p (CDI_DOMINATORS, loop->latch, exit_bb))
2558     return;
2559
2560   /* It must end in a simple conditional jump.  */
2561   if (!any_condjump_p (BB_END (exit_bb)))
2562     return;
2563
2564   ein = EDGE_SUCC (exit_bb, 0);
2565   if (ein == e)
2566     ein = EDGE_SUCC (exit_bb, 1);
2567
2568   desc->out_edge = e;
2569   desc->in_edge = ein;
2570
2571   /* Test whether the condition is suitable.  */
2572   if (!(condition = get_condition (BB_END (ein->src), &at, false, false)))
2573     return;
2574
2575   if (ein->flags & EDGE_FALLTHRU)
2576     {
2577       condition = reversed_condition (condition);
2578       if (!condition)
2579         return;
2580     }
2581
2582   /* Check that we are able to determine number of iterations and fill
2583      in information about it.  */
2584   iv_number_of_iterations (loop, at, condition, desc);
2585 }
2586
2587 /* Finds a simple exit of LOOP and stores its description into DESC.  */
2588
2589 void
2590 find_simple_exit (struct loop *loop, struct niter_desc *desc)
2591 {
2592   unsigned i;
2593   basic_block *body;
2594   edge e;
2595   struct niter_desc act;
2596   bool any = false;
2597   edge_iterator ei;
2598
2599   desc->simple_p = false;
2600   body = get_loop_body (loop);
2601
2602   for (i = 0; i < loop->num_nodes; i++)
2603     {
2604       FOR_EACH_EDGE (e, ei, body[i]->succs)
2605         {
2606           if (flow_bb_inside_loop_p (loop, e->dest))
2607             continue;
2608
2609           check_simple_exit (loop, e, &act);
2610           if (!act.simple_p)
2611             continue;
2612
2613           if (!any)
2614             any = true;
2615           else
2616             {
2617               /* Prefer constant iterations; the less the better.  */
2618               if (!act.const_iter
2619                   || (desc->const_iter && act.niter >= desc->niter))
2620                 continue;
2621
2622               /* Also if the actual exit may be infinite, while the old one
2623                  not, prefer the old one.  */
2624               if (act.infinite && !desc->infinite)
2625                 continue;
2626             }
2627
2628           *desc = act;
2629         }
2630     }
2631
2632   if (dump_file)
2633     {
2634       if (desc->simple_p)
2635         {
2636           fprintf (dump_file, "Loop %d is simple:\n", loop->num);
2637           fprintf (dump_file, "  simple exit %d -> %d\n",
2638                    desc->out_edge->src->index,
2639                    desc->out_edge->dest->index);
2640           if (desc->assumptions)
2641             {
2642               fprintf (dump_file, "  assumptions: ");
2643               print_rtl (dump_file, desc->assumptions);
2644               fprintf (dump_file, "\n");
2645             }
2646           if (desc->noloop_assumptions)
2647             {
2648               fprintf (dump_file, "  does not roll if: ");
2649               print_rtl (dump_file, desc->noloop_assumptions);
2650               fprintf (dump_file, "\n");
2651             }
2652           if (desc->infinite)
2653             {
2654               fprintf (dump_file, "  infinite if: ");
2655               print_rtl (dump_file, desc->infinite);
2656               fprintf (dump_file, "\n");
2657             }
2658
2659           fprintf (dump_file, "  number of iterations: ");
2660           print_rtl (dump_file, desc->niter_expr);
2661           fprintf (dump_file, "\n");
2662
2663           fprintf (dump_file, "  upper bound: ");
2664           fprintf (dump_file, HOST_WIDEST_INT_PRINT_DEC, desc->niter_max);
2665           fprintf (dump_file, "\n");
2666         }
2667       else
2668         fprintf (dump_file, "Loop %d is not simple.\n", loop->num);
2669     }
2670
2671   free (body);
2672 }
2673
2674 /* Creates a simple loop description of LOOP if it was not computed
2675    already.  */
2676
2677 struct niter_desc *
2678 get_simple_loop_desc (struct loop *loop)
2679 {
2680   struct niter_desc *desc = simple_loop_desc (loop);
2681
2682   if (desc)
2683     return desc;
2684
2685   desc = XNEW (struct niter_desc);
2686   iv_analysis_loop_init (loop);
2687   find_simple_exit (loop, desc);
2688   loop->aux = desc;
2689
2690   if (desc->simple_p && (desc->assumptions || desc->infinite))
2691     {
2692       const char *wording;
2693
2694       /* Assume that no overflow happens and that the loop is finite.
2695          We already warned at the tree level if we ran optimizations there.  */
2696       if (!flag_tree_loop_optimize && warn_unsafe_loop_optimizations)
2697         {
2698           if (desc->infinite)
2699             {
2700               wording =
2701                 flag_unsafe_loop_optimizations
2702                 ? N_("assuming that the loop is not infinite")
2703                 : N_("cannot optimize possibly infinite loops");
2704               warning (OPT_Wunsafe_loop_optimizations, "%s",
2705                        gettext (wording));
2706             }
2707           if (desc->assumptions)
2708             {
2709               wording =
2710                 flag_unsafe_loop_optimizations
2711                 ? N_("assuming that the loop counter does not overflow")
2712                 : N_("cannot optimize loop, the loop counter may overflow");
2713               warning (OPT_Wunsafe_loop_optimizations, "%s",
2714                        gettext (wording));
2715             }
2716         }
2717
2718       if (flag_unsafe_loop_optimizations)
2719         {
2720           desc->assumptions = NULL_RTX;
2721           desc->infinite = NULL_RTX;
2722         }
2723     }
2724
2725   return desc;
2726 }
2727
2728 /* Releases simple loop description for LOOP.  */
2729
2730 void
2731 free_simple_loop_desc (struct loop *loop)
2732 {
2733   struct niter_desc *desc = simple_loop_desc (loop);
2734
2735   if (!desc)
2736     return;
2737
2738   free (desc);
2739   loop->aux = NULL;
2740 }