gcc/tree-ssa-loop-ivopts.c

   1 /* Induction variable optimizations.
   2    Copyright (C) 2003, 2004, 2005 Free Software Foundation, Inc.
   3
   4 This file is part of GCC.
   5
   6 GCC is free software; you can redistribute it and/or modify it
   7 under the terms of the GNU General Public License as published by the
   8 Free Software Foundation; either version 2, or (at your option) any
   9 later version.
  10
  11 GCC is distributed in the hope that it will be useful, but WITHOUT
  12 ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  13 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  14 for more details.
  15
  16 You should have received a copy of the GNU General Public License
  17 along with GCC; see the file COPYING.  If not, write to the Free
  18 Software Foundation, 51 Franklin Street, Fifth Floor, Boston, MA
  19 02110-1301, USA.  */
  20
  21 /* This pass tries to find the optimal set of induction variables for the loop.
  22    It optimizes just the basic linear induction variables (although adding
  23    support for other types should not be too hard).  It includes the
  24    optimizations commonly known as strength reduction, induction variable
  25    coalescing and induction variable elimination.  It does it in the
  26    following steps:
  27
  28    1) The interesting uses of induction variables are found.  This includes
  29
  30       -- uses of induction variables in non-linear expressions
  31       -- addresses of arrays
  32       -- comparisons of induction variables
  33
  34    2) Candidates for the induction variables are found.  This includes
  35
  36       -- old induction variables
  37       -- the variables defined by expressions derived from the "interesting
  38          uses" above
  39
  40    3) The optimal (w.r. to a cost function) set of variables is chosen.  The
  41       cost function assigns a cost to sets of induction variables and consists
  42       of three parts:
  43
  44       -- The use costs.  Each of the interesting uses chooses the best induction
  45          variable in the set and adds its cost to the sum.  The cost reflects
  46          the time spent on modifying the induction variable's value to be usable
  47          for the given purpose (adding base and offset for arrays, etc.).
  48       -- The variable costs.  Each of the variables has a cost assigned that
  49          reflects the costs associated with incrementing the value of the
  50          variable.  The original variables are somewhat preferred.
  51       -- The set cost.  Depending on the size of the set, extra cost may be
  52          added to reflect register pressure.
  53
  54       All the costs are defined in a machine-specific way, using the target
  55       hooks and machine descriptions to determine them.
  56
  57    4) The trees are transformed to use the new variables, the dead code is
  58       removed.
  59
  60    All of this is done loop by loop.  Doing it globally is theoretically
  61    possible, it might give a better performance and it might enable us
  62    to decide costs more precisely, but getting all the interactions right
  63    would be complicated.  */
  64
  65 #include "config.h"
  66 #include "system.h"
  67 #include "coretypes.h"
  68 #include "tm.h"
  69 #include "tree.h"
  70 #include "rtl.h"
  71 #include "tm_p.h"
  72 #include "hard-reg-set.h"
  73 #include "basic-block.h"
  74 #include "output.h"
  75 #include "diagnostic.h"
  76 #include "tree-flow.h"
  77 #include "tree-dump.h"
  78 #include "timevar.h"
  79 #include "cfgloop.h"
  80 #include "varray.h"
  81 #include "expr.h"
  82 #include "tree-pass.h"
  83 #include "ggc.h"
  84 #include "insn-config.h"
  85 #include "recog.h"
  86 #include "hashtab.h"
  87 #include "tree-chrec.h"
  88 #include "tree-scalar-evolution.h"
  89 #include "cfgloop.h"
  90 #include "params.h"
  91 #include "langhooks.h"
  92
  93 /* The infinite cost.  */
  94 #define INFTY 10000000
  95
  96 /* The expected number of loop iterations.  TODO -- use profiling instead of
  97    this.  */
  98 #define AVG_LOOP_NITER(LOOP) 5
  99
 100
 101 /* Representation of the induction variable.  */
 102 struct iv
 103 {
 104   tree base;            /* Initial value of the iv.  */
 105   tree base_object;     /* A memory object to that the induction variable points.  */
 106   tree step;            /* Step of the iv (constant only).  */
 107   tree ssa_name;        /* The ssa name with the value.  */
 108   bool biv_p;           /* Is it a biv?  */
 109   bool have_use_for;    /* Do we already have a use for it?  */
 110   unsigned use_id;      /* The identifier in the use if it is the case.  */
 111 };
 112
 113 /* Per-ssa version information (induction variable descriptions, etc.).  */
 114 struct version_info
 115 {
 116   tree name;            /* The ssa name.  */
 117   struct iv *iv;        /* Induction variable description.  */
 118   bool has_nonlin_use;  /* For a loop-level invariant, whether it is used in
 119                            an expression that is not an induction variable.  */
 120   unsigned inv_id;      /* Id of an invariant.  */
 121   bool preserve_biv;    /* For the original biv, whether to preserve it.  */
 122 };
 123
 124 /* Types of uses.  */
 125 enum use_type
 126 {
 127   USE_NONLINEAR_EXPR,   /* Use in a nonlinear expression.  */
 128   USE_ADDRESS,          /* Use in an address.  */
 129   USE_COMPARE           /* Use is a compare.  */
 130 };
 131
 132 /* The candidate - cost pair.  */
 133 struct cost_pair
 134 {
 135   struct iv_cand *cand; /* The candidate.  */
 136   unsigned cost;        /* The cost.  */
 137   bitmap depends_on;    /* The list of invariants that have to be
 138                            preserved.  */
 139   tree value;           /* For final value elimination, the expression for
 140                            the final value of the iv.  For iv elimination,
 141                            the new bound to compare with.  */
 142 };
 143
 144 /* Use.  */
 145 struct iv_use
 146 {
 147   unsigned id;          /* The id of the use.  */
 148   enum use_type type;   /* Type of the use.  */
 149   struct iv *iv;        /* The induction variable it is based on.  */
 150   tree stmt;            /* Statement in that it occurs.  */
 151   tree *op_p;           /* The place where it occurs.  */
 152   bitmap related_cands; /* The set of "related" iv candidates, plus the common
 153                            important ones.  */
 154
 155   unsigned n_map_members; /* Number of candidates in the cost_map list.  */
 156   struct cost_pair *cost_map;
 157                         /* The costs wrto the iv candidates.  */
 158
 159   struct iv_cand *selected;
 160                         /* The selected candidate.  */
 161 };
 162
 163 /* The position where the iv is computed.  */
 164 enum iv_position
 165 {
 166   IP_NORMAL,            /* At the end, just before the exit condition.  */
 167   IP_END,               /* At the end of the latch block.  */
 168   IP_ORIGINAL           /* The original biv.  */
 169 };
 170
 171 /* The induction variable candidate.  */
 172 struct iv_cand
 173 {
 174   unsigned id;          /* The number of the candidate.  */
 175   bool important;       /* Whether this is an "important" candidate, i.e. such
 176                            that it should be considered by all uses.  */
 177   enum iv_position pos; /* Where it is computed.  */
 178   tree incremented_at;  /* For original biv, the statement where it is
 179                            incremented.  */
 180   tree var_before;      /* The variable used for it before increment.  */
 181   tree var_after;       /* The variable used for it after increment.  */
 182   struct iv *iv;        /* The value of the candidate.  NULL for
 183                            "pseudocandidate" used to indicate the possibility
 184                            to replace the final value of an iv by direct
 185                            computation of the value.  */
 186   unsigned cost;        /* Cost of the candidate.  */
 187   bitmap depends_on;    /* The list of invariants that are used in step of the
 188                            biv.  */
 189 };
 190
 191 /* The data used by the induction variable optimizations.  */
 192
 193 typedef struct iv_use *iv_use_p;
 194 DEF_VEC_P(iv_use_p);
 195 DEF_VEC_ALLOC_P(iv_use_p,heap);
 196
 197 typedef struct iv_cand *iv_cand_p;
 198 DEF_VEC_P(iv_cand_p);
 199 DEF_VEC_ALLOC_P(iv_cand_p,heap);
 200
 201 struct ivopts_data
 202 {
 203   /* The currently optimized loop.  */
 204   struct loop *current_loop;
 205
 206   /* Number of registers used in it.  */
 207   unsigned regs_used;
 208
 209   /* Numbers of iterations for all exits of the current loop.  */
 210   htab_t niters;
 211
 212   /* The size of version_info array allocated.  */
 213   unsigned version_info_size;
 214
 215   /* The array of information for the ssa names.  */
 216   struct version_info *version_info;
 217
 218   /* The bitmap of indices in version_info whose value was changed.  */
 219   bitmap relevant;
 220
 221   /* The maximum invariant id.  */
 222   unsigned max_inv_id;
 223
 224   /* The uses of induction variables.  */
 225   VEC(iv_use_p,heap) *iv_uses;
 226
 227   /* The candidates.  */
 228   VEC(iv_cand_p,heap) *iv_candidates;
 229
 230   /* A bitmap of important candidates.  */
 231   bitmap important_candidates;
 232
 233   /* Whether to consider just related and important candidates when replacing a
 234      use.  */
 235   bool consider_all_candidates;
 236 };
 237
 238 /* An assignment of iv candidates to uses.  */
 239
 240 struct iv_ca
 241 {
 242   /* The number of uses covered by the assignment.  */
 243   unsigned upto;
 244
 245   /* Number of uses that cannot be expressed by the candidates in the set.  */
 246   unsigned bad_uses;
 247
 248   /* Candidate assigned to a use, together with the related costs.  */
 249   struct cost_pair **cand_for_use;
 250
 251   /* Number of times each candidate is used.  */
 252   unsigned *n_cand_uses;
 253
 254   /* The candidates used.  */
 255   bitmap cands;
 256
 257   /* The number of candidates in the set.  */
 258   unsigned n_cands;
 259
 260   /* Total number of registers needed.  */
 261   unsigned n_regs;
 262
 263   /* Total cost of expressing uses.  */
 264   unsigned cand_use_cost;
 265
 266   /* Total cost of candidates.  */
 267   unsigned cand_cost;
 268
 269   /* Number of times each invariant is used.  */
 270   unsigned *n_invariant_uses;
 271
 272   /* Total cost of the assignment.  */
 273   unsigned cost;
 274 };
 275
 276 /* Difference of two iv candidate assignments.  */
 277
 278 struct iv_ca_delta
 279 {
 280   /* Changed use.  */
 281   struct iv_use *use;
 282
 283   /* An old assignment (for rollback purposes).  */
 284   struct cost_pair *old_cp;
 285
 286   /* A new assignment.  */
 287   struct cost_pair *new_cp;
 288
 289   /* Next change in the list.  */
 290   struct iv_ca_delta *next_change;
 291 };
 292
 293 /* Bound on number of candidates below that all candidates are considered.  */
 294
 295 #define CONSIDER_ALL_CANDIDATES_BOUND \
 296   ((unsigned) PARAM_VALUE (PARAM_IV_CONSIDER_ALL_CANDIDATES_BOUND))
 297
 298 /* If there are more iv occurrences, we just give up (it is quite unlikely that
 299    optimizing such a loop would help, and it would take ages).  */
 300
 301 #define MAX_CONSIDERED_USES \
 302   ((unsigned) PARAM_VALUE (PARAM_IV_MAX_CONSIDERED_USES))
 303
 304 /* If there are at most this number of ivs in the set, try removing unnecessary
 305    ivs from the set always.  */
 306
 307 #define ALWAYS_PRUNE_CAND_SET_BOUND \
 308   ((unsigned) PARAM_VALUE (PARAM_IV_ALWAYS_PRUNE_CAND_SET_BOUND))
 309
 310 /* The list of trees for that the decl_rtl field must be reset is stored
 311    here.  */
 312
 313 static VEC(tree,heap) *decl_rtl_to_reset;
 314
 315 /* Number of uses recorded in DATA.  */
 316
 317 static inline unsigned
 318 n_iv_uses (struct ivopts_data *data)
 319 {
 320   return VEC_length (iv_use_p, data->iv_uses);
 321 }
 322
 323 /* Ith use recorded in DATA.  */
 324
 325 static inline struct iv_use *
 326 iv_use (struct ivopts_data *data, unsigned i)
 327 {
 328   return VEC_index (iv_use_p, data->iv_uses, i);
 329 }
 330
 331 /* Number of candidates recorded in DATA.  */
 332
 333 static inline unsigned
 334 n_iv_cands (struct ivopts_data *data)
 335 {
 336   return VEC_length (iv_cand_p, data->iv_candidates);
 337 }
 338
 339 /* Ith candidate recorded in DATA.  */
 340
 341 static inline struct iv_cand *
 342 iv_cand (struct ivopts_data *data, unsigned i)
 343 {
 344   return VEC_index (iv_cand_p, data->iv_candidates, i);
 345 }
 346
 347 /* The single loop exit if it dominates the latch, NULL otherwise.  */
 348
 349 edge
 350 single_dom_exit (struct loop *loop)
 351 {
 352   edge exit = loop->single_exit;
 353
 354   if (!exit)
 355     return NULL;
 356
 357   if (!just_once_each_iteration_p (loop, exit->src))
 358     return NULL;
 359
 360   return exit;
 361 }
 362
 363 /* Dumps information about the induction variable IV to FILE.  */
 364
 365 extern void dump_iv (FILE *, struct iv *);
 366 void
 367 dump_iv (FILE *file, struct iv *iv)
 368 {
 369   if (iv->ssa_name)
 370     {
 371       fprintf (file, "ssa name ");
 372       print_generic_expr (file, iv->ssa_name, TDF_SLIM);
 373       fprintf (file, "\n");
 374     }
 375
 376   fprintf (file, "  type ");
 377   print_generic_expr (file, TREE_TYPE (iv->base), TDF_SLIM);
 378   fprintf (file, "\n");
 379
 380   if (iv->step)
 381     {
 382       fprintf (file, "  base ");
 383       print_generic_expr (file, iv->base, TDF_SLIM);
 384       fprintf (file, "\n");
 385
 386       fprintf (file, "  step ");
 387       print_generic_expr (file, iv->step, TDF_SLIM);
 388       fprintf (file, "\n");
 389     }
 390   else
 391     {
 392       fprintf (file, "  invariant ");
 393       print_generic_expr (file, iv->base, TDF_SLIM);
 394       fprintf (file, "\n");
 395     }
 396
 397   if (iv->base_object)
 398     {
 399       fprintf (file, "  base object ");
 400       print_generic_expr (file, iv->base_object, TDF_SLIM);
 401       fprintf (file, "\n");
 402     }
 403
 404   if (iv->biv_p)
 405     fprintf (file, "  is a biv\n");
 406 }
 407
 408 /* Dumps information about the USE to FILE.  */
 409
 410 extern void dump_use (FILE *, struct iv_use *);
 411 void
 412 dump_use (FILE *file, struct iv_use *use)
 413 {
 414   fprintf (file, "use %d\n", use->id);
 415
 416   switch (use->type)
 417     {
 418     case USE_NONLINEAR_EXPR:
 419       fprintf (file, "  generic\n");
 420       break;
 421
 422     case USE_ADDRESS:
 423       fprintf (file, "  address\n");
 424       break;
 425
 426     case USE_COMPARE:
 427       fprintf (file, "  compare\n");
 428       break;
 429
 430     default:
 431       gcc_unreachable ();
 432     }
 433
 434   fprintf (file, "  in statement ");
 435   print_generic_expr (file, use->stmt, TDF_SLIM);
 436   fprintf (file, "\n");
 437
 438   fprintf (file, "  at position ");
 439   if (use->op_p)
 440     print_generic_expr (file, *use->op_p, TDF_SLIM);
 441   fprintf (file, "\n");
 442
 443   dump_iv (file, use->iv);
 444
 445   if (use->related_cands)
 446     {
 447       fprintf (file, "  related candidates ");
 448       dump_bitmap (file, use->related_cands);
 449     }
 450 }
 451
 452 /* Dumps information about the uses to FILE.  */
 453
 454 extern void dump_uses (FILE *, struct ivopts_data *);
 455 void
 456 dump_uses (FILE *file, struct ivopts_data *data)
 457 {
 458   unsigned i;
 459   struct iv_use *use;
 460
 461   for (i = 0; i < n_iv_uses (data); i++)
 462     {
 463       use = iv_use (data, i);
 464
 465       dump_use (file, use);
 466       fprintf (file, "\n");
 467     }
 468 }
 469
 470 /* Dumps information about induction variable candidate CAND to FILE.  */
 471
 472 extern void dump_cand (FILE *, struct iv_cand *);
 473 void
 474 dump_cand (FILE *file, struct iv_cand *cand)
 475 {
 476   struct iv *iv = cand->iv;
 477
 478   fprintf (file, "candidate %d%s\n",
 479            cand->id, cand->important ? " (important)" : "");
 480
 481   if (cand->depends_on)
 482     {
 483       fprintf (file, "  depends on ");
 484       dump_bitmap (file, cand->depends_on);
 485     }
 486
 487   if (!iv)
 488     {
 489       fprintf (file, "  final value replacement\n");
 490       return;
 491     }
 492
 493   switch (cand->pos)
 494     {
 495     case IP_NORMAL:
 496       fprintf (file, "  incremented before exit test\n");
 497       break;
 498
 499     case IP_END:
 500       fprintf (file, "  incremented at end\n");
 501       break;
 502
 503     case IP_ORIGINAL:
 504       fprintf (file, "  original biv\n");
 505       break;
 506     }
 507
 508   dump_iv (file, iv);
 509 }
 510
 511 /* Returns the info for ssa version VER.  */
 512
 513 static inline struct version_info *
 514 ver_info (struct ivopts_data *data, unsigned ver)
 515 {
 516   return data->version_info + ver;
 517 }
 518
 519 /* Returns the info for ssa name NAME.  */
 520
 521 static inline struct version_info *
 522 name_info (struct ivopts_data *data, tree name)
 523 {
 524   return ver_info (data, SSA_NAME_VERSION (name));
 525 }
 526
 527 /* Checks whether there exists number X such that X * B = A, counting modulo
 528    2^BITS.  */
 529
 530 static bool
 531 divide (unsigned bits, unsigned HOST_WIDE_INT a, unsigned HOST_WIDE_INT b,
 532         HOST_WIDE_INT *x)
 533 {
 534   unsigned HOST_WIDE_INT mask = ~(~(unsigned HOST_WIDE_INT) 0 << (bits - 1) << 1);
 535   unsigned HOST_WIDE_INT inv, ex, val;
 536   unsigned i;
 537
 538   a &= mask;
 539   b &= mask;
 540
 541   /* First divide the whole equation by 2 as long as possible.  */
 542   while (!(a & 1) && !(b & 1))
 543     {
 544       a >>= 1;
 545       b >>= 1;
 546       bits--;
 547       mask >>= 1;
 548     }
 549
 550   if (!(b & 1))
 551     {
 552       /* If b is still even, a is odd and there is no such x.  */
 553       return false;
 554     }
 555
 556   /* Find the inverse of b.  We compute it as
 557      b^(2^(bits - 1) - 1) (mod 2^bits).  */
 558   inv = 1;
 559   ex = b;
 560   for (i = 0; i < bits - 1; i++)
 561     {
 562       inv = (inv * ex) & mask;
 563       ex = (ex * ex) & mask;
 564     }
 565
 566   val = (a * inv) & mask;
 567
 568   gcc_assert (((val * b) & mask) == a);
 569
 570   if ((val >> (bits - 1)) & 1)
 571     val |= ~mask;
 572
 573   *x = val;
 574
 575   return true;
 576 }
 577
 578 /* Returns true if STMT is after the place where the IP_NORMAL ivs will be
 579    emitted in LOOP.  */
 580
 581 static bool
 582 stmt_after_ip_normal_pos (struct loop *loop, tree stmt)
 583 {
 584   basic_block bb = ip_normal_pos (loop), sbb = bb_for_stmt (stmt);
 585
 586   gcc_assert (bb);
 587
 588   if (sbb == loop->latch)
 589     return true;
 590
 591   if (sbb != bb)
 592     return false;
 593
 594   return stmt == last_stmt (bb);
 595 }
 596
 597 /* Returns true if STMT if after the place where the original induction
 598    variable CAND is incremented.  */
 599
 600 static bool
 601 stmt_after_ip_original_pos (struct iv_cand *cand, tree stmt)
 602 {
 603   basic_block cand_bb = bb_for_stmt (cand->incremented_at);
 604   basic_block stmt_bb = bb_for_stmt (stmt);
 605   block_stmt_iterator bsi;
 606
 607   if (!dominated_by_p (CDI_DOMINATORS, stmt_bb, cand_bb))
 608     return false;
 609
 610   if (stmt_bb != cand_bb)
 611     return true;
 612
 613   /* Scan the block from the end, since the original ivs are usually
 614      incremented at the end of the loop body.  */
 615   for (bsi = bsi_last (stmt_bb); ; bsi_prev (&bsi))
 616     {
 617       if (bsi_stmt (bsi) == cand->incremented_at)
 618         return false;
 619       if (bsi_stmt (bsi) == stmt)
 620         return true;
 621     }
 622 }
 623
 624 /* Returns true if STMT if after the place where the induction variable
 625    CAND is incremented in LOOP.  */
 626
 627 static bool
 628 stmt_after_increment (struct loop *loop, struct iv_cand *cand, tree stmt)
 629 {
 630   switch (cand->pos)
 631     {
 632     case IP_END:
 633       return false;
 634
 635     case IP_NORMAL:
 636       return stmt_after_ip_normal_pos (loop, stmt);
 637
 638     case IP_ORIGINAL:
 639       return stmt_after_ip_original_pos (cand, stmt);
 640
 641     default:
 642       gcc_unreachable ();
 643     }
 644 }
 645
 646 /* Returns true if EXP is a ssa name that occurs in an abnormal phi node.  */
 647
 648 static bool
 649 abnormal_ssa_name_p (tree exp)
 650 {
 651   if (!exp)
 652     return false;
 653
 654   if (TREE_CODE (exp) != SSA_NAME)
 655     return false;
 656
 657   return SSA_NAME_OCCURS_IN_ABNORMAL_PHI (exp) != 0;
 658 }
 659
 660 /* Returns false if BASE or INDEX contains a ssa name that occurs in an
 661    abnormal phi node.  Callback for for_each_index.  */
 662
 663 static bool
 664 idx_contains_abnormal_ssa_name_p (tree base, tree *index,
 665                                   void *data ATTRIBUTE_UNUSED)
 666 {
 667   if (TREE_CODE (base) == ARRAY_REF)
 668     {
 669       if (abnormal_ssa_name_p (TREE_OPERAND (base, 2)))
 670         return false;
 671       if (abnormal_ssa_name_p (TREE_OPERAND (base, 3)))
 672         return false;
 673     }
 674
 675   return !abnormal_ssa_name_p (*index);
 676 }
 677
 678 /* Returns true if EXPR contains a ssa name that occurs in an
 679    abnormal phi node.  */
 680
 681 bool
 682 contains_abnormal_ssa_name_p (tree expr)
 683 {
 684   enum tree_code code;
 685   enum tree_code_class class;
 686
 687   if (!expr)
 688     return false;
 689
 690   code = TREE_CODE (expr);
 691   class = TREE_CODE_CLASS (code);
 692
 693   if (code == SSA_NAME)
 694     return SSA_NAME_OCCURS_IN_ABNORMAL_PHI (expr) != 0;
 695
 696   if (code == INTEGER_CST
 697       || is_gimple_min_invariant (expr))
 698     return false;
 699
 700   if (code == ADDR_EXPR)
 701     return !for_each_index (&TREE_OPERAND (expr, 0),
 702                             idx_contains_abnormal_ssa_name_p,
 703                             NULL);
 704
 705   switch (class)
 706     {
 707     case tcc_binary:
 708     case tcc_comparison:
 709       if (contains_abnormal_ssa_name_p (TREE_OPERAND (expr, 1)))
 710         return true;
 711
 712       /* Fallthru.  */
 713     case tcc_unary:
 714       if (contains_abnormal_ssa_name_p (TREE_OPERAND (expr, 0)))
 715         return true;
 716
 717       break;
 718
 719     default:
 720       gcc_unreachable ();
 721     }
 722
 723   return false;
 724 }
 725
 726 /* Element of the table in that we cache the numbers of iterations obtained
 727    from exits of the loop.  */
 728
 729 struct nfe_cache_elt
 730 {
 731   /* The edge for that the number of iterations is cached.  */
 732   edge exit;
 733
 734   /* Number of iterations corresponding to this exit, or NULL if it cannot be
 735      determined.  */
 736   tree niter;
 737 };
 738
 739 /* Hash function for nfe_cache_elt E.  */
 740
 741 static hashval_t
 742 nfe_hash (const void *e)
 743 {
 744   const struct nfe_cache_elt *elt = e;
 745
 746   return htab_hash_pointer (elt->exit);
 747 }
 748
 749 /* Equality function for nfe_cache_elt E1 and edge E2.  */
 750
 751 static int
 752 nfe_eq (const void *e1, const void *e2)
 753 {
 754   const struct nfe_cache_elt *elt1 = e1;
 755
 756   return elt1->exit == e2;
 757 }
 758
 759 /*  Returns tree describing number of iterations determined from
 760     EXIT of DATA->current_loop, or NULL if something goes wrong.  */
 761
 762 static tree
 763 niter_for_exit (struct ivopts_data *data, edge exit)
 764 {
 765   struct nfe_cache_elt *nfe_desc;
 766   struct tree_niter_desc desc;
 767   PTR *slot;
 768
 769   slot = htab_find_slot_with_hash (data->niters, exit,
 770                                    htab_hash_pointer (exit),
 771                                    INSERT);
 772
 773   if (!*slot)
 774     {
 775       nfe_desc = xmalloc (sizeof (struct nfe_cache_elt));
 776       nfe_desc->exit = exit;
 777
 778       /* Try to determine number of iterations.  We must know it
 779          unconditionally (i.e., without possibility of # of iterations
 780          being zero).  Also, we cannot safely work with ssa names that
 781          appear in phi nodes on abnormal edges, so that we do not create
 782          overlapping life ranges for them (PR 27283).  */
 783       if (number_of_iterations_exit (data->current_loop,
 784                                      exit, &desc, true)
 785           && zero_p (desc.may_be_zero)
 786           && !contains_abnormal_ssa_name_p (desc.niter))
 787         nfe_desc->niter = desc.niter;
 788       else
 789         nfe_desc->niter = NULL_TREE;
 790     }
 791   else
 792     nfe_desc = *slot;
 793
 794   return nfe_desc->niter;
 795 }
 796
 797 /* Returns tree describing number of iterations determined from
 798    single dominating exit of DATA->current_loop, or NULL if something
 799    goes wrong.  */
 800
 801 static tree
 802 niter_for_single_dom_exit (struct ivopts_data *data)
 803 {
 804   edge exit = single_dom_exit (data->current_loop);
 805
 806   if (!exit)
 807     return NULL;
 808
 809   return niter_for_exit (data, exit);
 810 }
 811
 812 /* Initializes data structures used by the iv optimization pass, stored
 813    in DATA.  */
 814
 815 static void
 816 tree_ssa_iv_optimize_init (struct ivopts_data *data)
 817 {
 818   data->version_info_size = 2 * num_ssa_names;
 819   data->version_info = XCNEWVEC (struct version_info, data->version_info_size);
 820   data->relevant = BITMAP_ALLOC (NULL);
 821   data->important_candidates = BITMAP_ALLOC (NULL);
 822   data->max_inv_id = 0;
 823   data->niters = htab_create (10, nfe_hash, nfe_eq, free);
 824   data->iv_uses = VEC_alloc (iv_use_p, heap, 20);
 825   data->iv_candidates = VEC_alloc (iv_cand_p, heap, 20);
 826   decl_rtl_to_reset = VEC_alloc (tree, heap, 20);
 827 }
 828
 829 /* Returns a memory object to that EXPR points.  In case we are able to
 830    determine that it does not point to any such object, NULL is returned.  */
 831
 832 static tree
 833 determine_base_object (tree expr)
 834 {
 835   enum tree_code code = TREE_CODE (expr);
 836   tree base, obj, op0, op1;
 837
 838   if (!POINTER_TYPE_P (TREE_TYPE (expr)))
 839     return NULL_TREE;
 840
 841   switch (code)
 842     {
 843     case INTEGER_CST:
 844       return NULL_TREE;
 845
 846     case ADDR_EXPR:
 847       obj = TREE_OPERAND (expr, 0);
 848       base = get_base_address (obj);
 849
 850       if (!base)
 851         return expr;
 852
 853       if (TREE_CODE (base) == INDIRECT_REF)
 854         return determine_base_object (TREE_OPERAND (base, 0));
 855
 856       return fold_convert (ptr_type_node,
 857                            build_fold_addr_expr (base));
 858
 859     case PLUS_EXPR:
 860     case MINUS_EXPR:
 861       op0 = determine_base_object (TREE_OPERAND (expr, 0));
 862       op1 = determine_base_object (TREE_OPERAND (expr, 1));
 863
 864       if (!op1)
 865         return op0;
 866
 867       if (!op0)
 868         return (code == PLUS_EXPR
 869                 ? op1
 870                 : fold_build1 (NEGATE_EXPR, ptr_type_node, op1));
 871
 872       return fold_build2 (code, ptr_type_node, op0, op1);
 873
 874     case NOP_EXPR:
 875     case CONVERT_EXPR:
 876       return determine_base_object (TREE_OPERAND (expr, 0));
 877
 878     default:
 879       return fold_convert (ptr_type_node, expr);
 880     }
 881 }
 882
 883 /* Allocates an induction variable with given initial value BASE and step STEP
 884    for loop LOOP.  */
 885
 886 static struct iv *
 887 alloc_iv (tree base, tree step)
 888 {
 889   struct iv *iv = XCNEW (struct iv);
 890
 891   if (step && integer_zerop (step))
 892     step = NULL_TREE;
 893
 894   iv->base = base;
 895   iv->base_object = determine_base_object (base);
 896   iv->step = step;
 897   iv->biv_p = false;
 898   iv->have_use_for = false;
 899   iv->use_id = 0;
 900   iv->ssa_name = NULL_TREE;
 901
 902   return iv;
 903 }
 904
 905 /* Sets STEP and BASE for induction variable IV.  */
 906
 907 static void
 908 set_iv (struct ivopts_data *data, tree iv, tree base, tree step)
 909 {
 910   struct version_info *info = name_info (data, iv);
 911
 912   gcc_assert (!info->iv);
 913
 914   bitmap_set_bit (data->relevant, SSA_NAME_VERSION (iv));
 915   info->iv = alloc_iv (base, step);
 916   info->iv->ssa_name = iv;
 917 }
 918
 919 /* Finds induction variable declaration for VAR.  */
 920
 921 static struct iv *
 922 get_iv (struct ivopts_data *data, tree var)
 923 {
 924   basic_block bb;
 925
 926   if (!name_info (data, var)->iv)
 927     {
 928       bb = bb_for_stmt (SSA_NAME_DEF_STMT (var));
 929
 930       if (!bb
 931           || !flow_bb_inside_loop_p (data->current_loop, bb))
 932         set_iv (data, var, var, NULL_TREE);
 933     }
 934
 935   return name_info (data, var)->iv;
 936 }
 937
 938 /* Determines the step of a biv defined in PHI.  Returns NULL if PHI does
 939    not define a simple affine biv with nonzero step.  */
 940
 941 static tree
 942 determine_biv_step (tree phi)
 943 {
 944   struct loop *loop = bb_for_stmt (phi)->loop_father;
 945   tree name = PHI_RESULT (phi);
 946   affine_iv iv;
 947
 948   if (!is_gimple_reg (name))
 949     return NULL_TREE;
 950
 951   if (!simple_iv (loop, phi, name, &iv, true))
 952     return NULL_TREE;
 953
 954   return (zero_p (iv.step) ? NULL_TREE : iv.step);
 955 }
 956
 957 /* Finds basic ivs.  */
 958
 959 static bool
 960 find_bivs (struct ivopts_data *data)
 961 {
 962   tree phi, step, type, base;
 963   bool found = false;
 964   struct loop *loop = data->current_loop;
 965
 966   for (phi = phi_nodes (loop->header); phi; phi = PHI_CHAIN (phi))
 967     {
 968       if (SSA_NAME_OCCURS_IN_ABNORMAL_PHI (PHI_RESULT (phi)))
 969         continue;
 970
 971       step = determine_biv_step (phi);
 972       if (!step)
 973         continue;
 974
 975       base = PHI_ARG_DEF_FROM_EDGE (phi, loop_preheader_edge (loop));
 976       base = expand_simple_operations (base);
 977       if (contains_abnormal_ssa_name_p (base)
 978           || contains_abnormal_ssa_name_p (step))
 979         continue;
 980
 981       type = TREE_TYPE (PHI_RESULT (phi));
 982       base = fold_convert (type, base);
 983       if (step)
 984         step = fold_convert (type, step);
 985
 986       set_iv (data, PHI_RESULT (phi), base, step);
 987       found = true;
 988     }
 989
 990   return found;
 991 }
 992
 993 /* Marks basic ivs.  */
 994
 995 static void
 996 mark_bivs (struct ivopts_data *data)
 997 {
 998   tree phi, var;
 999   struct iv *iv, *incr_iv;
1000   struct loop *loop = data->current_loop;
1001   basic_block incr_bb;
1002
1003   for (phi = phi_nodes (loop->header); phi; phi = PHI_CHAIN (phi))
1004     {
1005       iv = get_iv (data, PHI_RESULT (phi));
1006       if (!iv)
1007         continue;
1008
1009       var = PHI_ARG_DEF_FROM_EDGE (phi, loop_latch_edge (loop));
1010       incr_iv = get_iv (data, var);
1011       if (!incr_iv)
1012         continue;
1013
1014       /* If the increment is in the subloop, ignore it.  */
1015       incr_bb = bb_for_stmt (SSA_NAME_DEF_STMT (var));
1016       if (incr_bb->loop_father != data->current_loop
1017           || (incr_bb->flags & BB_IRREDUCIBLE_LOOP))
1018         continue;
1019
1020       iv->biv_p = true;
1021       incr_iv->biv_p = true;
1022     }
1023 }
1024
1025 /* Checks whether STMT defines a linear induction variable and stores its
1026    parameters to IV.  */
1027
1028 static bool
1029 find_givs_in_stmt_scev (struct ivopts_data *data, tree stmt, affine_iv *iv)
1030 {
1031   tree lhs;
1032   struct loop *loop = data->current_loop;
1033
1034   iv->base = NULL_TREE;
1035   iv->step = NULL_TREE;
1036
1037   if (TREE_CODE (stmt) != MODIFY_EXPR)
1038     return false;
1039
1040   lhs = TREE_OPERAND (stmt, 0);
1041   if (TREE_CODE (lhs) != SSA_NAME)
1042     return false;
1043
1044   if (!simple_iv (loop, stmt, TREE_OPERAND (stmt, 1), iv, true))
1045     return false;
1046   iv->base = expand_simple_operations (iv->base);
1047
1048   if (contains_abnormal_ssa_name_p (iv->base)
1049       || contains_abnormal_ssa_name_p (iv->step))
1050     return false;
1051
1052   return true;
1053 }
1054
1055 /* Finds general ivs in statement STMT.  */
1056
1057 static void
1058 find_givs_in_stmt (struct ivopts_data *data, tree stmt)
1059 {
1060   affine_iv iv;
1061
1062   if (!find_givs_in_stmt_scev (data, stmt, &iv))
1063     return;
1064
1065   set_iv (data, TREE_OPERAND (stmt, 0), iv.base, iv.step);
1066 }
1067
1068 /* Finds general ivs in basic block BB.  */
1069
1070 static void
1071 find_givs_in_bb (struct ivopts_data *data, basic_block bb)
1072 {
1073   block_stmt_iterator bsi;
1074
1075   for (bsi = bsi_start (bb); !bsi_end_p (bsi); bsi_next (&bsi))
1076     find_givs_in_stmt (data, bsi_stmt (bsi));
1077 }
1078
1079 /* Finds general ivs.  */
1080
1081 static void
1082 find_givs (struct ivopts_data *data)
1083 {
1084   struct loop *loop = data->current_loop;
1085   basic_block *body = get_loop_body_in_dom_order (loop);
1086   unsigned i;
1087
1088   for (i = 0; i < loop->num_nodes; i++)
1089     find_givs_in_bb (data, body[i]);
1090   free (body);
1091 }
1092
1093 /* For each ssa name defined in LOOP determines whether it is an induction
1094    variable and if so, its initial value and step.  */
1095
1096 static bool
1097 find_induction_variables (struct ivopts_data *data)
1098 {
1099   unsigned i;
1100   bitmap_iterator bi;
1101
1102   if (!find_bivs (data))
1103     return false;
1104
1105   find_givs (data);
1106   mark_bivs (data);
1107
1108   if (dump_file && (dump_flags & TDF_DETAILS))
1109     {
1110       tree niter = niter_for_single_dom_exit (data);
1111
1112       if (niter)
1113         {
1114           fprintf (dump_file, "  number of iterations ");
1115           print_generic_expr (dump_file, niter, TDF_SLIM);
1116           fprintf (dump_file, "\n\n");
1117         };
1118
1119       fprintf (dump_file, "Induction variables:\n\n");
1120
1121       EXECUTE_IF_SET_IN_BITMAP (data->relevant, 0, i, bi)
1122         {
1123           if (ver_info (data, i)->iv)
1124             dump_iv (dump_file, ver_info (data, i)->iv);
1125         }
1126     }
1127
1128   return true;
1129 }
1130
1131 /* Records a use of type USE_TYPE at *USE_P in STMT whose value is IV.  */
1132
1133 static struct iv_use *
1134 record_use (struct ivopts_data *data, tree *use_p, struct iv *iv,
1135             tree stmt, enum use_type use_type)
1136 {
1137   struct iv_use *use = XCNEW (struct iv_use);
1138
1139   use->id = n_iv_uses (data);
1140   use->type = use_type;
1141   use->iv = iv;
1142   use->stmt = stmt;
1143   use->op_p = use_p;
1144   use->related_cands = BITMAP_ALLOC (NULL);
1145
1146   /* To avoid showing ssa name in the dumps, if it was not reset by the
1147      caller.  */
1148   iv->ssa_name = NULL_TREE;
1149
1150   if (dump_file && (dump_flags & TDF_DETAILS))
1151     dump_use (dump_file, use);
1152
1153   VEC_safe_push (iv_use_p, heap, data->iv_uses, use);
1154
1155   return use;
1156 }
1157
1158 /* Checks whether OP is a loop-level invariant and if so, records it.
1159    NONLINEAR_USE is true if the invariant is used in a way we do not
1160    handle specially.  */
1161
1162 static void
1163 record_invariant (struct ivopts_data *data, tree op, bool nonlinear_use)
1164 {
1165   basic_block bb;
1166   struct version_info *info;
1167
1168   if (TREE_CODE (op) != SSA_NAME
1169       || !is_gimple_reg (op))
1170     return;
1171
1172   bb = bb_for_stmt (SSA_NAME_DEF_STMT (op));
1173   if (bb
1174       && flow_bb_inside_loop_p (data->current_loop, bb))
1175     return;
1176
1177   info = name_info (data, op);
1178   info->name = op;
1179   info->has_nonlin_use |= nonlinear_use;
1180   if (!info->inv_id)
1181     info->inv_id = ++data->max_inv_id;
1182   bitmap_set_bit (data->relevant, SSA_NAME_VERSION (op));
1183 }
1184
1185 /* Checks whether the use OP is interesting and if so, records it.  */
1186
1187 static struct iv_use *
1188 find_interesting_uses_op (struct ivopts_data *data, tree op)
1189 {
1190   struct iv *iv;
1191   struct iv *civ;
1192   tree stmt;
1193   struct iv_use *use;
1194
1195   if (TREE_CODE (op) != SSA_NAME)
1196     return NULL;
1197
1198   iv = get_iv (data, op);
1199   if (!iv)
1200     return NULL;
1201
1202   if (iv->have_use_for)
1203     {
1204       use = iv_use (data, iv->use_id);
1205
1206       gcc_assert (use->type == USE_NONLINEAR_EXPR);
1207       return use;
1208     }
1209
1210   if (zero_p (iv->step))
1211     {
1212       record_invariant (data, op, true);
1213       return NULL;
1214     }
1215   iv->have_use_for = true;
1216
1217   civ = XNEW (struct iv);
1218   *civ = *iv;
1219
1220   stmt = SSA_NAME_DEF_STMT (op);
1221   gcc_assert (TREE_CODE (stmt) == PHI_NODE
1222               || TREE_CODE (stmt) == MODIFY_EXPR);
1223
1224   use = record_use (data, NULL, civ, stmt, USE_NONLINEAR_EXPR);
1225   iv->use_id = use->id;
1226
1227   return use;
1228 }
1229
1230 /* Checks whether the condition *COND_P in STMT is interesting
1231    and if so, records it.  */
1232
1233 static void
1234 find_interesting_uses_cond (struct ivopts_data *data, tree stmt, tree *cond_p)
1235 {
1236   tree *op0_p;
1237   tree *op1_p;
1238   struct iv *iv0 = NULL, *iv1 = NULL, *civ;
1239   struct iv const_iv;
1240   tree zero = integer_zero_node;
1241
1242   const_iv.step = NULL_TREE;
1243
1244   if (TREE_CODE (*cond_p) != SSA_NAME
1245       && !COMPARISON_CLASS_P (*cond_p))
1246     return;
1247
1248   if (TREE_CODE (*cond_p) == SSA_NAME)
1249     {
1250       op0_p = cond_p;
1251       op1_p = &zero;
1252     }
1253   else
1254     {
1255       op0_p = &TREE_OPERAND (*cond_p, 0);
1256       op1_p = &TREE_OPERAND (*cond_p, 1);
1257     }
1258
1259   if (TREE_CODE (*op0_p) == SSA_NAME)
1260     iv0 = get_iv (data, *op0_p);
1261   else
1262     iv0 = &const_iv;
1263
1264   if (TREE_CODE (*op1_p) == SSA_NAME)
1265     iv1 = get_iv (data, *op1_p);
1266   else
1267     iv1 = &const_iv;
1268
1269   if (/* When comparing with non-invariant value, we may not do any senseful
1270          induction variable elimination.  */
1271       (!iv0 || !iv1)
1272       /* Eliminating condition based on two ivs would be nontrivial.
1273          ??? TODO -- it is not really important to handle this case.  */
1274       || (!zero_p (iv0->step) && !zero_p (iv1->step)))
1275     {
1276       find_interesting_uses_op (data, *op0_p);
1277       find_interesting_uses_op (data, *op1_p);
1278       return;
1279     }
1280
1281   if (zero_p (iv0->step) && zero_p (iv1->step))
1282     {
1283       /* If both are invariants, this is a work for unswitching.  */
1284       return;
1285     }
1286
1287   civ = XNEW (struct iv);
1288   *civ = zero_p (iv0->step) ? *iv1: *iv0;
1289   record_use (data, cond_p, civ, stmt, USE_COMPARE);
1290 }
1291
1292 /* Returns true if expression EXPR is obviously invariant in LOOP,
1293    i.e. if all its operands are defined outside of the LOOP.  */
1294
1295 bool
1296 expr_invariant_in_loop_p (struct loop *loop, tree expr)
1297 {
1298   basic_block def_bb;
1299   unsigned i, len;
1300
1301   if (is_gimple_min_invariant (expr))
1302     return true;
1303
1304   if (TREE_CODE (expr) == SSA_NAME)
1305     {
1306       def_bb = bb_for_stmt (SSA_NAME_DEF_STMT (expr));
1307       if (def_bb
1308           && flow_bb_inside_loop_p (loop, def_bb))
1309         return false;
1310
1311       return true;
1312     }
1313
1314   if (!EXPR_P (expr))
1315     return false;
1316
1317   len = TREE_CODE_LENGTH (TREE_CODE (expr));
1318   for (i = 0; i < len; i++)
1319     if (!expr_invariant_in_loop_p (loop, TREE_OPERAND (expr, i)))
1320       return false;
1321
1322   return true;
1323 }
1324
/* Data handed to idx_find_step through the DATA pointer of
   for_each_index.  */

struct ifs_ivopts_data
{
  /* The ivopts data; used for the current loop and to look up ivs.  */
  struct ivopts_data *ivopts_data;
  /* The statement passed to convert_affine_scev when the iv of an index
     is converted to sizetype.  */
  tree stmt;
  /* Points to the accumulated step of the whole reference.  A NULL
     *STEP_P is treated as "no step accumulated so far".  */
  tree *step_p;
};

/* Cumulates the steps of indices into DATA and replaces their values with the
   initial ones.  Returns false when the value of the index cannot be determined.
   Callback for for_each_index.

   BASE is the reference the index *IDX belongs to and DATA points to a
   struct ifs_ivopts_data.  False is also returned for references that are
   rejected outright: (mis)aligned indirect references, component or array
   references whose offset, element size or lower bound is not invariant in
   the loop, array elements whose size is not an INTEGER_CST, and indices
   whose iv cannot be converted to sizetype.  */

static bool
idx_find_step (tree base, tree *idx, void *data)
{
  struct ifs_ivopts_data *dta = data;
  struct iv *iv;
  tree step, iv_base, iv_step, lbound, off;
  struct loop *loop = dta->ivopts_data->current_loop;

  if (TREE_CODE (base) == MISALIGNED_INDIRECT_REF
      || TREE_CODE (base) == ALIGN_INDIRECT_REF)
    return false;

  /* If base is a component ref, require that the offset of the reference
     be invariant.  */
  if (TREE_CODE (base) == COMPONENT_REF)
    {
      off = component_ref_field_offset (base);
      return expr_invariant_in_loop_p (loop, off);
    }

  /* If base is array, first check whether we will be able to move the
     reference out of the loop (in order to take its address in strength
     reduction).  In order for this to work we need both lower bound
     and step to be loop invariants.  */
  if (TREE_CODE (base) == ARRAY_REF)
    {
      step = array_ref_element_size (base);
      lbound = array_ref_low_bound (base);

      if (!expr_invariant_in_loop_p (loop, step)
          || !expr_invariant_in_loop_p (loop, lbound))
        return false;
    }

  /* An index that is not an ssa name is left alone and contributes no
     step.  */
  if (TREE_CODE (*idx) != SSA_NAME)
    return true;

  iv = get_iv (dta->ivopts_data, *idx);
  if (!iv)
    return false;

  /* XXX  We produce for a base of *D42 with iv->base being &x[0]
          *&x[0], which is not folded and does not trigger the
          ARRAY_REF path below.  */
  *idx = iv->base;

  /* An iv without a step: the index has been replaced by its base and
     there is nothing to add to the accumulated step.  */
  if (!iv->step)
    return true;

  if (TREE_CODE (base) == ARRAY_REF)
    {
      step = array_ref_element_size (base);

      /* We only handle addresses whose step is an integer constant.  */
      if (TREE_CODE (step) != INTEGER_CST)
        return false;
    }
  else
    /* The step for pointer arithmetics already is 1 byte.  */
    step = build_int_cst (sizetype, 1);

  /* Work on copies so that the iv itself is not modified by the
     conversion.  */
  iv_base = iv->base;
  iv_step = iv->step;
  if (!convert_affine_scev (dta->ivopts_data->current_loop,
                            sizetype, &iv_base, &iv_step, dta->stmt,
                            false))
    {
      /* The index might wrap.  */
      return false;
    }

  /* The contribution of this index is element size times the iv step.  */
  step = fold_build2 (MULT_EXPR, sizetype, step, iv_step);

  if (!*dta->step_p)
    *dta->step_p = step;
  else
    *dta->step_p = fold_build2 (PLUS_EXPR, sizetype, *dta->step_p, step);

  return true;
}
1416
1417 /* Records use in index IDX.  Callback for for_each_index.  Ivopts data
1418    object is passed to it in DATA.  */
1419
1420 static bool
1421 idx_record_use (tree base, tree *idx,
1422                 void *data)
1423 {
1424   find_interesting_uses_op (data, *idx);
1425   if (TREE_CODE (base) == ARRAY_REF)
1426     {
1427       find_interesting_uses_op (data, array_ref_element_size (base));
1428       find_interesting_uses_op (data, array_ref_low_bound (base));
1429     }
1430   return true;
1431 }
1432
1433 /* Returns true if memory reference REF may be unaligned.  */
1434
1435 static bool
1436 may_be_unaligned_p (tree ref)
1437 {
1438   tree base;
1439   tree base_type;
1440   HOST_WIDE_INT bitsize;
1441   HOST_WIDE_INT bitpos;
1442   tree toffset;
1443   enum machine_mode mode;
1444   int unsignedp, volatilep;
1445   unsigned base_align;
1446
1447   /* TARGET_MEM_REFs are translated directly to valid MEMs on the target,
1448      thus they are not misaligned.  */
1449   if (TREE_CODE (ref) == TARGET_MEM_REF)
1450     return false;
1451
1452   /* The test below is basically copy of what expr.c:normal_inner_ref
1453      does to check whether the object must be loaded by parts when
1454      STRICT_ALIGNMENT is true.  */
1455   base = get_inner_reference (ref, &bitsize, &bitpos, &toffset, &mode,
1456                               &unsignedp, &volatilep, true);
1457   base_type = TREE_TYPE (base);
1458   base_align = TYPE_ALIGN (base_type);
1459
1460   if (mode != BLKmode
1461       && (base_align < GET_MODE_ALIGNMENT (mode)
1462           || bitpos % GET_MODE_ALIGNMENT (mode) != 0
1463           || bitpos % BITS_PER_UNIT != 0))
1464     return true;
1465
1466   return false;
1467 }
1468
1469 /* Return true if EXPR may be non-addressable.   */
1470
1471 static bool
1472 may_be_nonaddressable_p (tree expr)
1473 {
1474   switch (TREE_CODE (expr))
1475     {
1476     case COMPONENT_REF:
1477       return DECL_NONADDRESSABLE_P (TREE_OPERAND (expr, 1))
1478              || may_be_nonaddressable_p (TREE_OPERAND (expr, 0));
1479
1480     case ARRAY_REF:
1481     case ARRAY_RANGE_REF:
1482       return may_be_nonaddressable_p (TREE_OPERAND (expr, 0));
1483
1484     case VIEW_CONVERT_EXPR:
1485       /* This kind of view-conversions may wrap non-addressable objects
1486          and make them look addressable.  After some processing the
1487          non-addressability may be uncovered again, causing ADDR_EXPRs
1488          of inappropriate objects to be built.  */
1489       return AGGREGATE_TYPE_P (TREE_TYPE (expr))
1490              && !AGGREGATE_TYPE_P (TREE_TYPE (TREE_OPERAND (expr, 0)));
1491
1492     default:
1493       break;
1494     }
1495
1496   return false;
1497 }
1498
/* Finds addresses in *OP_P inside STMT.

   Tries to describe the address of the memory reference *OP_P as an iv
   (base address and step) and, on success, records it as a USE_ADDRESS
   use.  The work is done on an unshared copy of the reference; *OP_P itself
   is not modified here.  If the reference cannot be handled, the indices
   in *OP_P are recorded as ordinary uses through idx_record_use
   instead.  */

static void
find_interesting_uses_address (struct ivopts_data *data, tree stmt, tree *op_p)
{
  tree base = *op_p, step = NULL;
  struct iv *civ;
  struct ifs_ivopts_data ifs_ivopts_data;

  /* Do not play with volatile memory references.  A bit too conservative,
     perhaps, but safe.  */
  if (stmt_ann (stmt)->has_volatile_ops)
    goto fail;

  /* Ignore bitfields for now.  Not really something terribly complicated
     to handle.  TODO.  */
  if (TREE_CODE (base) == BIT_FIELD_REF)
    goto fail;

  if (may_be_nonaddressable_p (base))
    goto fail;

  if (STRICT_ALIGNMENT
      && may_be_unaligned_p (base))
    goto fail;

  /* The ivs' bases are substituted into the reference below, so work on a
     private copy.  */
  base = unshare_expr (base);

  if (TREE_CODE (base) == TARGET_MEM_REF)
    {
      tree type = build_pointer_type (TREE_TYPE (base));
      tree astep;

      /* Replace an ssa name base by the initial value of its iv; its step
         starts the accumulated step.  */
      if (TMR_BASE (base)
          && TREE_CODE (TMR_BASE (base)) == SSA_NAME)
        {
          civ = get_iv (data, TMR_BASE (base));
          if (!civ)
            goto fail;

          TMR_BASE (base) = civ->base;
          step = civ->step;
        }
      /* Likewise for the index; its step is scaled by TMR_STEP, if there
         is one, before it is added to the accumulated step.  */
      if (TMR_INDEX (base)
          && TREE_CODE (TMR_INDEX (base)) == SSA_NAME)
        {
          civ = get_iv (data, TMR_INDEX (base));
          if (!civ)
            goto fail;

          TMR_INDEX (base) = civ->base;
          astep = civ->step;

          if (astep)
            {
              if (TMR_STEP (base))
                astep = fold_build2 (MULT_EXPR, type, TMR_STEP (base), astep);

              if (step)
                step = fold_build2 (PLUS_EXPR, type, step, astep);
              else
                step = astep;
            }
        }

      /* An address that does not change in the loop is not an interesting
         address use.  */
      if (zero_p (step))
        goto fail;
      base = tree_mem_ref_addr (type, base);
    }
  else
    {
      /* Let idx_find_step replace every index by its initial value and
         accumulate the overall step in STEP.  */
      ifs_ivopts_data.ivopts_data = data;
      ifs_ivopts_data.stmt = stmt;
      ifs_ivopts_data.step_p = &step;
      if (!for_each_index (&base, idx_find_step, &ifs_ivopts_data)
          || zero_p (step))
        goto fail;

      gcc_assert (TREE_CODE (base) != ALIGN_INDIRECT_REF);
      gcc_assert (TREE_CODE (base) != MISALIGNED_INDIRECT_REF);

      base = build_fold_addr_expr (base);

      /* Substituting bases of IVs into the base expression might
         have caused folding opportunities.  */
      if (TREE_CODE (base) == ADDR_EXPR)
        {
          tree *ref = &TREE_OPERAND (base, 0);
          while (handled_component_p (*ref))
            ref = &TREE_OPERAND (*ref, 0);
          if (TREE_CODE (*ref) == INDIRECT_REF)
            *ref = fold_indirect_ref (*ref);
        }
    }

  civ = alloc_iv (base, step);
  record_use (data, op_p, civ, stmt, USE_ADDRESS);
  return;

fail:
  /* Fall back to recording the indices of the original reference as
     ordinary uses.  */
  for_each_index (op_p, idx_record_use, data);
}
1601
1602 /* Finds and records invariants used in STMT.  */
1603
1604 static void
1605 find_invariants_stmt (struct ivopts_data *data, tree stmt)
1606 {
1607   ssa_op_iter iter;
1608   use_operand_p use_p;
1609   tree op;
1610
1611   FOR_EACH_PHI_OR_STMT_USE (use_p, stmt, iter, SSA_OP_USE)
1612     {
1613       op = USE_FROM_PTR (use_p);
1614       record_invariant (data, op, false);
1615     }
1616 }
1617
1618 /* Finds interesting uses of induction variables in the statement STMT.  */
1619
1620 static void
1621 find_interesting_uses_stmt (struct ivopts_data *data, tree stmt)
1622 {
1623   struct iv *iv;
1624   tree op, lhs, rhs;
1625   ssa_op_iter iter;
1626   use_operand_p use_p;
1627
1628   find_invariants_stmt (data, stmt);
1629
1630   if (TREE_CODE (stmt) == COND_EXPR)
1631     {
1632       find_interesting_uses_cond (data, stmt, &COND_EXPR_COND (stmt));
1633       return;
1634     }
1635
1636   if (TREE_CODE (stmt) == MODIFY_EXPR)
1637     {
1638       lhs = TREE_OPERAND (stmt, 0);
1639       rhs = TREE_OPERAND (stmt, 1);
1640
1641       if (TREE_CODE (lhs) == SSA_NAME)
1642         {
1643           /* If the statement defines an induction variable, the uses are not
1644              interesting by themselves.  */
1645
1646           iv = get_iv (data, lhs);
1647
1648           if (iv && !zero_p (iv->step))
1649             return;
1650         }
1651
1652       switch (TREE_CODE_CLASS (TREE_CODE (rhs)))
1653         {
1654         case tcc_comparison:
1655           find_interesting_uses_cond (data, stmt, &TREE_OPERAND (stmt, 1));
1656           return;
1657
1658         case tcc_reference:
1659           find_interesting_uses_address (data, stmt, &TREE_OPERAND (stmt, 1));
1660           if (REFERENCE_CLASS_P (lhs))
1661             find_interesting_uses_address (data, stmt, &TREE_OPERAND (stmt, 0));
1662           return;
1663
1664         default: ;
1665         }
1666
1667       if (REFERENCE_CLASS_P (lhs)
1668           && is_gimple_val (rhs))
1669         {
1670           find_interesting_uses_address (data, stmt, &TREE_OPERAND (stmt, 0));
1671           find_interesting_uses_op (data, rhs);
1672           return;
1673         }
1674
1675       /* TODO -- we should also handle address uses of type
1676
1677          memory = call (whatever);
1678
1679          and
1680
1681          call (memory).  */
1682     }
1683
1684   if (TREE_CODE (stmt) == PHI_NODE
1685       && bb_for_stmt (stmt) == data->current_loop->header)
1686     {
1687       lhs = PHI_RESULT (stmt);
1688       iv = get_iv (data, lhs);
1689
1690       if (iv && !zero_p (iv->step))
1691         return;
1692     }
1693
1694   FOR_EACH_PHI_OR_STMT_USE (use_p, stmt, iter, SSA_OP_USE)
1695     {
1696       op = USE_FROM_PTR (use_p);
1697
1698       if (TREE_CODE (op) != SSA_NAME)
1699         continue;
1700
1701       iv = get_iv (data, op);
1702       if (!iv)
1703         continue;
1704
1705       find_interesting_uses_op (data, op);
1706     }
1707 }
1708
1709 /* Finds interesting uses of induction variables outside of loops
1710    on loop exit edge EXIT.  */
1711
1712 static void
1713 find_interesting_uses_outside (struct ivopts_data *data, edge exit)
1714 {
1715   tree phi, def;
1716
1717   for (phi = phi_nodes (exit->dest); phi; phi = PHI_CHAIN (phi))
1718     {
1719       def = PHI_ARG_DEF_FROM_EDGE (phi, exit);
1720       find_interesting_uses_op (data, def);
1721     }
1722 }
1723
1724 /* Finds uses of the induction variables that are interesting.  */
1725
1726 static void
1727 find_interesting_uses (struct ivopts_data *data)
1728 {
1729   basic_block bb;
1730   block_stmt_iterator bsi;
1731   tree phi;
1732   basic_block *body = get_loop_body (data->current_loop);
1733   unsigned i;
1734   struct version_info *info;
1735   edge e;
1736
1737   if (dump_file && (dump_flags & TDF_DETAILS))
1738     fprintf (dump_file, "Uses:\n\n");
1739
1740   for (i = 0; i < data->current_loop->num_nodes; i++)
1741     {
1742       edge_iterator ei;
1743       bb = body[i];
1744
1745       FOR_EACH_EDGE (e, ei, bb->succs)
1746         if (e->dest != EXIT_BLOCK_PTR
1747             && !flow_bb_inside_loop_p (data->current_loop, e->dest))
1748           find_interesting_uses_outside (data, e);
1749
1750       for (phi = phi_nodes (bb); phi; phi = PHI_CHAIN (phi))
1751         find_interesting_uses_stmt (data, phi);
1752       for (bsi = bsi_start (bb); !bsi_end_p (bsi); bsi_next (&bsi))
1753         find_interesting_uses_stmt (data, bsi_stmt (bsi));
1754     }
1755
1756   if (dump_file && (dump_flags & TDF_DETAILS))
1757     {
1758       bitmap_iterator bi;
1759
1760       fprintf (dump_file, "\n");
1761
1762       EXECUTE_IF_SET_IN_BITMAP (data->relevant, 0, i, bi)
1763         {
1764           info = ver_info (data, i);
1765           if (info->inv_id)
1766             {
1767               fprintf (dump_file, "  ");
1768               print_generic_expr (dump_file, info->name, TDF_SLIM);
1769               fprintf (dump_file, " is invariant (%d)%s\n",
1770                        info->inv_id, info->has_nonlin_use ? "" : ", eliminable");
1771             }
1772         }
1773
1774       fprintf (dump_file, "\n");
1775     }
1776
1777   free (body);
1778 }
1779
/* Strips constant offsets from EXPR and stores them to OFFSET.  If INSIDE_ADDR
   is true, assume we are inside an address.  If TOP_COMPREF is true, assume
   we are at the top-level of the processed address.

   Returns the expression with the constant part removed, converted back to
   the type of EXPR in most cases; when nothing could be stripped, EXPR
   itself is returned.  *OFFSET is always set (to zero if nothing was
   stripped).  */

static tree
strip_offset_1 (tree expr, bool inside_addr, bool top_compref,
                unsigned HOST_WIDE_INT *offset)
{
  tree op0 = NULL_TREE, op1 = NULL_TREE, tmp, step;
  enum tree_code code;
  tree type, orig_type = TREE_TYPE (expr);
  unsigned HOST_WIDE_INT off0, off1, st;
  tree orig_expr = expr;

  STRIP_NOPS (expr);

  type = TREE_TYPE (expr);
  code = TREE_CODE (expr);
  *offset = 0;

  switch (code)
    {
    case INTEGER_CST:
      /* A nonzero constant that fits is entirely offset; what remains is
         zero of the original type.  */
      if (!cst_and_fits_in_hwi (expr)
          || zero_p (expr))
        return orig_expr;

      *offset = int_cst_value (expr);
      return build_int_cst (orig_type, 0);

    case PLUS_EXPR:
    case MINUS_EXPR:
      /* Strip both operands and combine their offsets according to the
         operation.  */
      op0 = TREE_OPERAND (expr, 0);
      op1 = TREE_OPERAND (expr, 1);

      op0 = strip_offset_1 (op0, false, false, &off0);
      op1 = strip_offset_1 (op1, false, false, &off1);

      *offset = (code == PLUS_EXPR ? off0 + off1 : off0 - off1);
      if (op0 == TREE_OPERAND (expr, 0)
          && op1 == TREE_OPERAND (expr, 1))
        return orig_expr;

      /* Rebuild the expression, dropping operands that became zero.  */
      if (zero_p (op1))
        expr = op0;
      else if (zero_p (op0))
        {
          if (code == PLUS_EXPR)
            expr = op1;
          else
            expr = fold_build1 (NEGATE_EXPR, type, op1);
        }
      else
        expr = fold_build2 (code, type, op0, op1);

      return fold_convert (orig_type, expr);

    case ARRAY_REF:
      if (!inside_addr)
        return orig_expr;

      /* Without a usable constant element size only the base object is
         processed, by the common code after the switch.  */
      step = array_ref_element_size (expr);
      if (!cst_and_fits_in_hwi (step))
        break;

      /* The constant part of the index, scaled by the element size,
         becomes part of the offset.  */
      st = int_cst_value (step);
      op1 = TREE_OPERAND (expr, 1);
      op1 = strip_offset_1 (op1, false, false, &off1);
      *offset = off1 * st;

      if (top_compref
          && zero_p (op1))
        {
          /* Strip the component reference completely.  */
          op0 = TREE_OPERAND (expr, 0);
          op0 = strip_offset_1 (op0, inside_addr, top_compref, &off0);
          *offset += off0;
          return op0;
        }
      break;

    case COMPONENT_REF:
      if (!inside_addr)
        return orig_expr;

      tmp = component_ref_field_offset (expr);
      if (top_compref
          && cst_and_fits_in_hwi (tmp))
        {
          /* Strip the component reference completely.  */
          op0 = TREE_OPERAND (expr, 0);
          op0 = strip_offset_1 (op0, inside_addr, top_compref, &off0);
          *offset = off0 + int_cst_value (tmp);
          return op0;
        }
      break;

    case ADDR_EXPR:
      /* The operand is processed as the top level of an address.  */
      op0 = TREE_OPERAND (expr, 0);
      op0 = strip_offset_1 (op0, true, true, &off0);
      *offset += off0;

      if (op0 == TREE_OPERAND (expr, 0))
        return orig_expr;

      expr = build_fold_addr_expr (op0);
      return fold_convert (orig_type, expr);

    case INDIRECT_REF:
      /* The operand of a dereference is a value, not part of the
         address.  */
      inside_addr = false;
      break;

    default:
      return orig_expr;
    }

  /* Default handling of expressions for that we want to recurse into
     the first operand.  */
  op0 = TREE_OPERAND (expr, 0);
  op0 = strip_offset_1 (op0, inside_addr, false, &off0);
  *offset += off0;

  /* OP1 is non-NULL only if the ARRAY_REF case stripped the index.  */
  if (op0 == TREE_OPERAND (expr, 0)
      && (!op1 || op1 == TREE_OPERAND (expr, 1)))
    return orig_expr;

  /* Modify a copy, so that the original expression stays intact.  */
  expr = copy_node (expr);
  TREE_OPERAND (expr, 0) = op0;
  if (op1)
    TREE_OPERAND (expr, 1) = op1;

  /* Inside address, we might strip the top level component references,
     thus changing type of the expression.  Handling of ADDR_EXPR
     will fix that.  */
  expr = fold_convert (orig_type, expr);

  return expr;
}
1918
1919 /* Strips constant offsets from EXPR and stores them to OFFSET.  */
1920
1921 static tree
1922 strip_offset (tree expr, unsigned HOST_WIDE_INT *offset)
1923 {
1924   return strip_offset_1 (expr, false, false, offset);
1925 }
1926
1927 /* Returns variant of TYPE that can be used as base for different uses.
1928    For integer types, we return unsigned variant of the type, which
1929    avoids problems with overflows.  For pointer types, we return void *.  */
1930
1931 static tree
1932 generic_type_for (tree type)
1933 {
1934   if (POINTER_TYPE_P (type))
1935     return ptr_type_node;
1936
1937   if (TYPE_UNSIGNED (type))
1938     return type;
1939
1940   return unsigned_type_for (type);
1941 }
1942
1943 /* Records invariants in *EXPR_P.  Callback for walk_tree.  DATA contains
1944    the bitmap to that we should store it.  */
1945
1946 static struct ivopts_data *fd_ivopts_data;
1947 static tree
1948 find_depends (tree *expr_p, int *ws ATTRIBUTE_UNUSED, void *data)
1949 {
1950   bitmap *depends_on = data;
1951   struct version_info *info;
1952
1953   if (TREE_CODE (*expr_p) != SSA_NAME)
1954     return NULL_TREE;
1955   info = name_info (fd_ivopts_data, *expr_p);
1956
1957   if (!info->inv_id || info->has_nonlin_use)
1958     return NULL_TREE;
1959
1960   if (!*depends_on)
1961     *depends_on = BITMAP_ALLOC (NULL);
1962   bitmap_set_bit (*depends_on, info->inv_id);
1963
1964   return NULL_TREE;
1965 }
1966
/* Adds a candidate BASE + STEP * i.  Important field is set to IMPORTANT and
   position to POS.  If USE is not NULL, the candidate is set as related to
   it.  If both BASE and STEP are NULL, we add a pseudocandidate for the
   replacement of the final value of the iv by a direct computation.

   INCREMENTED_AT is stored in the candidate and takes part in deciding
   whether an equal candidate exists already.  If one does, it is reused
   (and possibly upgraded to important) instead of creating a new one.
   Returns the candidate.  */

static struct iv_cand *
add_candidate_1 (struct ivopts_data *data,
                 tree base, tree step, bool important, enum iv_position pos,
                 struct iv_use *use, tree incremented_at)
{
  unsigned i;
  struct iv_cand *cand = NULL;
  tree type, orig_type;

  /* Candidates are kept in the generic variant of the type of BASE.  */
  if (base)
    {
      orig_type = TREE_TYPE (base);
      type = generic_type_for (orig_type);
      if (type != orig_type)
        {
          base = fold_convert (type, base);
          if (step)
            step = fold_convert (type, step);
        }
    }

  /* Look for an existing candidate with the same position, increment
     statement, base and step.  If the loop stops early, I is the index of
     the match and CAND the matching candidate.  */
  for (i = 0; i < n_iv_cands (data); i++)
    {
      cand = iv_cand (data, i);

      if (cand->pos != pos)
        continue;

      if (cand->incremented_at != incremented_at)
        continue;

      /* A candidate without an iv is a pseudocandidate; it only matches a
         request for a pseudocandidate.  */
      if (!cand->iv)
        {
          if (!base && !step)
            break;

          continue;
        }

      if (!base && !step)
        continue;

      if (!operand_equal_p (base, cand->iv->base, 0))
        continue;

      /* Steps are equal if both are zero (or missing) or if they are the
         same expression.  */
      if (zero_p (cand->iv->step))
        {
          if (zero_p (step))
            break;
        }
      else
        {
          if (step && operand_equal_p (step, cand->iv->step, 0))
            break;
        }
    }

  /* Nothing matched: create a new candidate.  Its id equals its index I
     in the vector of candidates.  */
  if (i == n_iv_cands (data))
    {
      cand = XCNEW (struct iv_cand);
      cand->id = i;

      if (!base && !step)
        cand->iv = NULL;
      else
        cand->iv = alloc_iv (base, step);

      cand->pos = pos;
      /* Candidates other than IP_ORIGINAL ones get a fresh temporary,
         used both before and after the increment.  */
      if (pos != IP_ORIGINAL && cand->iv)
        {
          cand->var_before = create_tmp_var_raw (TREE_TYPE (base), "ivtmp");
          cand->var_after = cand->var_before;
        }
      cand->important = important;
      cand->incremented_at = incremented_at;
      VEC_safe_push (iv_cand_p, heap, data->iv_candidates, cand);

      /* Record the invariants a non-constant step depends on;
         find_depends reads the ivopts data from fd_ivopts_data.  */
      if (step
          && TREE_CODE (step) != INTEGER_CST)
        {
          fd_ivopts_data = data;
          walk_tree (&step, find_depends, &cand->depends_on, NULL);
        }

      if (dump_file && (dump_flags & TDF_DETAILS))
        dump_cand (dump_file, cand);
    }

  /* An existing candidate may become important, but never loses that
     property.  */
  if (important && !cand->important)
    {
      cand->important = true;
      if (dump_file && (dump_flags & TDF_DETAILS))
        fprintf (dump_file, "Candidate %d is important\n", cand->id);
    }

  if (use)
    {
      /* I is the index of CAND, whether it was found or newly created.  */
      bitmap_set_bit (use->related_cands, i);
      if (dump_file && (dump_flags & TDF_DETAILS))
        fprintf (dump_file, "Candidate %d is related to use %d\n",
                 cand->id, use->id);
    }

  return cand;
}
2077
2078 /* Returns true if incrementing the induction variable at the end of the LOOP
2079    is allowed.
2080
2081    The purpose is to avoid splitting latch edge with a biv increment, thus
2082    creating a jump, possibly confusing other optimization passes and leaving
2083    less freedom to scheduler.  So we allow IP_END_POS only if IP_NORMAL_POS
2084    is not available (so we do not have a better alternative), or if the latch
2085    edge is already nonempty.  */
2086
2087 static bool
2088 allow_ip_end_pos_p (struct loop *loop)
2089 {
2090   if (!ip_normal_pos (loop))
2091     return true;
2092
2093   if (!empty_block_p (ip_end_pos (loop)))
2094     return true;
2095
2096   return false;
2097 }
2098
2099 /* Adds a candidate BASE + STEP * i.  Important field is set to IMPORTANT and
2100    position to POS.  If USE is not NULL, the candidate is set as related to
2101    it.  The candidate computation is scheduled on all available positions.  */
2102
2103 static void
2104 add_candidate (struct ivopts_data *data,
2105                tree base, tree step, bool important, struct iv_use *use)
2106 {
2107   if (ip_normal_pos (data->current_loop))
2108     add_candidate_1 (data, base, step, important, IP_NORMAL, use, NULL_TREE);
2109   if (ip_end_pos (data->current_loop)
2110       && allow_ip_end_pos_p (data->current_loop))
2111     add_candidate_1 (data, base, step, important, IP_END, use, NULL_TREE);
2112 }
2113
2114 /* Add a standard "0 + 1 * iteration" iv candidate for a
2115    type with SIZE bits.  */
2116
2117 static void
2118 add_standard_iv_candidates_for_size (struct ivopts_data *data,
2119                                      unsigned int size)
2120 {
2121   tree type = lang_hooks.types.type_for_size (size, true);
2122   add_candidate (data, build_int_cst (type, 0), build_int_cst (type, 1),
2123                  true, NULL);
2124 }
2125
2126 /* Adds standard iv candidates.  */
2127
2128 static void
2129 add_standard_iv_candidates (struct ivopts_data *data)
2130 {
2131   add_standard_iv_candidates_for_size (data, INT_TYPE_SIZE);
2132
2133   /* The same for a double-integer type if it is still fast enough.  */
2134   if (BITS_PER_WORD >= INT_TYPE_SIZE * 2)
2135     add_standard_iv_candidates_for_size (data, INT_TYPE_SIZE * 2);
2136 }
2137
2138
2139 /* Adds candidates bases on the old induction variable IV.  */
2140
2141 static void
2142 add_old_iv_candidates (struct ivopts_data *data, struct iv *iv)
2143 {
2144   tree phi, def;
2145   struct iv_cand *cand;
2146
2147   add_candidate (data, iv->base, iv->step, true, NULL);
2148
2149   /* The same, but with initial value zero.  */
2150   add_candidate (data,
2151                  build_int_cst (TREE_TYPE (iv->base), 0),
2152                  iv->step, true, NULL);
2153
2154   phi = SSA_NAME_DEF_STMT (iv->ssa_name);
2155   if (TREE_CODE (phi) == PHI_NODE)
2156     {
2157       /* Additionally record the possibility of leaving the original iv
2158          untouched.  */
2159       def = PHI_ARG_DEF_FROM_EDGE (phi, loop_latch_edge (data->current_loop));
2160       cand = add_candidate_1 (data,
2161                               iv->base, iv->step, true, IP_ORIGINAL, NULL,
2162                               SSA_NAME_DEF_STMT (def));
2163       cand->var_before = iv->ssa_name;
2164       cand->var_after = def;
2165     }
2166 }
2167
2168 /* Adds candidates based on the old induction variables.  */
2169
2170 static void
2171 add_old_ivs_candidates (struct ivopts_data *data)
2172 {
2173   unsigned i;
2174   struct iv *iv;
2175   bitmap_iterator bi;
2176
2177   EXECUTE_IF_SET_IN_BITMAP (data->relevant, 0, i, bi)
2178     {
2179       iv = ver_info (data, i)->iv;
2180       if (iv && iv->biv_p && !zero_p (iv->step))
2181         add_old_iv_candidates (data, iv);
2182     }
2183 }
2184
2185 /* Adds candidates based on the value of the induction variable IV and USE.  */
2186
2187 static void
2188 add_iv_value_candidates (struct ivopts_data *data,
2189                          struct iv *iv, struct iv_use *use)
2190 {
2191   unsigned HOST_WIDE_INT offset;
2192   tree base;
2193
2194   add_candidate (data, iv->base, iv->step, false, use);
2195
2196   /* The same, but with initial value zero.  Make such variable important,
2197      since it is generic enough so that possibly many uses may be based
2198      on it.  */
2199   add_candidate (data, build_int_cst (TREE_TYPE (iv->base), 0),
2200                  iv->step, true, use);
2201
2202   /* Third, try removing the constant offset.  */
2203   base = strip_offset (iv->base, &offset);
2204   if (offset)
2205     add_candidate (data, base, iv->step, false, use);
2206 }
2207
2208 /* Adds candidates based on the uses.  */
2209
2210 static void
2211 add_derived_ivs_candidates (struct ivopts_data *data)
2212 {
2213   unsigned i;
2214
2215   for (i = 0; i < n_iv_uses (data); i++)
2216     {
2217       struct iv_use *use = iv_use (data, i);
2218
2219       if (!use)
2220         continue;
2221
2222       switch (use->type)
2223         {
2224         case USE_NONLINEAR_EXPR:
2225         case USE_COMPARE:
2226         case USE_ADDRESS:
2227           /* Just add the ivs based on the value of the iv used here.  */
2228           add_iv_value_candidates (data, use->iv, use);
2229           break;
2230
2231         default:
2232           gcc_unreachable ();
2233         }
2234     }
2235 }
2236
2237 /* Record important candidates and add them to related_cands bitmaps
2238    if needed.  */
2239
2240 static void
2241 record_important_candidates (struct ivopts_data *data)
2242 {
2243   unsigned i;
2244   struct iv_use *use;
2245
2246   for (i = 0; i < n_iv_cands (data); i++)
2247     {
2248       struct iv_cand *cand = iv_cand (data, i);
2249
2250       if (cand->important)
2251         bitmap_set_bit (data->important_candidates, i);
2252     }
2253
2254   data->consider_all_candidates = (n_iv_cands (data)
2255                                    <= CONSIDER_ALL_CANDIDATES_BOUND);
2256
2257   if (data->consider_all_candidates)
2258     {
2259       /* We will not need "related_cands" bitmaps in this case,
2260          so release them to decrease peak memory consumption.  */
2261       for (i = 0; i < n_iv_uses (data); i++)
2262         {
2263           use = iv_use (data, i);
2264           BITMAP_FREE (use->related_cands);
2265         }
2266     }
2267   else
2268     {
2269       /* Add important candidates to the related_cands bitmaps.  */
2270       for (i = 0; i < n_iv_uses (data); i++)
2271         bitmap_ior_into (iv_use (data, i)->related_cands,
2272                          data->important_candidates);
2273     }
2274 }
2275
/* Builds the set of induction variable candidates for DATA.  */

static void
find_iv_candidates (struct ivopts_data *data)
{
  /* Candidates come from three sources, in this order: the commonly used
     standard ivs, the old induction variables, and the ivs derived from
     the uses.  */
  add_standard_iv_candidates (data);
  add_old_ivs_candidates (data);
  add_derived_ivs_candidates (data);

  /* Once all candidates are known, record the important ones.  */
  record_important_candidates (data);
}
2293
2294 /* Allocates the data structure mapping the (use, candidate) pairs to costs.
2295    If consider_all_candidates is true, we use a two-dimensional array, otherwise
2296    we allocate a simple list to every use.  */
2297
2298 static void
2299 alloc_use_cost_map (struct ivopts_data *data)
2300 {
2301   unsigned i, size, s, j;
2302
2303   for (i = 0; i < n_iv_uses (data); i++)
2304     {
2305       struct iv_use *use = iv_use (data, i);
2306       bitmap_iterator bi;
2307
2308       if (data->consider_all_candidates)
2309         size = n_iv_cands (data);
2310       else
2311         {
2312           s = 0;
2313           EXECUTE_IF_SET_IN_BITMAP (use->related_cands, 0, j, bi)
2314             {
2315               s++;
2316             }
2317
2318           /* Round up to the power of two, so that moduling by it is fast.  */
2319           for (size = 1; size < s; size <<= 1)
2320             continue;
2321         }
2322
2323       use->n_map_members = size;
2324       use->cost_map = XCNEWVEC (struct cost_pair, size);
2325     }
2326 }
2327
2328 /* Sets cost of (USE, CANDIDATE) pair to COST and record that it depends
2329    on invariants DEPENDS_ON and that the value used in expressing it
2330    is VALUE.*/
2331
2332 static void
2333 set_use_iv_cost (struct ivopts_data *data,
2334                  struct iv_use *use, struct iv_cand *cand, unsigned cost,
2335                  bitmap depends_on, tree value)
2336 {
2337   unsigned i, s;
2338
2339   if (cost == INFTY)
2340     {
2341       BITMAP_FREE (depends_on);
2342       return;
2343     }
2344
2345   if (data->consider_all_candidates)
2346     {
2347       use->cost_map[cand->id].cand = cand;
2348       use->cost_map[cand->id].cost = cost;
2349       use->cost_map[cand->id].depends_on = depends_on;
2350       use->cost_map[cand->id].value = value;
2351       return;
2352     }
2353
2354   /* n_map_members is a power of two, so this computes modulo.  */
2355   s = cand->id & (use->n_map_members - 1);
2356   for (i = s; i < use->n_map_members; i++)
2357     if (!use->cost_map[i].cand)
2358       goto found;
2359   for (i = 0; i < s; i++)
2360     if (!use->cost_map[i].cand)
2361       goto found;
2362
2363   gcc_unreachable ();
2364
2365 found:
2366   use->cost_map[i].cand = cand;
2367   use->cost_map[i].cost = cost;
2368   use->cost_map[i].depends_on = depends_on;
2369   use->cost_map[i].value = value;
2370 }
2371
2372 /* Gets cost of (USE, CANDIDATE) pair.  */
2373
2374 static struct cost_pair *
2375 get_use_iv_cost (struct ivopts_data *data, struct iv_use *use,
2376                  struct iv_cand *cand)
2377 {
2378   unsigned i, s;
2379   struct cost_pair *ret;
2380
2381   if (!cand)
2382     return NULL;
2383
2384   if (data->consider_all_candidates)
2385     {
2386       ret = use->cost_map + cand->id;
2387       if (!ret->cand)
2388         return NULL;
2389
2390       return ret;
2391     }
2392
2393   /* n_map_members is a power of two, so this computes modulo.  */
2394   s = cand->id & (use->n_map_members - 1);
2395   for (i = s; i < use->n_map_members; i++)
2396     if (use->cost_map[i].cand == cand)
2397       return use->cost_map + i;
2398
2399   for (i = 0; i < s; i++)
2400     if (use->cost_map[i].cand == cand)
2401       return use->cost_map + i;
2402
2403   return NULL;
2404 }
2405
2406 /* Returns estimate on cost of computing SEQ.  */
2407
2408 static unsigned
2409 seq_cost (rtx seq)
2410 {
2411   unsigned cost = 0;
2412   rtx set;
2413
2414   for (; seq; seq = NEXT_INSN (seq))
2415     {
2416       set = single_set (seq);
2417       if (set)
2418         cost += rtx_cost (set, SET);
2419       else
2420         cost++;
2421     }
2422
2423   return cost;
2424 }
2425
2426 /* Produce DECL_RTL for object obj so it looks like it is stored in memory.  */
2427 static rtx
2428 produce_memory_decl_rtl (tree obj, int *regno)
2429 {
2430   rtx x;
2431
2432   gcc_assert (obj);
2433   if (TREE_STATIC (obj) || DECL_EXTERNAL (obj))
2434     {
2435       const char *name = IDENTIFIER_POINTER (DECL_ASSEMBLER_NAME (obj));
2436       x = gen_rtx_SYMBOL_REF (Pmode, name);
2437     }
2438   else
2439     x = gen_raw_REG (Pmode, (*regno)++);
2440
2441   return gen_rtx_MEM (DECL_MODE (obj), x);
2442 }
2443
2444 /* Prepares decl_rtl for variables referred in *EXPR_P.  Callback for
2445    walk_tree.  DATA contains the actual fake register number.  */
2446
2447 static tree
2448 prepare_decl_rtl (tree *expr_p, int *ws, void *data)
2449 {
2450   tree obj = NULL_TREE;
2451   rtx x = NULL_RTX;
2452   int *regno = data;
2453
2454   switch (TREE_CODE (*expr_p))
2455     {
2456     case ADDR_EXPR:
2457       for (expr_p = &TREE_OPERAND (*expr_p, 0);
2458            handled_component_p (*expr_p);
2459            expr_p = &TREE_OPERAND (*expr_p, 0))
2460         continue;
2461       obj = *expr_p;
2462       if (DECL_P (obj) && !DECL_RTL_SET_P (obj))
2463         x = produce_memory_decl_rtl (obj, regno);
2464       break;
2465
2466     case SSA_NAME:
2467       *ws = 0;
2468       obj = SSA_NAME_VAR (*expr_p);
2469       if (!DECL_RTL_SET_P (obj))
2470         x = gen_raw_REG (DECL_MODE (obj), (*regno)++);
2471       break;
2472
2473     case VAR_DECL:
2474     case PARM_DECL:
2475     case RESULT_DECL:
2476       *ws = 0;
2477       obj = *expr_p;
2478
2479       if (DECL_RTL_SET_P (obj))
2480         break;
2481
2482       if (DECL_MODE (obj) == BLKmode)
2483         x = produce_memory_decl_rtl (obj, regno);
2484       else
2485         x = gen_raw_REG (DECL_MODE (obj), (*regno)++);
2486
2487       break;
2488
2489     default:
2490       break;
2491     }
2492
2493   if (x)
2494     {
2495       VEC_safe_push (tree, heap, decl_rtl_to_reset, obj);
2496       SET_DECL_RTL (obj, x);
2497     }
2498
2499   return NULL_TREE;
2500 }
2501
2502 /* Determines cost of the computation of EXPR.  */
2503
2504 static unsigned
2505 computation_cost (tree expr)
2506 {
2507   rtx seq, rslt;
2508   tree type = TREE_TYPE (expr);
2509   unsigned cost;
2510   /* Avoid using hard regs in ways which may be unsupported.  */
2511   int regno = LAST_VIRTUAL_REGISTER + 1;
2512
2513   walk_tree (&expr, prepare_decl_rtl, &regno, NULL);
2514   start_sequence ();
2515   rslt = expand_expr (expr, NULL_RTX, TYPE_MODE (type), EXPAND_NORMAL);
2516   seq = get_insns ();
2517   end_sequence ();
2518
2519   cost = seq_cost (seq);
2520   if (MEM_P (rslt))
2521     cost += address_cost (XEXP (rslt, 0), TYPE_MODE (type));
2522
2523   return cost;
2524 }
2525
2526 /* Returns variable containing the value of candidate CAND at statement AT.  */
2527
2528 static tree
2529 var_at_stmt (struct loop *loop, struct iv_cand *cand, tree stmt)
2530 {
2531   if (stmt_after_increment (loop, cand, stmt))
2532     return cand->var_after;
2533   else
2534     return cand->var_before;
2535 }
2536
2537 /* Return the most significant (sign) bit of T.  Similar to tree_int_cst_msb,
2538    but the bit is determined from TYPE_PRECISION, not MODE_BITSIZE.  */
2539
2540 int
2541 tree_int_cst_sign_bit (tree t)
2542 {
2543   unsigned bitno = TYPE_PRECISION (TREE_TYPE (t)) - 1;
2544   unsigned HOST_WIDE_INT w;
2545
2546   if (bitno < HOST_BITS_PER_WIDE_INT)
2547     w = TREE_INT_CST_LOW (t);
2548   else
2549     {
2550       w = TREE_INT_CST_HIGH (t);
2551       bitno -= HOST_BITS_PER_WIDE_INT;
2552     }
2553
2554   return (w >> bitno) & 1;
2555 }
2556
2557 /* If we can prove that TOP = cst * BOT for some constant cst in TYPE,
2558    return cst.  Otherwise return NULL_TREE.  */
2559
2560 static tree
2561 constant_multiple_of (tree type, tree top, tree bot)
2562 {
2563   tree res, mby, p0, p1;
2564   enum tree_code code;
2565   bool negate;
2566
2567   STRIP_NOPS (top);
2568   STRIP_NOPS (bot);
2569
2570   if (operand_equal_p (top, bot, 0))
2571     return build_int_cst (type, 1);
2572
2573   code = TREE_CODE (top);
2574   switch (code)
2575     {
2576     case MULT_EXPR:
2577       mby = TREE_OPERAND (top, 1);
2578       if (TREE_CODE (mby) != INTEGER_CST)
2579         return NULL_TREE;
2580
2581       res = constant_multiple_of (type, TREE_OPERAND (top, 0), bot);
2582       if (!res)
2583         return NULL_TREE;
2584
2585       return fold_binary_to_constant (MULT_EXPR, type, res,
2586                                       fold_convert (type, mby));
2587
2588     case PLUS_EXPR:
2589     case MINUS_EXPR:
2590       p0 = constant_multiple_of (type, TREE_OPERAND (top, 0), bot);
2591       if (!p0)
2592         return NULL_TREE;
2593       p1 = constant_multiple_of (type, TREE_OPERAND (top, 1), bot);
2594       if (!p1)
2595         return NULL_TREE;
2596
2597       return fold_binary_to_constant (code, type, p0, p1);
2598
2599     case INTEGER_CST:
2600       if (TREE_CODE (bot) != INTEGER_CST)
2601         return NULL_TREE;
2602
2603       bot = fold_convert (type, bot);
2604       top = fold_convert (type, top);
2605
2606       /* If BOT seems to be negative, try dividing by -BOT instead, and negate
2607          the result afterwards.  */
2608       if (tree_int_cst_sign_bit (bot))
2609         {
2610           negate = true;
2611           bot = fold_unary_to_constant (NEGATE_EXPR, type, bot);
2612         }
2613       else
2614         negate = false;
2615
2616       /* Ditto for TOP.  */
2617       if (tree_int_cst_sign_bit (top))
2618         {
2619           negate = !negate;
2620           top = fold_unary_to_constant (NEGATE_EXPR, type, top);
2621         }
2622
2623       if (!zero_p (fold_binary_to_constant (TRUNC_MOD_EXPR, type, top, bot)))
2624         return NULL_TREE;
2625
2626       res = fold_binary_to_constant (EXACT_DIV_EXPR, type, top, bot);
2627       if (negate)
2628         res = fold_unary_to_constant (NEGATE_EXPR, type, res);
2629       return res;
2630
2631     default:
2632       return NULL_TREE;
2633     }
2634 }
2635
2636 /* Sets COMB to CST.  */
2637
2638 static void
2639 aff_combination_const (struct affine_tree_combination *comb, tree type,
2640                        unsigned HOST_WIDE_INT cst)
2641 {
2642   unsigned prec = TYPE_PRECISION (type);
2643
2644   comb->type = type;
2645   comb->mask = (((unsigned HOST_WIDE_INT) 2 << (prec - 1)) - 1);
2646
2647   comb->n = 0;
2648   comb->rest = NULL_TREE;
2649   comb->offset = cst & comb->mask;
2650 }
2651
2652 /* Sets COMB to single element ELT.  */
2653
2654 static void
2655 aff_combination_elt (struct affine_tree_combination *comb, tree type, tree elt)
2656 {
2657   unsigned prec = TYPE_PRECISION (type);
2658
2659   comb->type = type;
2660   comb->mask = (((unsigned HOST_WIDE_INT) 2 << (prec - 1)) - 1);
2661
2662   comb->n = 1;
2663   comb->elts[0] = elt;
2664   comb->coefs[0] = 1;
2665   comb->rest = NULL_TREE;
2666   comb->offset = 0;
2667 }
2668
2669 /* Scales COMB by SCALE.  */
2670
2671 static void
2672 aff_combination_scale (struct affine_tree_combination *comb,
2673                        unsigned HOST_WIDE_INT scale)
2674 {
2675   unsigned i, j;
2676
2677   if (scale == 1)
2678     return;
2679
2680   if (scale == 0)
2681     {
2682       aff_combination_const (comb, comb->type, 0);
2683       return;
2684     }
2685
2686   comb->offset = (scale * comb->offset) & comb->mask;
2687   for (i = 0, j = 0; i < comb->n; i++)
2688     {
2689       comb->coefs[j] = (scale * comb->coefs[i]) & comb->mask;
2690       comb->elts[j] = comb->elts[i];
2691       if (comb->coefs[j] != 0)
2692         j++;
2693     }
2694   comb->n = j;
2695
2696   if (comb->rest)
2697     {
2698       if (comb->n < MAX_AFF_ELTS)
2699         {
2700           comb->coefs[comb->n] = scale;
2701           comb->elts[comb->n] = comb->rest;
2702           comb->rest = NULL_TREE;
2703           comb->n++;
2704         }
2705       else
2706         comb->rest = fold_build2 (MULT_EXPR, comb->type, comb->rest,
2707                                   build_int_cst_type (comb->type, scale));
2708     }
2709 }
2710
2711 /* Adds ELT * SCALE to COMB.  */
2712
2713 static void
2714 aff_combination_add_elt (struct affine_tree_combination *comb, tree elt,
2715                          unsigned HOST_WIDE_INT scale)
2716 {
2717   unsigned i;
2718
2719   if (scale == 0)
2720     return;
2721
2722   for (i = 0; i < comb->n; i++)
2723     if (operand_equal_p (comb->elts[i], elt, 0))
2724       {
2725         comb->coefs[i] = (comb->coefs[i] + scale) & comb->mask;
2726         if (comb->coefs[i])
2727           return;
2728
2729         comb->n--;
2730         comb->coefs[i] = comb->coefs[comb->n];
2731         comb->elts[i] = comb->elts[comb->n];
2732
2733         if (comb->rest)
2734           {
2735             gcc_assert (comb->n == MAX_AFF_ELTS - 1);
2736             comb->coefs[comb->n] = 1;
2737             comb->elts[comb->n] = comb->rest;
2738             comb->rest = NULL_TREE;
2739             comb->n++;
2740           }
2741         return;
2742       }
2743   if (comb->n < MAX_AFF_ELTS)
2744     {
2745       comb->coefs[comb->n] = scale;
2746       comb->elts[comb->n] = elt;
2747       comb->n++;
2748       return;
2749     }
2750
2751   if (scale == 1)
2752     elt = fold_convert (comb->type, elt);
2753   else
2754     elt = fold_build2 (MULT_EXPR, comb->type,
2755                        fold_convert (comb->type, elt),
2756                        build_int_cst_type (comb->type, scale));
2757
2758   if (comb->rest)
2759     comb->rest = fold_build2 (PLUS_EXPR, comb->type, comb->rest, elt);
2760   else
2761     comb->rest = elt;
2762 }
2763
2764 /* Adds COMB2 to COMB1.  */
2765
2766 static void
2767 aff_combination_add (struct affine_tree_combination *comb1,
2768                      struct affine_tree_combination *comb2)
2769 {
2770   unsigned i;
2771
2772   comb1->offset = (comb1->offset + comb2->offset) & comb1->mask;
2773   for (i = 0; i < comb2->n; i++)
2774     aff_combination_add_elt (comb1, comb2->elts[i], comb2->coefs[i]);
2775   if (comb2->rest)
2776     aff_combination_add_elt (comb1, comb2->rest, 1);
2777 }
2778
2779 /* Splits EXPR into an affine combination of parts.  */
2780
2781 static void
2782 tree_to_aff_combination (tree expr, tree type,
2783                          struct affine_tree_combination *comb)
2784 {
2785   struct affine_tree_combination tmp;
2786   enum tree_code code;
2787   tree cst, core, toffset;
2788   HOST_WIDE_INT bitpos, bitsize;
2789   enum machine_mode mode;
2790   int unsignedp, volatilep;
2791
2792   STRIP_NOPS (expr);
2793
2794   code = TREE_CODE (expr);
2795   switch (code)
2796     {
2797     case INTEGER_CST:
2798       aff_combination_const (comb, type, int_cst_value (expr));
2799       return;
2800
2801     case PLUS_EXPR:
2802     case MINUS_EXPR:
2803       tree_to_aff_combination (TREE_OPERAND (expr, 0), type, comb);
2804       tree_to_aff_combination (TREE_OPERAND (expr, 1), type, &tmp);
2805       if (code == MINUS_EXPR)
2806         aff_combination_scale (&tmp, -1);
2807       aff_combination_add (comb, &tmp);
2808       return;
2809
2810     case MULT_EXPR:
2811       cst = TREE_OPERAND (expr, 1);
2812       if (TREE_CODE (cst) != INTEGER_CST)
2813         break;
2814       tree_to_aff_combination (TREE_OPERAND (expr, 0), type, comb);
2815       aff_combination_scale (comb, int_cst_value (cst));
2816       return;
2817
2818     case NEGATE_EXPR:
2819       tree_to_aff_combination (TREE_OPERAND (expr, 0), type, comb);
2820       aff_combination_scale (comb, -1);
2821       return;
2822
2823     case ADDR_EXPR:
2824       core = get_inner_reference (TREE_OPERAND (expr, 0), &bitsize, &bitpos,
2825                                   &toffset, &mode, &unsignedp, &volatilep,
2826                                   false);
2827       if (bitpos % BITS_PER_UNIT != 0)
2828         break;
2829       aff_combination_const (comb, type, bitpos / BITS_PER_UNIT);
2830       core = build_fold_addr_expr (core);
2831       if (TREE_CODE (core) == ADDR_EXPR)
2832         aff_combination_add_elt (comb, core, 1);
2833       else
2834         {
2835           tree_to_aff_combination (core, type, &tmp);
2836           aff_combination_add (comb, &tmp);
2837         }
2838       if (toffset)
2839         {
2840           tree_to_aff_combination (toffset, type, &tmp);
2841           aff_combination_add (comb, &tmp);
2842         }
2843       return;
2844
2845     default:
2846       break;
2847     }
2848
2849   aff_combination_elt (comb, type, expr);
2850 }
2851
2852 /* Creates EXPR + ELT * SCALE in TYPE.  MASK is the mask for width of TYPE.  */
2853
2854 static tree
2855 add_elt_to_tree (tree expr, tree type, tree elt, unsigned HOST_WIDE_INT scale,
2856                  unsigned HOST_WIDE_INT mask)
2857 {
2858   enum tree_code code;
2859
2860   scale &= mask;
2861   elt = fold_convert (type, elt);
2862
2863   if (scale == 1)
2864     {
2865       if (!expr)
2866         return elt;
2867
2868       return fold_build2 (PLUS_EXPR, type, expr, elt);
2869     }
2870
2871   if (scale == mask)
2872     {
2873       if (!expr)
2874         return fold_build1 (NEGATE_EXPR, type, elt);
2875
2876       return fold_build2 (MINUS_EXPR, type, expr, elt);
2877     }
2878
2879   if (!expr)
2880     return fold_build2 (MULT_EXPR, type, elt,
2881                         build_int_cst_type (type, scale));
2882
2883   if ((scale | (mask >> 1)) == mask)
2884     {
2885       /* Scale is negative.  */
2886       code = MINUS_EXPR;
2887       scale = (-scale) & mask;
2888     }
2889   else
2890     code = PLUS_EXPR;
2891
2892   elt = fold_build2 (MULT_EXPR, type, elt,
2893                      build_int_cst_type (type, scale));
2894   return fold_build2 (code, type, expr, elt);
2895 }
2896
2897 /* Copies the tree elements of COMB to ensure that they are not shared.  */
2898
2899 static void
2900 unshare_aff_combination (struct affine_tree_combination *comb)
2901 {
2902   unsigned i;
2903
2904   for (i = 0; i < comb->n; i++)
2905     comb->elts[i] = unshare_expr (comb->elts[i]);
2906   if (comb->rest)
2907     comb->rest = unshare_expr (comb->rest);
2908 }
2909
2910 /* Makes tree from the affine combination COMB.  */
2911
2912 static tree
2913 aff_combination_to_tree (struct affine_tree_combination *comb)
2914 {
2915   tree type = comb->type;
2916   tree expr = comb->rest;
2917   unsigned i;
2918   unsigned HOST_WIDE_INT off, sgn;
2919
2920   if (comb->n == 0 && comb->offset == 0)
2921     {
2922       if (expr)
2923         {
2924           /* Handle the special case produced by get_computation_aff when
2925              the type does not fit in HOST_WIDE_INT.  */
2926           return fold_convert (type, expr);
2927         }
2928       else
2929         return build_int_cst (type, 0);
2930     }
2931
2932   gcc_assert (comb->n == MAX_AFF_ELTS || comb->rest == NULL_TREE);
2933
2934   for (i = 0; i < comb->n; i++)
2935     expr = add_elt_to_tree (expr, type, comb->elts[i], comb->coefs[i],
2936                             comb->mask);
2937
2938   if ((comb->offset | (comb->mask >> 1)) == comb->mask)
2939     {
2940       /* Offset is negative.  */
2941       off = (-comb->offset) & comb->mask;
2942       sgn = comb->mask;
2943     }
2944   else
2945     {
2946       off = comb->offset;
2947       sgn = 1;
2948     }
2949   return add_elt_to_tree (expr, type, build_int_cst_type (type, off), sgn,
2950                           comb->mask);
2951 }
2952
2953 /* Folds EXPR using the affine expressions framework.  */
2954
2955 static tree
2956 fold_affine_expr (tree expr)
2957 {
2958   tree type = TREE_TYPE (expr);
2959   struct affine_tree_combination comb;
2960
2961   if (TYPE_PRECISION (type) > HOST_BITS_PER_WIDE_INT)
2962     return expr;
2963
2964   tree_to_aff_combination (expr, type, &comb);
2965   return aff_combination_to_tree (&comb);
2966 }
2967
2968 /* Determines the expression by that USE is expressed from induction variable
2969    CAND at statement AT in LOOP.  The expression is stored in a decomposed
2970    form into AFF.  Returns false if USE cannot be expressed using CAND.  */
2971
2972 static bool
2973 get_computation_aff (struct loop *loop,
2974                      struct iv_use *use, struct iv_cand *cand, tree at,
2975                      struct affine_tree_combination *aff)
2976 {
2977   tree ubase = use->iv->base;
2978   tree ustep = use->iv->step;
2979   tree cbase = cand->iv->base;
2980   tree cstep = cand->iv->step;
2981   tree utype = TREE_TYPE (ubase), ctype = TREE_TYPE (cbase);
2982   tree uutype;
2983   tree expr, delta;
2984   tree ratio;
2985   unsigned HOST_WIDE_INT ustepi, cstepi;
2986   HOST_WIDE_INT ratioi;
2987   struct affine_tree_combination cbase_aff, expr_aff;
2988   tree cstep_orig = cstep, ustep_orig = ustep;
2989
2990   if (TYPE_PRECISION (utype) > TYPE_PRECISION (ctype))
2991     {
2992       /* We do not have a precision to express the values of use.  */
2993       return false;
2994     }
2995
2996   expr = var_at_stmt (loop, cand, at);
2997
2998   if (TREE_TYPE (expr) != ctype)
2999     {
3000       /* This may happen with the original ivs.  */
3001       expr = fold_convert (ctype, expr);
3002     }
3003
3004   if (TYPE_UNSIGNED (utype))
3005     uutype = utype;
3006   else
3007     {
3008       uutype = unsigned_type_for (utype);
3009       ubase = fold_convert (uutype, ubase);
3010       ustep = fold_convert (uutype, ustep);
3011     }
3012
3013   if (uutype != ctype)
3014     {
3015       expr = fold_convert (uutype, expr);
3016       cbase = fold_convert (uutype, cbase);
3017       cstep = fold_convert (uutype, cstep);
3018
3019       /* If the conversion is not noop, we must take it into account when
3020          considering the value of the step.  */
3021       if (TYPE_PRECISION (utype) < TYPE_PRECISION (ctype))
3022         cstep_orig = cstep;
3023     }
3024
3025   if (cst_and_fits_in_hwi (cstep_orig)
3026       && cst_and_fits_in_hwi (ustep_orig))
3027     {
3028       ustepi = int_cst_value (ustep_orig);
3029       cstepi = int_cst_value (cstep_orig);
3030
3031       if (!divide (TYPE_PRECISION (uutype), ustepi, cstepi, &ratioi))
3032         {
3033           /* TODO maybe consider case when ustep divides cstep and the ratio is
3034              a power of 2 (so that the division is fast to execute)?  We would
3035              need to be much more careful with overflows etc. then.  */
3036           return false;
3037         }
3038
3039       ratio = build_int_cst_type (uutype, ratioi);
3040     }
3041   else
3042     {
3043       ratio = constant_multiple_of (uutype, ustep_orig, cstep_orig);
3044       if (!ratio)
3045         return false;
3046
3047       /* Ratioi is only used to detect special cases when the multiplicative
3048          factor is 1 or -1, so if we cannot convert ratio to HOST_WIDE_INT,
3049          we may set it to 0.  We prefer cst_and_fits_in_hwi/int_cst_value
3050          to integer_onep/integer_all_onesp, since the former ignores
3051          TREE_OVERFLOW.  */
3052       if (cst_and_fits_in_hwi (ratio))
3053         ratioi = int_cst_value (ratio);
3054       else if (integer_onep (ratio))
3055         ratioi = 1;
3056       else if (integer_all_onesp (ratio))
3057         ratioi = -1;
3058       else
3059         ratioi = 0;
3060     }
3061
3062   /* We may need to shift the value if we are after the increment.  */
3063   if (stmt_after_increment (loop, cand, at))
3064     cbase = fold_build2 (PLUS_EXPR, uutype, cbase, cstep);
3065
3066   /* use = ubase - ratio * cbase + ratio * var.
3067
3068      In general case ubase + ratio * (var - cbase) could be better (one less
3069      multiplication), but often it is possible to eliminate redundant parts
3070      of computations from (ubase - ratio * cbase) term, and if it does not
3071      happen, fold is able to apply the distributive law to obtain this form
3072      anyway.  */
3073
3074   if (TYPE_PRECISION (uutype) > HOST_BITS_PER_WIDE_INT)
3075     {
3076       /* Let's compute in trees and just return the result in AFF.  This case
3077          should not be very common, and fold itself is not that bad either,
3078          so making the aff. functions more complicated to handle this case
3079          is not that urgent.  */
3080       if (ratioi == 1)
3081         {
3082           delta = fold_build2 (MINUS_EXPR, uutype, ubase, cbase);
3083           expr = fold_build2 (PLUS_EXPR, uutype, expr, delta);
3084         }
3085       else if (ratioi == -1)
3086         {
3087           delta = fold_build2 (PLUS_EXPR, uutype, ubase, cbase);
3088           expr = fold_build2 (MINUS_EXPR, uutype, delta, expr);
3089         }
3090       else
3091         {
3092           delta = fold_build2 (MULT_EXPR, uutype, cbase, ratio);
3093           delta = fold_build2 (MINUS_EXPR, uutype, ubase, delta);
3094           expr = fold_build2 (MULT_EXPR, uutype, ratio, expr);
3095           expr = fold_build2 (PLUS_EXPR, uutype, delta, expr);
3096         }
3097
3098       aff->type = uutype;
3099       aff->n = 0;
3100       aff->offset = 0;
3101       aff->mask = 0;
3102       aff->rest = expr;
3103       return true;
3104     }
3105
3106   /* If we got here, the types fits in HOST_WIDE_INT, thus it must be
3107      possible to compute ratioi.  */
3108   gcc_assert (ratioi);
3109
3110   tree_to_aff_combination (ubase, uutype, aff);
3111   tree_to_aff_combination (cbase, uutype, &cbase_aff);
3112   tree_to_aff_combination (expr, uutype, &expr_aff);
3113   aff_combination_scale (&cbase_aff, -ratioi);
3114   aff_combination_scale (&expr_aff, ratioi);
3115   aff_combination_add (aff, &cbase_aff);
3116   aff_combination_add (aff, &expr_aff);
3117
3118   return true;
3119 }
3120
3121 /* Determines the expression by that USE is expressed from induction variable
3122    CAND at statement AT in LOOP.  The computation is unshared.  */
3123
3124 static tree
3125 get_computation_at (struct loop *loop,
3126                     struct iv_use *use, struct iv_cand *cand, tree at)
3127 {
3128   struct affine_tree_combination aff;
3129   tree type = TREE_TYPE (use->iv->base);
3130
3131   if (!get_computation_aff (loop, use, cand, at, &aff))
3132     return NULL_TREE;
3133   unshare_aff_combination (&aff);
3134   return fold_convert (type, aff_combination_to_tree (&aff));
3135 }
3136
3137 /* Determines the expression by that USE is expressed from induction variable
3138    CAND in LOOP.  The computation is unshared.  */
3139
3140 static tree
3141 get_computation (struct loop *loop, struct iv_use *use, struct iv_cand *cand)
3142 {
3143   return get_computation_at (loop, use, cand, use->stmt);
3144 }
3145
3146 /* Returns cost of addition in MODE.  */
3147
3148 static unsigned
3149 add_cost (enum machine_mode mode)
3150 {
3151   static unsigned costs[NUM_MACHINE_MODES];
3152   rtx seq;
3153   unsigned cost;
3154
3155   if (costs[mode])
3156     return costs[mode];
3157
3158   start_sequence ();
3159   force_operand (gen_rtx_fmt_ee (PLUS, mode,
3160                                  gen_raw_REG (mode, LAST_VIRTUAL_REGISTER + 1),
3161                                  gen_raw_REG (mode, LAST_VIRTUAL_REGISTER + 2)),
3162                  NULL_RTX);
3163   seq = get_insns ();
3164   end_sequence ();
3165
3166   cost = seq_cost (seq);
3167   if (!cost)
3168     cost = 1;
3169
3170   costs[mode] = cost;
3171
3172   if (dump_file && (dump_flags & TDF_DETAILS))
3173     fprintf (dump_file, "Addition in %s costs %d\n",
3174              GET_MODE_NAME (mode), cost);
3175   return cost;
3176 }
3177
3178 /* Entry in a hashtable of already known costs for multiplication.  */
3179 struct mbc_entry
3180 {
3181   HOST_WIDE_INT cst;            /* The constant to multiply by.  */
3182   enum machine_mode mode;       /* In mode.  */
3183   unsigned cost;                /* The cost.  */
3184 };
3185
3186 /* Counts hash value for the ENTRY.  */
3187
3188 static hashval_t
3189 mbc_entry_hash (const void *entry)
3190 {
3191   const struct mbc_entry *e = entry;
3192
3193   return 57 * (hashval_t) e->mode + (hashval_t) (e->cst % 877);
3194 }
3195
3196 /* Compares the hash table entries ENTRY1 and ENTRY2.  */
3197
3198 static int
3199 mbc_entry_eq (const void *entry1, const void *entry2)
3200 {
3201   const struct mbc_entry *e1 = entry1;
3202   const struct mbc_entry *e2 = entry2;
3203
3204   return (e1->mode == e2->mode
3205           && e1->cst == e2->cst);
3206 }
3207
3208 /* Returns cost of multiplication by constant CST in MODE.  */
3209
3210 unsigned
3211 multiply_by_cost (HOST_WIDE_INT cst, enum machine_mode mode)
3212 {
3213   static htab_t costs;
3214   struct mbc_entry **cached, act;
3215   rtx seq;
3216   unsigned cost;
3217
3218   if (!costs)
3219     costs = htab_create (100, mbc_entry_hash, mbc_entry_eq, free);
3220
3221   act.mode = mode;
3222   act.cst = cst;
3223   cached = (struct mbc_entry **) htab_find_slot (costs, &act, INSERT);
3224   if (*cached)
3225     return (*cached)->cost;
3226
3227   *cached = XNEW (struct mbc_entry);
3228   (*cached)->mode = mode;
3229   (*cached)->cst = cst;
3230
3231   start_sequence ();
3232   expand_mult (mode, gen_raw_REG (mode, LAST_VIRTUAL_REGISTER + 1),
3233                gen_int_mode (cst, mode), NULL_RTX, 0);
3234   seq = get_insns ();
3235   end_sequence ();
3236
3237   cost = seq_cost (seq);
3238
3239   if (dump_file && (dump_flags & TDF_DETAILS))
3240     fprintf (dump_file, "Multiplication by %d in %s costs %d\n",
3241              (int) cst, GET_MODE_NAME (mode), cost);
3242
3243   (*cached)->cost = cost;
3244
3245   return cost;
3246 }
3247
3248 /* Returns true if multiplying by RATIO is allowed in address.  */
3249
3250 bool
3251 multiplier_allowed_in_address_p (HOST_WIDE_INT ratio)
3252 {
3253 #define MAX_RATIO 128
3254   static sbitmap valid_mult;
3255
3256   if (!valid_mult)
3257     {
3258       rtx reg1 = gen_raw_REG (Pmode, LAST_VIRTUAL_REGISTER + 1);
3259       rtx addr;
3260       HOST_WIDE_INT i;
3261
3262       valid_mult = sbitmap_alloc (2 * MAX_RATIO + 1);
3263       sbitmap_zero (valid_mult);
3264       addr = gen_rtx_fmt_ee (MULT, Pmode, reg1, NULL_RTX);
3265       for (i = -MAX_RATIO; i <= MAX_RATIO; i++)
3266         {
3267           XEXP (addr, 1) = gen_int_mode (i, Pmode);
3268           if (memory_address_p (Pmode, addr))
3269             SET_BIT (valid_mult, i + MAX_RATIO);
3270         }
3271
3272       if (dump_file && (dump_flags & TDF_DETAILS))
3273         {
3274           fprintf (dump_file, "  allowed multipliers:");
3275           for (i = -MAX_RATIO; i <= MAX_RATIO; i++)
3276             if (TEST_BIT (valid_mult, i + MAX_RATIO))
3277               fprintf (dump_file, " %d", (int) i);
3278           fprintf (dump_file, "\n");
3279           fprintf (dump_file, "\n");
3280         }
3281     }
3282
3283   if (ratio > MAX_RATIO || ratio < -MAX_RATIO)
3284     return false;
3285
3286   return TEST_BIT (valid_mult, ratio + MAX_RATIO);
3287 }
3288
3289 /* Returns cost of address in shape symbol + var + OFFSET + RATIO * index.
3290    If SYMBOL_PRESENT is false, symbol is omitted.  If VAR_PRESENT is false,
3291    variable is omitted.  The created memory accesses MODE.
3292
3293    TODO -- there must be some better way.  This all is quite crude.  */
3294
3295 static unsigned
3296 get_address_cost (bool symbol_present, bool var_present,
3297                   unsigned HOST_WIDE_INT offset, HOST_WIDE_INT ratio)
3298 {
3299   static bool initialized = false;
3300   static HOST_WIDE_INT rat, off;
3301   static HOST_WIDE_INT min_offset, max_offset;
3302   static unsigned costs[2][2][2][2];
3303   unsigned cost, acost;
3304   rtx seq, addr, base;
3305   bool offset_p, ratio_p;
3306   rtx reg1;
3307   HOST_WIDE_INT s_offset;
3308   unsigned HOST_WIDE_INT mask;
3309   unsigned bits;
3310
3311   if (!initialized)
3312     {
3313       HOST_WIDE_INT i;
3314       initialized = true;
3315
3316       reg1 = gen_raw_REG (Pmode, LAST_VIRTUAL_REGISTER + 1);
3317
3318       addr = gen_rtx_fmt_ee (PLUS, Pmode, reg1, NULL_RTX);
3319       for (i = 1; i <= 1 << 20; i <<= 1)
3320         {
3321           XEXP (addr, 1) = gen_int_mode (i, Pmode);
3322           if (!memory_address_p (Pmode, addr))
3323             break;
3324         }
3325       max_offset = i >> 1;
3326       off = max_offset;
3327
3328       for (i = 1; i <= 1 << 20; i <<= 1)
3329         {
3330           XEXP (addr, 1) = gen_int_mode (-i, Pmode);
3331           if (!memory_address_p (Pmode, addr))
3332             break;
3333         }
3334       min_offset = -(i >> 1);
3335
3336       if (dump_file && (dump_flags & TDF_DETAILS))
3337         {
3338           fprintf (dump_file, "get_address_cost:\n");
3339           fprintf (dump_file, "  min offset %d\n", (int) min_offset);
3340           fprintf (dump_file, "  max offset %d\n", (int) max_offset);
3341         }
3342
3343       rat = 1;
3344       for (i = 2; i <= MAX_RATIO; i++)
3345         if (multiplier_allowed_in_address_p (i))
3346           {
3347             rat = i;
3348             break;
3349           }
3350     }
3351
3352   bits = GET_MODE_BITSIZE (Pmode);
3353   mask = ~(~(unsigned HOST_WIDE_INT) 0 << (bits - 1) << 1);
3354   offset &= mask;
3355   if ((offset >> (bits - 1) & 1))
3356     offset |= ~mask;
3357   s_offset = offset;
3358
3359   cost = 0;
3360   offset_p = (s_offset != 0
3361               && min_offset <= s_offset && s_offset <= max_offset);
3362   ratio_p = (ratio != 1
3363              && multiplier_allowed_in_address_p (ratio));
3364
3365   if (ratio != 1 && !ratio_p)
3366     cost += multiply_by_cost (ratio, Pmode);
3367
3368   if (s_offset && !offset_p && !symbol_present)
3369     {
3370       cost += add_cost (Pmode);
3371       var_present = true;
3372     }
3373
3374   acost = costs[symbol_present][var_present][offset_p][ratio_p];
3375   if (!acost)
3376     {
3377       int old_cse_not_expected;
3378       acost = 0;
3379
3380       addr = gen_raw_REG (Pmode, LAST_VIRTUAL_REGISTER + 1);
3381       reg1 = gen_raw_REG (Pmode, LAST_VIRTUAL_REGISTER + 2);
3382       if (ratio_p)
3383         addr = gen_rtx_fmt_ee (MULT, Pmode, addr, gen_int_mode (rat, Pmode));
3384
3385       if (var_present)
3386         addr = gen_rtx_fmt_ee (PLUS, Pmode, addr, reg1);
3387
3388       if (symbol_present)
3389         {
3390           base = gen_rtx_SYMBOL_REF (Pmode, ggc_strdup (""));
3391           if (offset_p)
3392             base = gen_rtx_fmt_e (CONST, Pmode,
3393                                   gen_rtx_fmt_ee (PLUS, Pmode,
3394                                                   base,
3395                                                   gen_int_mode (off, Pmode)));
3396         }
3397       else if (offset_p)
3398         base = gen_int_mode (off, Pmode);
3399       else
3400         base = NULL_RTX;
3401
3402       if (base)
3403         addr = gen_rtx_fmt_ee (PLUS, Pmode, addr, base);
3404
3405       start_sequence ();
3406       /* To avoid splitting addressing modes, pretend that no cse will
3407          follow.  */
3408       old_cse_not_expected = cse_not_expected;
3409       cse_not_expected = true;
3410       addr = memory_address (Pmode, addr);
3411       cse_not_expected = old_cse_not_expected;
3412       seq = get_insns ();
3413       end_sequence ();
3414
3415       acost = seq_cost (seq);
3416       acost += address_cost (addr, Pmode);
3417
3418       if (!acost)
3419         acost = 1;
3420       costs[symbol_present][var_present][offset_p][ratio_p] = acost;
3421     }
3422
3423   return cost + acost;
3424 }
3425
3426 /* Estimates cost of forcing expression EXPR into a variable.  */
3427
3428 unsigned
3429 force_expr_to_var_cost (tree expr)
3430 {
3431   static bool costs_initialized = false;
3432   static unsigned integer_cost;
3433   static unsigned symbol_cost;
3434   static unsigned address_cost;
3435   tree op0, op1;
3436   unsigned cost0, cost1, cost;
3437   enum machine_mode mode;
3438
3439   if (!costs_initialized)
3440     {
3441       tree var = create_tmp_var_raw (integer_type_node, "test_var");
3442       rtx x = gen_rtx_MEM (DECL_MODE (var),
3443                            gen_rtx_SYMBOL_REF (Pmode, "test_var"));
3444       tree addr;
3445       tree type = build_pointer_type (integer_type_node);
3446
3447       integer_cost = computation_cost (build_int_cst (integer_type_node,
3448                                                       2000));
3449
3450       SET_DECL_RTL (var, x);
3451       TREE_STATIC (var) = 1;
3452       addr = build1 (ADDR_EXPR, type, var);
3453       symbol_cost = computation_cost (addr) + 1;
3454
3455       address_cost
3456         = computation_cost (build2 (PLUS_EXPR, type,
3457                                     addr,
3458                                     build_int_cst (type, 2000))) + 1;
3459       if (dump_file && (dump_flags & TDF_DETAILS))
3460         {
3461           fprintf (dump_file, "force_expr_to_var_cost:\n");
3462           fprintf (dump_file, "  integer %d\n", (int) integer_cost);
3463           fprintf (dump_file, "  symbol %d\n", (int) symbol_cost);
3464           fprintf (dump_file, "  address %d\n", (int) address_cost);
3465           fprintf (dump_file, "  other %d\n", (int) target_spill_cost);
3466           fprintf (dump_file, "\n");
3467         }
3468
3469       costs_initialized = true;
3470     }
3471
3472   STRIP_NOPS (expr);
3473
3474   if (SSA_VAR_P (expr))
3475     return 0;
3476
3477   if (TREE_INVARIANT (expr))
3478     {
3479       if (TREE_CODE (expr) == INTEGER_CST)
3480         return integer_cost;
3481
3482       if (TREE_CODE (expr) == ADDR_EXPR)
3483         {
3484           tree obj = TREE_OPERAND (expr, 0);
3485
3486           if (TREE_CODE (obj) == VAR_DECL
3487               || TREE_CODE (obj) == PARM_DECL
3488               || TREE_CODE (obj) == RESULT_DECL)
3489             return symbol_cost;
3490         }
3491
3492       return address_cost;
3493     }
3494
3495   switch (TREE_CODE (expr))
3496     {
3497     case PLUS_EXPR:
3498     case MINUS_EXPR:
3499     case MULT_EXPR:
3500       op0 = TREE_OPERAND (expr, 0);
3501       op1 = TREE_OPERAND (expr, 1);
3502       STRIP_NOPS (op0);
3503       STRIP_NOPS (op1);
3504
3505       if (is_gimple_val (op0))
3506         cost0 = 0;
3507       else
3508         cost0 = force_expr_to_var_cost (op0);
3509
3510       if (is_gimple_val (op1))
3511         cost1 = 0;
3512       else
3513         cost1 = force_expr_to_var_cost (op1);
3514
3515       break;
3516
3517     default:
3518       /* Just an arbitrary value, FIXME.  */
3519       return target_spill_cost;
3520     }
3521
3522   mode = TYPE_MODE (TREE_TYPE (expr));
3523   switch (TREE_CODE (expr))
3524     {
3525     case PLUS_EXPR:
3526     case MINUS_EXPR:
3527       cost = add_cost (mode);
3528       break;
3529
3530     case MULT_EXPR:
3531       if (cst_and_fits_in_hwi (op0))
3532         cost = multiply_by_cost (int_cst_value (op0), mode);
3533       else if (cst_and_fits_in_hwi (op1))
3534         cost = multiply_by_cost (int_cst_value (op1), mode);
3535       else
3536         return target_spill_cost;
3537       break;
3538
3539     default:
3540       gcc_unreachable ();
3541     }
3542
3543   cost += cost0;
3544   cost += cost1;
3545
3546   /* Bound the cost by target_spill_cost.  The parts of complicated
3547      computations often are either loop invariant or at least can
3548      be shared between several iv uses, so letting this grow without
3549      limits would not give reasonable results.  */
3550   return cost < target_spill_cost ? cost : target_spill_cost;
3551 }
3552
3553 /* Estimates cost of forcing EXPR into a variable.  DEPENDS_ON is a set of the
3554    invariants the computation depends on.  */
3555
3556 static unsigned
3557 force_var_cost (struct ivopts_data *data,
3558                 tree expr, bitmap *depends_on)
3559 {
3560   if (depends_on)
3561     {
3562       fd_ivopts_data = data;
3563       walk_tree (&expr, find_depends, depends_on, NULL);
3564     }
3565
3566   return force_expr_to_var_cost (expr);
3567 }
3568
3569 /* Estimates cost of expressing address ADDR  as var + symbol + offset.  The
3570    value of offset is added to OFFSET, SYMBOL_PRESENT and VAR_PRESENT are set
3571    to false if the corresponding part is missing.  DEPENDS_ON is a set of the
3572    invariants the computation depends on.  */
3573
3574 static unsigned
3575 split_address_cost (struct ivopts_data *data,
3576                     tree addr, bool *symbol_present, bool *var_present,
3577                     unsigned HOST_WIDE_INT *offset, bitmap *depends_on)
3578 {
3579   tree core;
3580   HOST_WIDE_INT bitsize;
3581   HOST_WIDE_INT bitpos;
3582   tree toffset;
3583   enum machine_mode mode;
3584   int unsignedp, volatilep;
3585
3586   core = get_inner_reference (addr, &bitsize, &bitpos, &toffset, &mode,
3587                               &unsignedp, &volatilep, false);
3588
3589   if (toffset != 0
3590       || bitpos % BITS_PER_UNIT != 0
3591       || TREE_CODE (core) != VAR_DECL)
3592     {
3593       *symbol_present = false;
3594       *var_present = true;
3595       fd_ivopts_data = data;
3596       walk_tree (&addr, find_depends, depends_on, NULL);
3597       return target_spill_cost;
3598     }
3599
3600   *offset += bitpos / BITS_PER_UNIT;
3601   if (TREE_STATIC (core)
3602       || DECL_EXTERNAL (core))
3603     {
3604       *symbol_present = true;
3605       *var_present = false;
3606       return 0;
3607     }
3608
3609   *symbol_present = false;
3610   *var_present = true;
3611   return 0;
3612 }
3613
3614 /* Estimates cost of expressing difference of addresses E1 - E2 as
3615    var + symbol + offset.  The value of offset is added to OFFSET,
3616    SYMBOL_PRESENT and VAR_PRESENT are set to false if the corresponding
3617    part is missing.  DEPENDS_ON is a set of the invariants the computation
3618    depends on.  */
3619
3620 static unsigned
3621 ptr_difference_cost (struct ivopts_data *data,
3622                      tree e1, tree e2, bool *symbol_present, bool *var_present,
3623                      unsigned HOST_WIDE_INT *offset, bitmap *depends_on)
3624 {
3625   HOST_WIDE_INT diff = 0;
3626   unsigned cost;
3627
3628   gcc_assert (TREE_CODE (e1) == ADDR_EXPR);
3629
3630   if (ptr_difference_const (e1, e2, &diff))
3631     {
3632       *offset += diff;
3633       *symbol_present = false;
3634       *var_present = false;
3635       return 0;
3636     }
3637
3638   if (e2 == integer_zero_node)
3639     return split_address_cost (data, TREE_OPERAND (e1, 0),
3640                                symbol_present, var_present, offset, depends_on);
3641
3642   *symbol_present = false;
3643   *var_present = true;
3644
3645   cost = force_var_cost (data, e1, depends_on);
3646   cost += force_var_cost (data, e2, depends_on);
3647   cost += add_cost (Pmode);
3648
3649   return cost;
3650 }
3651
3652 /* Estimates cost of expressing difference E1 - E2 as
3653    var + symbol + offset.  The value of offset is added to OFFSET,
3654    SYMBOL_PRESENT and VAR_PRESENT are set to false if the corresponding
3655    part is missing.  DEPENDS_ON is a set of the invariants the computation
3656    depends on.  */
3657
3658 static unsigned
3659 difference_cost (struct ivopts_data *data,
3660                  tree e1, tree e2, bool *symbol_present, bool *var_present,
3661                  unsigned HOST_WIDE_INT *offset, bitmap *depends_on)
3662 {
3663   unsigned cost;
3664   enum machine_mode mode = TYPE_MODE (TREE_TYPE (e1));
3665   unsigned HOST_WIDE_INT off1, off2;
3666
3667   e1 = strip_offset (e1, &off1);
3668   e2 = strip_offset (e2, &off2);
3669   *offset += off1 - off2;
3670
3671   STRIP_NOPS (e1);
3672   STRIP_NOPS (e2);
3673
3674   if (TREE_CODE (e1) == ADDR_EXPR)
3675     return ptr_difference_cost (data, e1, e2, symbol_present, var_present, offset,
3676                                 depends_on);
3677   *symbol_present = false;
3678
3679   if (operand_equal_p (e1, e2, 0))
3680     {
3681       *var_present = false;
3682       return 0;
3683     }
3684   *var_present = true;
3685   if (zero_p (e2))
3686     return force_var_cost (data, e1, depends_on);
3687
3688   if (zero_p (e1))
3689     {
3690       cost = force_var_cost (data, e2, depends_on);
3691       cost += multiply_by_cost (-1, mode);
3692
3693       return cost;
3694     }
3695
3696   cost = force_var_cost (data, e1, depends_on);
3697   cost += force_var_cost (data, e2, depends_on);
3698   cost += add_cost (mode);
3699
3700   return cost;
3701 }
3702
3703 /* Determines the cost of the computation by that USE is expressed
3704    from induction variable CAND.  If ADDRESS_P is true, we just need
3705    to create an address from it, otherwise we want to get it into
3706    register.  A set of invariants we depend on is stored in
3707    DEPENDS_ON.  AT is the statement at that the value is computed.  */
3708
3709 static unsigned
3710 get_computation_cost_at (struct ivopts_data *data,
3711                          struct iv_use *use, struct iv_cand *cand,
3712                          bool address_p, bitmap *depends_on, tree at)
3713 {
3714   tree ubase = use->iv->base, ustep = use->iv->step;
3715   tree cbase, cstep;
3716   tree utype = TREE_TYPE (ubase), ctype;
3717   unsigned HOST_WIDE_INT ustepi, cstepi, offset = 0;
3718   HOST_WIDE_INT ratio, aratio;
3719   bool var_present, symbol_present;
3720   unsigned cost = 0, n_sums;
3721
3722   *depends_on = NULL;
3723
3724   /* Only consider real candidates.  */
3725   if (!cand->iv)
3726     return INFTY;
3727
3728   cbase = cand->iv->base;
3729   cstep = cand->iv->step;
3730   ctype = TREE_TYPE (cbase);
3731
3732   if (TYPE_PRECISION (utype) > TYPE_PRECISION (ctype))
3733     {
3734       /* We do not have a precision to express the values of use.  */
3735       return INFTY;
3736     }
3737
3738   if (address_p)
3739     {
3740       /* Do not try to express address of an object with computation based
3741          on address of a different object.  This may cause problems in rtl
3742          level alias analysis (that does not expect this to be happening,
3743          as this is illegal in C), and would be unlikely to be useful
3744          anyway.  */
3745       if (use->iv->base_object
3746           && cand->iv->base_object
3747           && !operand_equal_p (use->iv->base_object, cand->iv->base_object, 0))
3748         return INFTY;
3749     }
3750
3751   if (TYPE_PRECISION (utype) != TYPE_PRECISION (ctype))
3752     {
3753       /* TODO -- add direct handling of this case.  */
3754       goto fallback;
3755     }
3756
3757   /* CSTEPI is removed from the offset in case statement is after the
3758      increment.  If the step is not constant, we use zero instead.
3759      This is a bit imprecise (there is the extra addition), but
3760      redundancy elimination is likely to transform the code so that
3761      it uses value of the variable before increment anyway,
3762      so it is not that much unrealistic.  */
3763   if (cst_and_fits_in_hwi (cstep))
3764     cstepi = int_cst_value (cstep);
3765   else
3766     cstepi = 0;
3767
3768   if (cst_and_fits_in_hwi (ustep)
3769       && cst_and_fits_in_hwi (cstep))
3770     {
3771       ustepi = int_cst_value (ustep);
3772
3773       if (!divide (TYPE_PRECISION (utype), ustepi, cstepi, &ratio))
3774         return INFTY;
3775     }
3776   else
3777     {
3778       tree rat;
3779
3780       rat = constant_multiple_of (utype, ustep, cstep);
3781
3782       if (!rat)
3783         return INFTY;
3784
3785       if (cst_and_fits_in_hwi (rat))
3786         ratio = int_cst_value (rat);
3787       else if (integer_onep (rat))
3788         ratio = 1;
3789       else if (integer_all_onesp (rat))
3790         ratio = -1;
3791       else
3792         return INFTY;
3793     }
3794
3795   /* use = ubase + ratio * (var - cbase).  If either cbase is a constant
3796      or ratio == 1, it is better to handle this like
3797
3798      ubase - ratio * cbase + ratio * var
3799
3800      (also holds in the case ratio == -1, TODO.  */
3801
3802   if (cst_and_fits_in_hwi (cbase))
3803     {
3804       offset = - ratio * int_cst_value (cbase);
3805       cost += difference_cost (data,
3806                                ubase, integer_zero_node,
3807                                &symbol_present, &var_present, &offset,
3808                                depends_on);
3809     }
3810   else if (ratio == 1)
3811     {
3812       cost += difference_cost (data,
3813                                ubase, cbase,
3814                                &symbol_present, &var_present, &offset,
3815                                depends_on);
3816     }
3817   else
3818     {
3819       cost += force_var_cost (data, cbase, depends_on);
3820       cost += add_cost (TYPE_MODE (ctype));
3821       cost += difference_cost (data,
3822                                ubase, integer_zero_node,
3823                                &symbol_present, &var_present, &offset,
3824                                depends_on);
3825     }
3826
3827   /* If we are after the increment, the value of the candidate is higher by
3828      one iteration.  */
3829   if (stmt_after_increment (data->current_loop, cand, at))
3830     offset -= ratio * cstepi;
3831
3832   /* Now the computation is in shape symbol + var1 + const + ratio * var2.
3833      (symbol/var/const parts may be omitted).  If we are looking for an address,
3834      find the cost of addressing this.  */
3835   if (address_p)
3836     return cost + get_address_cost (symbol_present, var_present, offset, ratio);
3837
3838   /* Otherwise estimate the costs for computing the expression.  */
3839   aratio = ratio > 0 ? ratio : -ratio;
3840   if (!symbol_present && !var_present && !offset)
3841     {
3842       if (ratio != 1)
3843         cost += multiply_by_cost (ratio, TYPE_MODE (ctype));
3844
3845       return cost;
3846     }
3847
3848   if (aratio != 1)
3849     cost += multiply_by_cost (aratio, TYPE_MODE (ctype));
3850
3851   n_sums = 1;
3852   if (var_present
3853       /* Symbol + offset should be compile-time computable.  */
3854       && (symbol_present || offset))
3855     n_sums++;
3856
3857   return cost + n_sums * add_cost (TYPE_MODE (ctype));
3858
3859 fallback:
3860   {
3861     /* Just get the expression, expand it and measure the cost.  */
3862     tree comp = get_computation_at (data->current_loop, use, cand, at);
3863
3864     if (!comp)
3865       return INFTY;
3866
3867     if (address_p)
3868       comp = build1 (INDIRECT_REF, TREE_TYPE (TREE_TYPE (comp)), comp);
3869
3870     return computation_cost (comp);
3871   }
3872 }
3873
3874 /* Determines the cost of the computation by that USE is expressed
3875    from induction variable CAND.  If ADDRESS_P is true, we just need
3876    to create an address from it, otherwise we want to get it into
3877    register.  A set of invariants we depend on is stored in
3878    DEPENDS_ON.  */
3879
3880 static unsigned
3881 get_computation_cost (struct ivopts_data *data,
3882                       struct iv_use *use, struct iv_cand *cand,
3883                       bool address_p, bitmap *depends_on)
3884 {
3885   return get_computation_cost_at (data,
3886                                   use, cand, address_p, depends_on, use->stmt);
3887 }
3888
3889 /* Determines cost of basing replacement of USE on CAND in a generic
3890    expression.  */
3891
3892 static bool
3893 determine_use_iv_cost_generic (struct ivopts_data *data,
3894                                struct iv_use *use, struct iv_cand *cand)
3895 {
3896   bitmap depends_on;
3897   unsigned cost;
3898
3899   /* The simple case first -- if we need to express value of the preserved
3900      original biv, the cost is 0.  This also prevents us from counting the
3901      cost of increment twice -- once at this use and once in the cost of
3902      the candidate.  */
3903   if (cand->pos == IP_ORIGINAL
3904       && cand->incremented_at == use->stmt)
3905     {
3906       set_use_iv_cost (data, use, cand, 0, NULL, NULL_TREE);
3907       return true;
3908     }
3909
3910   cost = get_computation_cost (data, use, cand, false, &depends_on);
3911   set_use_iv_cost (data, use, cand, cost, depends_on, NULL_TREE);
3912
3913   return cost != INFTY;
3914 }
3915
3916 /* Determines cost of basing replacement of USE on CAND in an address.  */
3917
3918 static bool
3919 determine_use_iv_cost_address (struct ivopts_data *data,
3920                                struct iv_use *use, struct iv_cand *cand)
3921 {
3922   bitmap depends_on;
3923   unsigned cost = get_computation_cost (data, use, cand, true, &depends_on);
3924
3925   set_use_iv_cost (data, use, cand, cost, depends_on, NULL_TREE);
3926
3927   return cost != INFTY;
3928 }
3929
3930 /* Computes value of induction variable IV in iteration NITER.  */
3931
3932 static tree
3933 iv_value (struct iv *iv, tree niter)
3934 {
3935   tree val;
3936   tree type = TREE_TYPE (iv->base);
3937
3938   niter = fold_convert (type, niter);
3939   val = fold_build2 (MULT_EXPR, type, iv->step, niter);
3940
3941   return fold_build2 (PLUS_EXPR, type, iv->base, val);
3942 }
3943
3944 /* Computes value of candidate CAND at position AT in iteration NITER.  */
3945
3946 static tree
3947 cand_value_at (struct loop *loop, struct iv_cand *cand, tree at, tree niter)
3948 {
3949   tree val = iv_value (cand->iv, niter);
3950   tree type = TREE_TYPE (cand->iv->base);
3951
3952   if (stmt_after_increment (loop, cand, at))
3953     val = fold_build2 (PLUS_EXPR, type, val, cand->iv->step);
3954
3955   return val;
3956 }
3957
3958 /* Returns period of induction variable iv.  */
3959
3960 static tree
3961 iv_period (struct iv *iv)
3962 {
3963   tree step = iv->step, period, type;
3964   tree pow2div;
3965
3966   gcc_assert (step && TREE_CODE (step) == INTEGER_CST);
3967
3968   /* Period of the iv is gcd (step, type range).  Since type range is power
3969      of two, it suffices to determine the maximum power of two that divides
3970      step.  */
3971   pow2div = num_ending_zeros (step);
3972   type = unsigned_type_for (TREE_TYPE (step));
3973
3974   period = build_low_bits_mask (type,
3975                                 (TYPE_PRECISION (type)
3976                                  - tree_low_cst (pow2div, 1)));
3977
3978   return period;
3979 }
3980
3981 /* Returns the comparison operator used when eliminating the iv USE.  */
3982
3983 static enum tree_code
3984 iv_elimination_compare (struct ivopts_data *data, struct iv_use *use)
3985 {
3986   struct loop *loop = data->current_loop;
3987   basic_block ex_bb;
3988   edge exit;
3989
3990   ex_bb = bb_for_stmt (use->stmt);
3991   exit = EDGE_SUCC (ex_bb, 0);
3992   if (flow_bb_inside_loop_p (loop, exit->dest))
3993     exit = EDGE_SUCC (ex_bb, 1);
3994
3995   return (exit->flags & EDGE_TRUE_VALUE ? EQ_EXPR : NE_EXPR);
3996 }
3997
3998 /* Check whether it is possible to express the condition in USE by comparison
3999    of candidate CAND.  If so, store the value compared with to BOUND.  */
4000
4001 static bool
4002 may_eliminate_iv (struct ivopts_data *data,
4003                   struct iv_use *use, struct iv_cand *cand, tree *bound)
4004 {
4005   basic_block ex_bb;
4006   edge exit;
4007   tree nit, nit_type;
4008   tree wider_type, period, per_type;
4009   struct loop *loop = data->current_loop;
4010
4011   if (TREE_CODE (cand->iv->step) != INTEGER_CST)
4012     return false;
4013
4014   /* For now works only for exits that dominate the loop latch.  TODO -- extend
4015      for other conditions inside loop body.  */
4016   ex_bb = bb_for_stmt (use->stmt);
4017   if (use->stmt != last_stmt (ex_bb)
4018       || TREE_CODE (use->stmt) != COND_EXPR)
4019     return false;
4020   if (!dominated_by_p (CDI_DOMINATORS, loop->latch, ex_bb))
4021     return false;
4022
4023   exit = EDGE_SUCC (ex_bb, 0);
4024   if (flow_bb_inside_loop_p (loop, exit->dest))
4025     exit = EDGE_SUCC (ex_bb, 1);
4026   if (flow_bb_inside_loop_p (loop, exit->dest))
4027     return false;
4028
4029   nit = niter_for_exit (data, exit);
4030   if (!nit)
4031     return false;
4032
4033   nit_type = TREE_TYPE (nit);
4034
4035   /* Determine whether we may use the variable to test whether niter iterations
4036      elapsed.  This is the case iff the period of the induction variable is
4037      greater than the number of iterations.  */
4038   period = iv_period (cand->iv);
4039   if (!period)
4040     return false;
4041   per_type = TREE_TYPE (period);
4042
4043   wider_type = TREE_TYPE (period);
4044   if (TYPE_PRECISION (nit_type) < TYPE_PRECISION (per_type))
4045     wider_type = per_type;
4046   else
4047     wider_type = nit_type;
4048
4049   if (!integer_nonzerop (fold_build2 (GE_EXPR, boolean_type_node,
4050                                       fold_convert (wider_type, period),
4051                                       fold_convert (wider_type, nit))))
4052     return false;
4053
4054   *bound = fold_affine_expr (cand_value_at (loop, cand, use->stmt, nit));
4055   return true;
4056 }
4057
4058 /* Determines cost of basing replacement of USE on CAND in a condition.  */
4059
4060 static bool
4061 determine_use_iv_cost_condition (struct ivopts_data *data,
4062                                  struct iv_use *use, struct iv_cand *cand)
4063 {
4064   tree bound = NULL_TREE, op, cond;
4065   bitmap depends_on = NULL;
4066   unsigned cost;
4067
4068   /* Only consider real candidates.  */
4069   if (!cand->iv)
4070     {
4071       set_use_iv_cost (data, use, cand, INFTY, NULL, NULL_TREE);
4072       return false;
4073     }
4074
4075   if (may_eliminate_iv (data, use, cand, &bound))
4076     {
4077       cost = force_var_cost (data, bound, &depends_on);
4078
4079       set_use_iv_cost (data, use, cand, cost, depends_on, bound);
4080       return cost != INFTY;
4081     }
4082
4083   /* The induction variable elimination failed; just express the original
4084      giv.  If it is compared with an invariant, note that we cannot get
4085      rid of it.  */
4086   cost = get_computation_cost (data, use, cand, false, &depends_on);
4087
4088   cond = *use->op_p;
4089   if (TREE_CODE (cond) != SSA_NAME)
4090     {
4091       op = TREE_OPERAND (cond, 0);
4092       if (TREE_CODE (op) == SSA_NAME && !zero_p (get_iv (data, op)->step))
4093         op = TREE_OPERAND (cond, 1);
4094       if (TREE_CODE (op) == SSA_NAME)
4095         {
4096           op = get_iv (data, op)->base;
4097           fd_ivopts_data = data;
4098           walk_tree (&op, find_depends, &depends_on, NULL);
4099         }
4100     }
4101
4102   set_use_iv_cost (data, use, cand, cost, depends_on, NULL);
4103   return cost != INFTY;
4104 }
4105
4106 /* Determines cost of basing replacement of USE on CAND.  Returns false
4107    if USE cannot be based on CAND.  */
4108
4109 static bool
4110 determine_use_iv_cost (struct ivopts_data *data,
4111                        struct iv_use *use, struct iv_cand *cand)
4112 {
4113   switch (use->type)
4114     {
4115     case USE_NONLINEAR_EXPR:
4116       return determine_use_iv_cost_generic (data, use, cand);
4117
4118     case USE_ADDRESS:
4119       return determine_use_iv_cost_address (data, use, cand);
4120
4121     case USE_COMPARE:
4122       return determine_use_iv_cost_condition (data, use, cand);
4123
4124     default:
4125       gcc_unreachable ();
4126     }
4127 }
4128
4129 /* Determines costs of basing the use of the iv on an iv candidate.  */
4130
4131 static void
4132 determine_use_iv_costs (struct ivopts_data *data)
4133 {
4134   unsigned i, j;
4135   struct iv_use *use;
4136   struct iv_cand *cand;
4137   bitmap to_clear = BITMAP_ALLOC (NULL);
4138
4139   alloc_use_cost_map (data);
4140
4141   for (i = 0; i < n_iv_uses (data); i++)
4142     {
4143       use = iv_use (data, i);
4144
4145       if (data->consider_all_candidates)
4146         {
4147           for (j = 0; j < n_iv_cands (data); j++)
4148             {
4149               cand = iv_cand (data, j);
4150               determine_use_iv_cost (data, use, cand);
4151             }
4152         }
4153       else
4154         {
4155           bitmap_iterator bi;
4156
4157           EXECUTE_IF_SET_IN_BITMAP (use->related_cands, 0, j, bi)
4158             {
4159               cand = iv_cand (data, j);
4160               if (!determine_use_iv_cost (data, use, cand))
4161                 bitmap_set_bit (to_clear, j);
4162             }
4163
4164           /* Remove the candidates for that the cost is infinite from
4165              the list of related candidates.  */
4166           bitmap_and_compl_into (use->related_cands, to_clear);
4167           bitmap_clear (to_clear);
4168         }
4169     }
4170
4171   BITMAP_FREE (to_clear);
4172
4173   if (dump_file && (dump_flags & TDF_DETAILS))
4174     {
4175       fprintf (dump_file, "Use-candidate costs:\n");
4176
4177       for (i = 0; i < n_iv_uses (data); i++)
4178         {
4179           use = iv_use (data, i);
4180
4181           fprintf (dump_file, "Use %d:\n", i);
4182           fprintf (dump_file, "  cand\tcost\tdepends on\n");
4183           for (j = 0; j < use->n_map_members; j++)
4184             {
4185               if (!use->cost_map[j].cand
4186                   || use->cost_map[j].cost == INFTY)
4187                 continue;
4188
4189               fprintf (dump_file, "  %d\t%d\t",
4190                        use->cost_map[j].cand->id,
4191                        use->cost_map[j].cost);
4192               if (use->cost_map[j].depends_on)
4193                 bitmap_print (dump_file,
4194                               use->cost_map[j].depends_on, "","");
4195               fprintf (dump_file, "\n");
4196             }
4197
4198           fprintf (dump_file, "\n");
4199         }
4200       fprintf (dump_file, "\n");
4201     }
4202 }
4203
4204 /* Determines cost of the candidate CAND.  */
4205
4206 static void
4207 determine_iv_cost (struct ivopts_data *data, struct iv_cand *cand)
4208 {
4209   unsigned cost_base, cost_step;
4210   tree base;
4211
4212   if (!cand->iv)
4213     {
4214       cand->cost = 0;
4215       return;
4216     }
4217
4218   /* There are two costs associated with the candidate -- its increment
4219      and its initialization.  The second is almost negligible for any loop
4220      that rolls enough, so we take it just very little into account.  */
4221
4222   base = cand->iv->base;
4223   cost_base = force_var_cost (data, base, NULL);
4224   cost_step = add_cost (TYPE_MODE (TREE_TYPE (base)));
4225
4226   cand->cost = cost_step + cost_base / AVG_LOOP_NITER (current_loop);
4227
4228   /* Prefer the original iv unless we may gain something by replacing it;
4229      this is not really relevant for artificial ivs created by other
4230      passes.  */
4231   if (cand->pos == IP_ORIGINAL
4232       && !DECL_ARTIFICIAL (SSA_NAME_VAR (cand->var_before)))
4233     cand->cost--;
4234
4235   /* Prefer not to insert statements into latch unless there are some
4236      already (so that we do not create unnecessary jumps).  */
4237   if (cand->pos == IP_END
4238       && empty_block_p (ip_end_pos (data->current_loop)))
4239     cand->cost++;
4240 }
4241
4242 /* Determines costs of computation of the candidates.  */
4243
4244 static void
4245 determine_iv_costs (struct ivopts_data *data)
4246 {
4247   unsigned i;
4248
4249   if (dump_file && (dump_flags & TDF_DETAILS))
4250     {
4251       fprintf (dump_file, "Candidate costs:\n");
4252       fprintf (dump_file, "  cand\tcost\n");
4253     }
4254
4255   for (i = 0; i < n_iv_cands (data); i++)
4256     {
4257       struct iv_cand *cand = iv_cand (data, i);
4258
4259       determine_iv_cost (data, cand);
4260
4261       if (dump_file && (dump_flags & TDF_DETAILS))
4262         fprintf (dump_file, "  %d\t%d\n", i, cand->cost);
4263     }
4264
4265 if (dump_file && (dump_flags & TDF_DETAILS))
4266       fprintf (dump_file, "\n");
4267 }
4268
4269 /* Calculates cost for having SIZE induction variables.  */
4270
4271 static unsigned
4272 ivopts_global_cost_for_size (struct ivopts_data *data, unsigned size)
4273 {
4274   return global_cost_for_size (size, data->regs_used, n_iv_uses (data));
4275 }
4276
4277 /* For each size of the induction variable set determine the penalty.  */
4278
4279 static void
4280 determine_set_costs (struct ivopts_data *data)
4281 {
4282   unsigned j, n;
4283   tree phi, op;
4284   struct loop *loop = data->current_loop;
4285   bitmap_iterator bi;
4286
4287   /* We use the following model (definitely improvable, especially the
4288      cost function -- TODO):
4289
4290      We estimate the number of registers available (using MD data), name it A.
4291
4292      We estimate the number of registers used by the loop, name it U.  This
4293      number is obtained as the number of loop phi nodes (not counting virtual
4294      registers and bivs) + the number of variables from outside of the loop.
4295
4296      We set a reserve R (free regs that are used for temporary computations,
4297      etc.).  For now the reserve is a constant 3.
4298
4299      Let I be the number of induction variables.
4300
4301      -- if U + I + R <= A, the cost is I * SMALL_COST (just not to encourage
4302         make a lot of ivs without a reason).
4303      -- if A - R < U + I <= A, the cost is I * PRES_COST
4304      -- if U + I > A, the cost is I * PRES_COST and
4305         number of uses * SPILL_COST * (U + I - A) / (U + I) is added.  */
4306
4307   if (dump_file && (dump_flags & TDF_DETAILS))
4308     {
4309       fprintf (dump_file, "Global costs:\n");
4310       fprintf (dump_file, "  target_avail_regs %d\n", target_avail_regs);
4311       fprintf (dump_file, "  target_small_cost %d\n", target_small_cost);
4312       fprintf (dump_file, "  target_pres_cost %d\n", target_pres_cost);
4313       fprintf (dump_file, "  target_spill_cost %d\n", target_spill_cost);
4314     }
4315
4316   n = 0;
4317   for (phi = phi_nodes (loop->header); phi; phi = PHI_CHAIN (phi))
4318     {
4319       op = PHI_RESULT (phi);
4320
4321       if (!is_gimple_reg (op))
4322         continue;
4323
4324       if (get_iv (data, op))
4325         continue;
4326
4327       n++;
4328     }
4329
4330   EXECUTE_IF_SET_IN_BITMAP (data->relevant, 0, j, bi)
4331     {
4332       struct version_info *info = ver_info (data, j);
4333
4334       if (info->inv_id && info->has_nonlin_use)
4335         n++;
4336     }
4337
4338   data->regs_used = n;
4339   if (dump_file && (dump_flags & TDF_DETAILS))
4340     fprintf (dump_file, "  regs_used %d\n", n);
4341
4342   if (dump_file && (dump_flags & TDF_DETAILS))
4343     {
4344       fprintf (dump_file, "  cost for size:\n");
4345       fprintf (dump_file, "  ivs\tcost\n");
4346       for (j = 0; j <= 2 * target_avail_regs; j++)
4347         fprintf (dump_file, "  %d\t%d\n", j,
4348                  ivopts_global_cost_for_size (data, j));
4349       fprintf (dump_file, "\n");
4350     }
4351 }
4352
4353 /* Returns true if A is a cheaper cost pair than B.  */
4354
4355 static bool
4356 cheaper_cost_pair (struct cost_pair *a, struct cost_pair *b)
4357 {
4358   if (!a)
4359     return false;
4360
4361   if (!b)
4362     return true;
4363
4364   if (a->cost < b->cost)
4365     return true;
4366
4367   if (a->cost > b->cost)
4368     return false;
4369
4370   /* In case the costs are the same, prefer the cheaper candidate.  */
4371   if (a->cand->cost < b->cand->cost)
4372     return true;
4373
4374   return false;
4375 }
4376
4377 /* Computes the cost field of IVS structure.  */
4378
4379 static void
4380 iv_ca_recount_cost (struct ivopts_data *data, struct iv_ca *ivs)
4381 {
4382   unsigned cost = 0;
4383
4384   cost += ivs->cand_use_cost;
4385   cost += ivs->cand_cost;
4386   cost += ivopts_global_cost_for_size (data, ivs->n_regs);
4387
4388   ivs->cost = cost;
4389 }
4390
4391 /* Remove invariants in set INVS to set IVS.  */
4392
4393 static void
4394 iv_ca_set_remove_invariants (struct iv_ca *ivs, bitmap invs)
4395 {
4396   bitmap_iterator bi;
4397   unsigned iid;
4398
4399   if (!invs)
4400     return;
4401
4402   EXECUTE_IF_SET_IN_BITMAP (invs, 0, iid, bi)
4403     {
4404       ivs->n_invariant_uses[iid]--;
4405       if (ivs->n_invariant_uses[iid] == 0)
4406         ivs->n_regs--;
4407     }
4408 }
4409
4410 /* Set USE not to be expressed by any candidate in IVS.  */
4411
4412 static void
4413 iv_ca_set_no_cp (struct ivopts_data *data, struct iv_ca *ivs,
4414                  struct iv_use *use)
4415 {
4416   unsigned uid = use->id, cid;
4417   struct cost_pair *cp;
4418
4419   cp = ivs->cand_for_use[uid];
4420   if (!cp)
4421     return;
4422   cid = cp->cand->id;
4423
4424   ivs->bad_uses++;
4425   ivs->cand_for_use[uid] = NULL;
4426   ivs->n_cand_uses[cid]--;
4427
4428   if (ivs->n_cand_uses[cid] == 0)
4429     {
4430       bitmap_clear_bit (ivs->cands, cid);
4431       /* Do not count the pseudocandidates.  */
4432       if (cp->cand->iv)
4433         ivs->n_regs--;
4434       ivs->n_cands--;
4435       ivs->cand_cost -= cp->cand->cost;
4436
4437       iv_ca_set_remove_invariants (ivs, cp->cand->depends_on);
4438     }
4439
4440   ivs->cand_use_cost -= cp->cost;
4441
4442   iv_ca_set_remove_invariants (ivs, cp->depends_on);
4443   iv_ca_recount_cost (data, ivs);
4444 }
4445
4446 /* Add invariants in set INVS to set IVS.  */
4447
4448 static void
4449 iv_ca_set_add_invariants (struct iv_ca *ivs, bitmap invs)
4450 {
4451   bitmap_iterator bi;
4452   unsigned iid;
4453
4454   if (!invs)
4455     return;
4456
4457   EXECUTE_IF_SET_IN_BITMAP (invs, 0, iid, bi)
4458     {
4459       ivs->n_invariant_uses[iid]++;
4460       if (ivs->n_invariant_uses[iid] == 1)
4461         ivs->n_regs++;
4462     }
4463 }
4464
4465 /* Set cost pair for USE in set IVS to CP.  */
4466
4467 static void
4468 iv_ca_set_cp (struct ivopts_data *data, struct iv_ca *ivs,
4469               struct iv_use *use, struct cost_pair *cp)
4470 {
4471   unsigned uid = use->id, cid;
4472
4473   if (ivs->cand_for_use[uid] == cp)
4474     return;
4475
4476   if (ivs->cand_for_use[uid])
4477     iv_ca_set_no_cp (data, ivs, use);
4478
4479   if (cp)
4480     {
4481       cid = cp->cand->id;
4482
4483       ivs->bad_uses--;
4484       ivs->cand_for_use[uid] = cp;
4485       ivs->n_cand_uses[cid]++;
4486       if (ivs->n_cand_uses[cid] == 1)
4487         {
4488           bitmap_set_bit (ivs->cands, cid);
4489           /* Do not count the pseudocandidates.  */
4490           if (cp->cand->iv)
4491             ivs->n_regs++;
4492           ivs->n_cands++;
4493           ivs->cand_cost += cp->cand->cost;
4494
4495           iv_ca_set_add_invariants (ivs, cp->cand->depends_on);
4496         }
4497
4498       ivs->cand_use_cost += cp->cost;
4499       iv_ca_set_add_invariants (ivs, cp->depends_on);
4500       iv_ca_recount_cost (data, ivs);
4501     }
4502 }
4503
4504 /* Extend set IVS by expressing USE by some of the candidates in it
4505    if possible.  */
4506
4507 static void
4508 iv_ca_add_use (struct ivopts_data *data, struct iv_ca *ivs,
4509                struct iv_use *use)
4510 {
4511   struct cost_pair *best_cp = NULL, *cp;
4512   bitmap_iterator bi;
4513   unsigned i;
4514
4515   gcc_assert (ivs->upto >= use->id);
4516
4517   if (ivs->upto == use->id)
4518     {
4519       ivs->upto++;
4520       ivs->bad_uses++;
4521     }
4522
4523   EXECUTE_IF_SET_IN_BITMAP (ivs->cands, 0, i, bi)
4524     {
4525       cp = get_use_iv_cost (data, use, iv_cand (data, i));
4526
4527       if (cheaper_cost_pair (cp, best_cp))
4528         best_cp = cp;
4529     }
4530
4531   iv_ca_set_cp (data, ivs, use, best_cp);
4532 }
4533
4534 /* Get cost for assignment IVS.  */
4535
4536 static unsigned
4537 iv_ca_cost (struct iv_ca *ivs)
4538 {
4539   return (ivs->bad_uses ? INFTY : ivs->cost);
4540 }
4541
4542 /* Returns true if all dependences of CP are among invariants in IVS.  */
4543
4544 static bool
4545 iv_ca_has_deps (struct iv_ca *ivs, struct cost_pair *cp)
4546 {
4547   unsigned i;
4548   bitmap_iterator bi;
4549
4550   if (!cp->depends_on)
4551     return true;
4552
4553   EXECUTE_IF_SET_IN_BITMAP (cp->depends_on, 0, i, bi)
4554     {
4555       if (ivs->n_invariant_uses[i] == 0)
4556         return false;
4557     }
4558
4559   return true;
4560 }
4561
4562 /* Creates change of expressing USE by NEW_CP instead of OLD_CP and chains
4563    it before NEXT_CHANGE.  */
4564
4565 static struct iv_ca_delta *
4566 iv_ca_delta_add (struct iv_use *use, struct cost_pair *old_cp,
4567                  struct cost_pair *new_cp, struct iv_ca_delta *next_change)
4568 {
4569   struct iv_ca_delta *change = XNEW (struct iv_ca_delta);
4570
4571   change->use = use;
4572   change->old_cp = old_cp;
4573   change->new_cp = new_cp;
4574   change->next_change = next_change;
4575
4576   return change;
4577 }
4578
4579 /* Joins two lists of changes L1 and L2.  Destructive -- old lists
4580    are rewritten.  */
4581
4582 static struct iv_ca_delta *
4583 iv_ca_delta_join (struct iv_ca_delta *l1, struct iv_ca_delta *l2)
4584 {
4585   struct iv_ca_delta *last;
4586
4587   if (!l2)
4588     return l1;
4589
4590   if (!l1)
4591     return l2;
4592
4593   for (last = l1; last->next_change; last = last->next_change)
4594     continue;
4595   last->next_change = l2;
4596
4597   return l1;
4598 }
4599
4600 /* Returns candidate by that USE is expressed in IVS.  */
4601
4602 static struct cost_pair *
4603 iv_ca_cand_for_use (struct iv_ca *ivs, struct iv_use *use)
4604 {
4605   return ivs->cand_for_use[use->id];
4606 }
4607
4608 /* Reverse the list of changes DELTA, forming the inverse to it.  */
4609
4610 static struct iv_ca_delta *
4611 iv_ca_delta_reverse (struct iv_ca_delta *delta)
4612 {
4613   struct iv_ca_delta *act, *next, *prev = NULL;
4614   struct cost_pair *tmp;
4615
4616   for (act = delta; act; act = next)
4617     {
4618       next = act->next_change;
4619       act->next_change = prev;
4620       prev = act;
4621
4622       tmp = act->old_cp;
4623       act->old_cp = act->new_cp;
4624       act->new_cp = tmp;
4625     }
4626
4627   return prev;
4628 }
4629
4630 /* Commit changes in DELTA to IVS.  If FORWARD is false, the changes are
4631    reverted instead.  */
4632
4633 static void
4634 iv_ca_delta_commit (struct ivopts_data *data, struct iv_ca *ivs,
4635                     struct iv_ca_delta *delta, bool forward)
4636 {
4637   struct cost_pair *from, *to;
4638   struct iv_ca_delta *act;
4639
4640   if (!forward)
4641     delta = iv_ca_delta_reverse (delta);
4642
4643   for (act = delta; act; act = act->next_change)
4644     {
4645       from = act->old_cp;
4646       to = act->new_cp;
4647       gcc_assert (iv_ca_cand_for_use (ivs, act->use) == from);
4648       iv_ca_set_cp (data, ivs, act->use, to);
4649     }
4650
4651   if (!forward)
4652     iv_ca_delta_reverse (delta);
4653 }
4654
4655 /* Returns true if CAND is used in IVS.  */
4656
4657 static bool
4658 iv_ca_cand_used_p (struct iv_ca *ivs, struct iv_cand *cand)
4659 {
4660   return ivs->n_cand_uses[cand->id] > 0;
4661 }
4662
4663 /* Returns number of induction variable candidates in the set IVS.  */
4664
4665 static unsigned
4666 iv_ca_n_cands (struct iv_ca *ivs)
4667 {
4668   return ivs->n_cands;
4669 }
4670
4671 /* Free the list of changes DELTA.  */
4672
4673 static void
4674 iv_ca_delta_free (struct iv_ca_delta **delta)
4675 {
4676   struct iv_ca_delta *act, *next;
4677
4678   for (act = *delta; act; act = next)
4679     {
4680       next = act->next_change;
4681       free (act);
4682     }
4683
4684   *delta = NULL;
4685 }
4686
4687 /* Allocates new iv candidates assignment.  */
4688
4689 static struct iv_ca *
4690 iv_ca_new (struct ivopts_data *data)
4691 {
4692   struct iv_ca *nw = XNEW (struct iv_ca);
4693
4694   nw->upto = 0;
4695   nw->bad_uses = 0;
4696   nw->cand_for_use = XCNEWVEC (struct cost_pair *, n_iv_uses (data));
4697   nw->n_cand_uses = XCNEWVEC (unsigned, n_iv_cands (data));
4698   nw->cands = BITMAP_ALLOC (NULL);
4699   nw->n_cands = 0;
4700   nw->n_regs = 0;
4701   nw->cand_use_cost = 0;
4702   nw->cand_cost = 0;
4703   nw->n_invariant_uses = XCNEWVEC (unsigned, data->max_inv_id + 1);
4704   nw->cost = 0;
4705
4706   return nw;
4707 }
4708
4709 /* Free memory occupied by the set IVS.  */
4710
4711 static void
4712 iv_ca_free (struct iv_ca **ivs)
4713 {
4714   free ((*ivs)->cand_for_use);
4715   free ((*ivs)->n_cand_uses);
4716   BITMAP_FREE ((*ivs)->cands);
4717   free ((*ivs)->n_invariant_uses);
4718   free (*ivs);
4719   *ivs = NULL;
4720 }
4721
4722 /* Dumps IVS to FILE.  */
4723
4724 static void
4725 iv_ca_dump (struct ivopts_data *data, FILE *file, struct iv_ca *ivs)
4726 {
4727   const char *pref = "  invariants ";
4728   unsigned i;
4729
4730   fprintf (file, "  cost %d\n", iv_ca_cost (ivs));
4731   bitmap_print (file, ivs->cands, "  candidates ","\n");
4732
4733   for (i = 1; i <= data->max_inv_id; i++)
4734     if (ivs->n_invariant_uses[i])
4735       {
4736         fprintf (file, "%s%d", pref, i);
4737         pref = ", ";
4738       }
4739   fprintf (file, "\n");
4740 }
4741
4742 /* Try changing candidate in IVS to CAND for each use.  Return cost of the
4743    new set, and store differences in DELTA.  Number of induction variables
4744    in the new set is stored to N_IVS.  */
4745
4746 static unsigned
4747 iv_ca_extend (struct ivopts_data *data, struct iv_ca *ivs,
4748               struct iv_cand *cand, struct iv_ca_delta **delta,
4749               unsigned *n_ivs)
4750 {
4751   unsigned i, cost;
4752   struct iv_use *use;
4753   struct cost_pair *old_cp, *new_cp;
4754
4755   *delta = NULL;
4756   for (i = 0; i < ivs->upto; i++)
4757     {
4758       use = iv_use (data, i);
4759       old_cp = iv_ca_cand_for_use (ivs, use);
4760
4761       if (old_cp
4762           && old_cp->cand == cand)
4763         continue;
4764
4765       new_cp = get_use_iv_cost (data, use, cand);
4766       if (!new_cp)
4767         continue;
4768
4769       if (!iv_ca_has_deps (ivs, new_cp))
4770         continue;
4771
4772       if (!cheaper_cost_pair (new_cp, old_cp))
4773         continue;
4774
4775       *delta = iv_ca_delta_add (use, old_cp, new_cp, *delta);
4776     }
4777
4778   iv_ca_delta_commit (data, ivs, *delta, true);
4779   cost = iv_ca_cost (ivs);
4780   if (n_ivs)
4781     *n_ivs = iv_ca_n_cands (ivs);
4782   iv_ca_delta_commit (data, ivs, *delta, false);
4783
4784   return cost;
4785 }
4786
4787 /* Try narrowing set IVS by removing CAND.  Return the cost of
4788    the new set and store the differences in DELTA.  */
4789
4790 static unsigned
4791 iv_ca_narrow (struct ivopts_data *data, struct iv_ca *ivs,
4792               struct iv_cand *cand, struct iv_ca_delta **delta)
4793 {
4794   unsigned i, ci;
4795   struct iv_use *use;
4796   struct cost_pair *old_cp, *new_cp, *cp;
4797   bitmap_iterator bi;
4798   struct iv_cand *cnd;
4799   unsigned cost;
4800
4801   *delta = NULL;
4802   for (i = 0; i < n_iv_uses (data); i++)
4803     {
4804       use = iv_use (data, i);
4805
4806       old_cp = iv_ca_cand_for_use (ivs, use);
4807       if (old_cp->cand != cand)
4808         continue;
4809
4810       new_cp = NULL;
4811
4812       if (data->consider_all_candidates)
4813         {
4814           EXECUTE_IF_SET_IN_BITMAP (ivs->cands, 0, ci, bi)
4815             {
4816               if (ci == cand->id)
4817                 continue;
4818
4819               cnd = iv_cand (data, ci);
4820
4821               cp = get_use_iv_cost (data, use, cnd);
4822               if (!cp)
4823                 continue;
4824               if (!iv_ca_has_deps (ivs, cp))
4825                 continue;
4826
4827               if (!cheaper_cost_pair (cp, new_cp))
4828                 continue;
4829
4830               new_cp = cp;
4831             }
4832         }
4833       else
4834         {
4835           EXECUTE_IF_AND_IN_BITMAP (use->related_cands, ivs->cands, 0, ci, bi)
4836             {
4837               if (ci == cand->id)
4838                 continue;
4839
4840               cnd = iv_cand (data, ci);
4841
4842               cp = get_use_iv_cost (data, use, cnd);
4843               if (!cp)
4844                 continue;
4845               if (!iv_ca_has_deps (ivs, cp))
4846                 continue;
4847
4848               if (!cheaper_cost_pair (cp, new_cp))
4849                 continue;
4850
4851               new_cp = cp;
4852             }
4853         }
4854
4855       if (!new_cp)
4856         {
4857           iv_ca_delta_free (delta);
4858           return INFTY;
4859         }
4860
4861       *delta = iv_ca_delta_add (use, old_cp, new_cp, *delta);
4862     }
4863
4864   iv_ca_delta_commit (data, ivs, *delta, true);
4865   cost = iv_ca_cost (ivs);
4866   iv_ca_delta_commit (data, ivs, *delta, false);
4867
4868   return cost;
4869 }
4870
4871 /* Try optimizing the set of candidates IVS by removing candidates different
4872    from to EXCEPT_CAND from it.  Return cost of the new set, and store
4873    differences in DELTA.  */
4874
4875 static unsigned
4876 iv_ca_prune (struct ivopts_data *data, struct iv_ca *ivs,
4877              struct iv_cand *except_cand, struct iv_ca_delta **delta)
4878 {
4879   bitmap_iterator bi;
4880   struct iv_ca_delta *act_delta, *best_delta;
4881   unsigned i, best_cost, acost;
4882   struct iv_cand *cand;
4883
4884   best_delta = NULL;
4885   best_cost = iv_ca_cost (ivs);
4886
4887   EXECUTE_IF_SET_IN_BITMAP (ivs->cands, 0, i, bi)
4888     {
4889       cand = iv_cand (data, i);
4890
4891       if (cand == except_cand)
4892         continue;
4893
4894       acost = iv_ca_narrow (data, ivs, cand, &act_delta);
4895
4896       if (acost < best_cost)
4897         {
4898           best_cost = acost;
4899           iv_ca_delta_free (&best_delta);
4900           best_delta = act_delta;
4901         }
4902       else
4903         iv_ca_delta_free (&act_delta);
4904     }
4905
4906   if (!best_delta)
4907     {
4908       *delta = NULL;
4909       return best_cost;
4910     }
4911
4912   /* Recurse to possibly remove other unnecessary ivs.  */
4913   iv_ca_delta_commit (data, ivs, best_delta, true);
4914   best_cost = iv_ca_prune (data, ivs, except_cand, delta);
4915   iv_ca_delta_commit (data, ivs, best_delta, false);
4916   *delta = iv_ca_delta_join (best_delta, *delta);
4917   return best_cost;
4918 }
4919
4920 /* Tries to extend the sets IVS in the best possible way in order
4921    to express the USE.  */
4922
4923 static bool
4924 try_add_cand_for (struct ivopts_data *data, struct iv_ca *ivs,
4925                   struct iv_use *use)
4926 {
4927   unsigned best_cost, act_cost;
4928   unsigned i;
4929   bitmap_iterator bi;
4930   struct iv_cand *cand;
4931   struct iv_ca_delta *best_delta = NULL, *act_delta;
4932   struct cost_pair *cp;
4933
4934   iv_ca_add_use (data, ivs, use);
4935   best_cost = iv_ca_cost (ivs);
4936
4937   cp = iv_ca_cand_for_use (ivs, use);
4938   if (cp)
4939     {
4940       best_delta = iv_ca_delta_add (use, NULL, cp, NULL);
4941       iv_ca_set_no_cp (data, ivs, use);
4942     }
4943
4944   /* First try important candidates.  Only if it fails, try the specific ones.
4945      Rationale -- in loops with many variables the best choice often is to use
4946      just one generic biv.  If we added here many ivs specific to the uses,
4947      the optimization algorithm later would be likely to get stuck in a local
4948      minimum, thus causing us to create too many ivs.  The approach from
4949      few ivs to more seems more likely to be successful -- starting from few
4950      ivs, replacing an expensive use by a specific iv should always be a
4951      win.  */
4952   EXECUTE_IF_SET_IN_BITMAP (data->important_candidates, 0, i, bi)
4953     {
4954       cand = iv_cand (data, i);
4955
4956       if (iv_ca_cand_used_p (ivs, cand))
4957         continue;
4958
4959       cp = get_use_iv_cost (data, use, cand);
4960       if (!cp)
4961         continue;
4962
4963       iv_ca_set_cp (data, ivs, use, cp);
4964       act_cost = iv_ca_extend (data, ivs, cand, &act_delta, NULL);
4965       iv_ca_set_no_cp (data, ivs, use);
4966       act_delta = iv_ca_delta_add (use, NULL, cp, act_delta);
4967
4968       if (act_cost < best_cost)
4969         {
4970           best_cost = act_cost;
4971
4972           iv_ca_delta_free (&best_delta);
4973           best_delta = act_delta;
4974         }
4975       else
4976         iv_ca_delta_free (&act_delta);
4977     }
4978
4979   if (best_cost == INFTY)
4980     {
4981       for (i = 0; i < use->n_map_members; i++)
4982         {
4983           cp = use->cost_map + i;
4984           cand = cp->cand;
4985           if (!cand)
4986             continue;
4987
4988           /* Already tried this.  */
4989           if (cand->important)
4990             continue;
4991
4992           if (iv_ca_cand_used_p (ivs, cand))
4993             continue;
4994
4995           act_delta = NULL;
4996           iv_ca_set_cp (data, ivs, use, cp);
4997           act_cost = iv_ca_extend (data, ivs, cand, &act_delta, NULL);
4998           iv_ca_set_no_cp (data, ivs, use);
4999           act_delta = iv_ca_delta_add (use, iv_ca_cand_for_use (ivs, use),
5000                                        cp, act_delta);
5001
5002           if (act_cost < best_cost)
5003             {
5004               best_cost = act_cost;
5005
5006               if (best_delta)
5007                 iv_ca_delta_free (&best_delta);
5008               best_delta = act_delta;
5009             }
5010           else
5011             iv_ca_delta_free (&act_delta);
5012         }
5013     }
5014
5015   iv_ca_delta_commit (data, ivs, best_delta, true);
5016   iv_ca_delta_free (&best_delta);
5017
5018   return (best_cost != INFTY);
5019 }
5020
5021 /* Finds an initial assignment of candidates to uses.  */
5022
5023 static struct iv_ca *
5024 get_initial_solution (struct ivopts_data *data)
5025 {
5026   struct iv_ca *ivs = iv_ca_new (data);
5027   unsigned i;
5028
5029   for (i = 0; i < n_iv_uses (data); i++)
5030     if (!try_add_cand_for (data, ivs, iv_use (data, i)))
5031       {
5032         iv_ca_free (&ivs);
5033         return NULL;
5034       }
5035
5036   return ivs;
5037 }
5038
5039 /* Tries to improve set of induction variables IVS.  */
5040
5041 static bool
5042 try_improve_iv_set (struct ivopts_data *data, struct iv_ca *ivs)
5043 {
5044   unsigned i, acost, best_cost = iv_ca_cost (ivs), n_ivs;
5045   struct iv_ca_delta *best_delta = NULL, *act_delta, *tmp_delta;
5046   struct iv_cand *cand;
5047
5048   /* Try extending the set of induction variables by one.  */
5049   for (i = 0; i < n_iv_cands (data); i++)
5050     {
5051       cand = iv_cand (data, i);
5052
5053       if (iv_ca_cand_used_p (ivs, cand))
5054         continue;
5055
5056       acost = iv_ca_extend (data, ivs, cand, &act_delta, &n_ivs);
5057       if (!act_delta)
5058         continue;
5059
5060       /* If we successfully added the candidate and the set is small enough,
5061          try optimizing it by removing other candidates.  */
5062       if (n_ivs <= ALWAYS_PRUNE_CAND_SET_BOUND)
5063         {
5064           iv_ca_delta_commit (data, ivs, act_delta, true);
5065           acost = iv_ca_prune (data, ivs, cand, &tmp_delta);
5066           iv_ca_delta_commit (data, ivs, act_delta, false);
5067           act_delta = iv_ca_delta_join (act_delta, tmp_delta);
5068         }
5069
5070       if (acost < best_cost)
5071         {
5072           best_cost = acost;
5073           iv_ca_delta_free (&best_delta);
5074           best_delta = act_delta;
5075         }
5076       else
5077         iv_ca_delta_free (&act_delta);
5078     }
5079
5080   if (!best_delta)
5081     {
5082       /* Try removing the candidates from the set instead.  */
5083       best_cost = iv_ca_prune (data, ivs, NULL, &best_delta);
5084
5085       /* Nothing more we can do.  */
5086       if (!best_delta)
5087         return false;
5088     }
5089
5090   iv_ca_delta_commit (data, ivs, best_delta, true);
5091   gcc_assert (best_cost == iv_ca_cost (ivs));
5092   iv_ca_delta_free (&best_delta);
5093   return true;
5094 }
5095
5096 /* Attempts to find the optimal set of induction variables.  We do simple
5097    greedy heuristic -- we try to replace at most one candidate in the selected
5098    solution and remove the unused ivs while this improves the cost.  */
5099
5100 static struct iv_ca *
5101 find_optimal_iv_set (struct ivopts_data *data)
5102 {
5103   unsigned i;
5104   struct iv_ca *set;
5105   struct iv_use *use;
5106
5107   /* Get the initial solution.  */
5108   set = get_initial_solution (data);
5109   if (!set)
5110     {
5111       if (dump_file && (dump_flags & TDF_DETAILS))
5112         fprintf (dump_file, "Unable to substitute for ivs, failed.\n");
5113       return NULL;
5114     }
5115
5116   if (dump_file && (dump_flags & TDF_DETAILS))
5117     {
5118       fprintf (dump_file, "Initial set of candidates:\n");
5119       iv_ca_dump (data, dump_file, set);
5120     }
5121
5122   while (try_improve_iv_set (data, set))
5123     {
5124       if (dump_file && (dump_flags & TDF_DETAILS))
5125         {
5126           fprintf (dump_file, "Improved to:\n");
5127           iv_ca_dump (data, dump_file, set);
5128         }
5129     }
5130
5131   if (dump_file && (dump_flags & TDF_DETAILS))
5132     fprintf (dump_file, "Final cost %d\n\n", iv_ca_cost (set));
5133
5134   for (i = 0; i < n_iv_uses (data); i++)
5135     {
5136       use = iv_use (data, i);
5137       use->selected = iv_ca_cand_for_use (set, use)->cand;
5138     }
5139
5140   return set;
5141 }
5142
5143 /* Creates a new induction variable corresponding to CAND.  */
5144
5145 static void
5146 create_new_iv (struct ivopts_data *data, struct iv_cand *cand)
5147 {
5148   block_stmt_iterator incr_pos;
5149   tree base;
5150   bool after = false;
5151
5152   if (!cand->iv)
5153     return;
5154
5155   switch (cand->pos)
5156     {
5157     case IP_NORMAL:
5158       incr_pos = bsi_last (ip_normal_pos (data->current_loop));
5159       break;
5160
5161     case IP_END:
5162       incr_pos = bsi_last (ip_end_pos (data->current_loop));
5163       after = true;
5164       break;
5165
5166     case IP_ORIGINAL:
5167       /* Mark that the iv is preserved.  */
5168       name_info (data, cand->var_before)->preserve_biv = true;
5169       name_info (data, cand->var_after)->preserve_biv = true;
5170
5171       /* Rewrite the increment so that it uses var_before directly.  */
5172       find_interesting_uses_op (data, cand->var_after)->selected = cand;
5173
5174       return;
5175     }
5176
5177   gimple_add_tmp_var (cand->var_before);
5178   add_referenced_var (cand->var_before);
5179
5180   base = unshare_expr (cand->iv->base);
5181
5182   create_iv (base, unshare_expr (cand->iv->step),
5183              cand->var_before, data->current_loop,
5184              &incr_pos, after, &cand->var_before, &cand->var_after);
5185 }
5186
5187 /* Creates new induction variables described in SET.  */
5188
5189 static void
5190 create_new_ivs (struct ivopts_data *data, struct iv_ca *set)
5191 {
5192   unsigned i;
5193   struct iv_cand *cand;
5194   bitmap_iterator bi;
5195
5196   EXECUTE_IF_SET_IN_BITMAP (set->cands, 0, i, bi)
5197     {
5198       cand = iv_cand (data, i);
5199       create_new_iv (data, cand);
5200     }
5201 }
5202
5203 /* Removes statement STMT (real or a phi node).  If INCLUDING_DEFINED_NAME
5204    is true, remove also the ssa name defined by the statement.  */
5205
5206 static void
5207 remove_statement (tree stmt, bool including_defined_name)
5208 {
5209   if (TREE_CODE (stmt) == PHI_NODE)
5210     {
5211       if (!including_defined_name)
5212         {
5213           /* Prevent the ssa name defined by the statement from being removed.  */
5214           SET_PHI_RESULT (stmt, NULL);
5215         }
5216       remove_phi_node (stmt, NULL_TREE);
5217     }
5218   else
5219     {
5220       block_stmt_iterator bsi = bsi_for_stmt (stmt);
5221
5222       bsi_remove (&bsi, true);
5223     }
5224 }
5225
5226 /* Rewrites USE (definition of iv used in a nonlinear expression)
5227    using candidate CAND.  */
5228
5229 static void
5230 rewrite_use_nonlinear_expr (struct ivopts_data *data,
5231                             struct iv_use *use, struct iv_cand *cand)
5232 {
5233   tree comp;
5234   tree op, stmts, tgt, ass;
5235   block_stmt_iterator bsi, pbsi;
5236
5237   /* An important special case -- if we are asked to express value of
5238      the original iv by itself, just exit; there is no need to
5239      introduce a new computation (that might also need casting the
5240      variable to unsigned and back).  */
5241   if (cand->pos == IP_ORIGINAL
5242       && cand->incremented_at == use->stmt)
5243     {
5244       tree step, ctype, utype;
5245       enum tree_code incr_code = PLUS_EXPR;
5246
5247       gcc_assert (TREE_CODE (use->stmt) == MODIFY_EXPR);
5248       gcc_assert (TREE_OPERAND (use->stmt, 0) == cand->var_after);
5249
5250       step = cand->iv->step;
5251       ctype = TREE_TYPE (step);
5252       utype = TREE_TYPE (cand->var_after);
5253       if (TREE_CODE (step) == NEGATE_EXPR)
5254         {
5255           incr_code = MINUS_EXPR;
5256           step = TREE_OPERAND (step, 0);
5257         }
5258
5259       /* Check whether we may leave the computation unchanged.
5260          This is the case only if it does not rely on other
5261          computations in the loop -- otherwise, the computation
5262          we rely upon may be removed in remove_unused_ivs,
5263          thus leading to ICE.  */
5264       op = TREE_OPERAND (use->stmt, 1);
5265       if (TREE_CODE (op) == PLUS_EXPR
5266           || TREE_CODE (op) == MINUS_EXPR)
5267         {
5268           if (TREE_OPERAND (op, 0) == cand->var_before)
5269             op = TREE_OPERAND (op, 1);
5270           else if (TREE_CODE (op) == PLUS_EXPR
5271                    && TREE_OPERAND (op, 1) == cand->var_before)
5272             op = TREE_OPERAND (op, 0);
5273           else
5274             op = NULL_TREE;
5275         }
5276       else
5277         op = NULL_TREE;
5278
5279       if (op
5280           && (TREE_CODE (op) == INTEGER_CST
5281               || operand_equal_p (op, step, 0)))
5282         return;
5283
5284       /* Otherwise, add the necessary computations to express
5285          the iv.  */
5286       op = fold_convert (ctype, cand->var_before);
5287       comp = fold_convert (utype,
5288                            build2 (incr_code, ctype, op,
5289                                    unshare_expr (step)));
5290     }
5291   else
5292     comp = get_computation (data->current_loop, use, cand);
5293
5294   switch (TREE_CODE (use->stmt))
5295     {
5296     case PHI_NODE:
5297       tgt = PHI_RESULT (use->stmt);
5298
5299       /* If we should keep the biv, do not replace it.  */
5300       if (name_info (data, tgt)->preserve_biv)
5301         return;
5302
5303       pbsi = bsi = bsi_start (bb_for_stmt (use->stmt));
5304       while (!bsi_end_p (pbsi)
5305              && TREE_CODE (bsi_stmt (pbsi)) == LABEL_EXPR)
5306         {
5307           bsi = pbsi;
5308           bsi_next (&pbsi);
5309         }
5310       break;
5311
5312     case MODIFY_EXPR:
5313       tgt = TREE_OPERAND (use->stmt, 0);
5314       bsi = bsi_for_stmt (use->stmt);
5315       break;
5316
5317     default:
5318       gcc_unreachable ();
5319     }
5320
5321   op = force_gimple_operand (comp, &stmts, false, SSA_NAME_VAR (tgt));
5322
5323   if (TREE_CODE (use->stmt) == PHI_NODE)
5324     {
5325       if (stmts)
5326         bsi_insert_after (&bsi, stmts, BSI_CONTINUE_LINKING);
5327       ass = build2 (MODIFY_EXPR, TREE_TYPE (tgt), tgt, op);
5328       bsi_insert_after (&bsi, ass, BSI_NEW_STMT);
5329       remove_statement (use->stmt, false);
5330       SSA_NAME_DEF_STMT (tgt) = ass;
5331     }
5332   else
5333     {
5334       if (stmts)
5335         bsi_insert_before (&bsi, stmts, BSI_SAME_STMT);
5336       TREE_OPERAND (use->stmt, 1) = op;
5337     }
5338 }
5339
5340 /* Replaces ssa name in index IDX by its basic variable.  Callback for
5341    for_each_index.  */
5342
5343 static bool
5344 idx_remove_ssa_names (tree base, tree *idx,
5345                       void *data ATTRIBUTE_UNUSED)
5346 {
5347   tree *op;
5348
5349   if (TREE_CODE (*idx) == SSA_NAME)
5350     *idx = SSA_NAME_VAR (*idx);
5351
5352   if (TREE_CODE (base) == ARRAY_REF)
5353     {
5354       op = &TREE_OPERAND (base, 2);
5355       if (*op
5356           && TREE_CODE (*op) == SSA_NAME)
5357         *op = SSA_NAME_VAR (*op);
5358       op = &TREE_OPERAND (base, 3);
5359       if (*op
5360           && TREE_CODE (*op) == SSA_NAME)
5361         *op = SSA_NAME_VAR (*op);
5362     }
5363
5364   return true;
5365 }
5366
5367 /* Unshares REF and replaces ssa names inside it by their basic variables.  */
5368
5369 static tree
5370 unshare_and_remove_ssa_names (tree ref)
5371 {
5372   ref = unshare_expr (ref);
5373   for_each_index (&ref, idx_remove_ssa_names, NULL);
5374
5375   return ref;
5376 }
5377
5378 /* Extract the alias analysis info for the memory reference REF.  There are
5379    several ways how this information may be stored and what precisely is
5380    its semantics depending on the type of the reference, but there always is
5381    somewhere hidden one _DECL node that is used to determine the set of
5382    virtual operands for the reference.  The code below deciphers this jungle
5383    and extracts this single useful piece of information.  */
5384
5385 static tree
5386 get_ref_tag (tree ref, tree orig)
5387 {
5388   tree var = get_base_address (ref);
5389   tree aref = NULL_TREE, tag, sv;
5390   HOST_WIDE_INT offset, size, maxsize;
5391
5392   for (sv = orig; handled_component_p (sv); sv = TREE_OPERAND (sv, 0))
5393     {
5394       aref = get_ref_base_and_extent (sv, &offset, &size, &maxsize);
5395       if (ref)
5396         break;
5397     }
5398
5399   if (aref && SSA_VAR_P (aref) && get_subvars_for_var (aref))
5400     return unshare_expr (sv);
5401
5402   if (!var)
5403     return NULL_TREE;
5404
5405   if (TREE_CODE (var) == INDIRECT_REF)
5406     {
5407       /* If the base is a dereference of a pointer, first check its name memory
5408          tag.  If it does not have one, use its symbol memory tag.  */
5409       var = TREE_OPERAND (var, 0);
5410       if (TREE_CODE (var) != SSA_NAME)
5411         return NULL_TREE;
5412
5413       if (SSA_NAME_PTR_INFO (var))
5414         {
5415           tag = SSA_NAME_PTR_INFO (var)->name_mem_tag;
5416           if (tag)
5417             return tag;
5418         }
5419
5420       var = SSA_NAME_VAR (var);
5421       tag = var_ann (var)->symbol_mem_tag;
5422       gcc_assert (tag != NULL_TREE);
5423       return tag;
5424     }
5425   else
5426     {
5427       if (!DECL_P (var))
5428         return NULL_TREE;
5429
5430       tag = var_ann (var)->symbol_mem_tag;
5431       if (tag)
5432         return tag;
5433
5434       return var;
5435     }
5436 }
5437
5438 /* Copies the reference information from OLD_REF to NEW_REF.  */
5439
5440 static void
5441 copy_ref_info (tree new_ref, tree old_ref)
5442 {
5443   if (TREE_CODE (old_ref) == TARGET_MEM_REF)
5444     copy_mem_ref_info (new_ref, old_ref);
5445   else
5446     {
5447       TMR_ORIGINAL (new_ref) = unshare_and_remove_ssa_names (old_ref);
5448       TMR_TAG (new_ref) = get_ref_tag (old_ref, TMR_ORIGINAL (new_ref));
5449     }
5450 }
5451
5452 /* Rewrites USE (address that is an iv) using candidate CAND.  */
5453
5454 static void
5455 rewrite_use_address (struct ivopts_data *data,
5456                      struct iv_use *use, struct iv_cand *cand)
5457 {
5458   struct affine_tree_combination aff;
5459   block_stmt_iterator bsi = bsi_for_stmt (use->stmt);
5460   tree ref;
5461
5462   get_computation_aff (data->current_loop, use, cand, use->stmt, &aff);
5463   unshare_aff_combination (&aff);
5464
5465   ref = create_mem_ref (&bsi, TREE_TYPE (*use->op_p), &aff);
5466   copy_ref_info (ref, *use->op_p);
5467   *use->op_p = ref;
5468 }
5469
5470 /* Rewrites USE (the condition such that one of the arguments is an iv) using
5471    candidate CAND.  */
5472
5473 static void
5474 rewrite_use_compare (struct ivopts_data *data,
5475                      struct iv_use *use, struct iv_cand *cand)
5476 {
5477   tree comp;
5478   tree *op_p, cond, op, stmts, bound;
5479   block_stmt_iterator bsi = bsi_for_stmt (use->stmt);
5480   enum tree_code compare;
5481   struct cost_pair *cp = get_use_iv_cost (data, use, cand);
5482
5483   bound = cp->value;
5484   if (bound)
5485     {
5486       tree var = var_at_stmt (data->current_loop, cand, use->stmt);
5487       tree var_type = TREE_TYPE (var);
5488
5489       compare = iv_elimination_compare (data, use);
5490       bound = fold_convert (var_type, bound);
5491       op = force_gimple_operand (unshare_expr (bound), &stmts,
5492                                  true, NULL_TREE);
5493
5494       if (stmts)
5495         bsi_insert_before (&bsi, stmts, BSI_SAME_STMT);
5496
5497       *use->op_p = build2 (compare, boolean_type_node, var, op);
5498       update_stmt (use->stmt);
5499       return;
5500     }
5501
5502   /* The induction variable elimination failed; just express the original
5503      giv.  */
5504   comp = get_computation (data->current_loop, use, cand);
5505
5506   cond = *use->op_p;
5507   op_p = &TREE_OPERAND (cond, 0);
5508   if (TREE_CODE (*op_p) != SSA_NAME
5509       || zero_p (get_iv (data, *op_p)->step))
5510     op_p = &TREE_OPERAND (cond, 1);
5511
5512   op = force_gimple_operand (comp, &stmts, true, SSA_NAME_VAR (*op_p));
5513   if (stmts)
5514     bsi_insert_before (&bsi, stmts, BSI_SAME_STMT);
5515
5516   *op_p = op;
5517 }
5518
5519 /* Rewrites USE using candidate CAND.  */
5520
5521 static void
5522 rewrite_use (struct ivopts_data *data,
5523              struct iv_use *use, struct iv_cand *cand)
5524 {
5525   switch (use->type)
5526     {
5527       case USE_NONLINEAR_EXPR:
5528         rewrite_use_nonlinear_expr (data, use, cand);
5529         break;
5530
5531       case USE_ADDRESS:
5532         rewrite_use_address (data, use, cand);
5533         break;
5534
5535       case USE_COMPARE:
5536         rewrite_use_compare (data, use, cand);
5537         break;
5538
5539       default:
5540         gcc_unreachable ();
5541     }
5542   mark_new_vars_to_rename (use->stmt);
5543 }
5544
5545 /* Rewrite the uses using the selected induction variables.  */
5546
5547 static void
5548 rewrite_uses (struct ivopts_data *data)
5549 {
5550   unsigned i;
5551   struct iv_cand *cand;
5552   struct iv_use *use;
5553
5554   for (i = 0; i < n_iv_uses (data); i++)
5555     {
5556       use = iv_use (data, i);
5557       cand = use->selected;
5558       gcc_assert (cand);
5559
5560       rewrite_use (data, use, cand);
5561     }
5562 }
5563
5564 /* Removes the ivs that are not used after rewriting.  */
5565
5566 static void
5567 remove_unused_ivs (struct ivopts_data *data)
5568 {
5569   unsigned j;
5570   bitmap_iterator bi;
5571
5572   EXECUTE_IF_SET_IN_BITMAP (data->relevant, 0, j, bi)
5573     {
5574       struct version_info *info;
5575
5576       info = ver_info (data, j);
5577       if (info->iv
5578           && !zero_p (info->iv->step)
5579           && !info->inv_id
5580           && !info->iv->have_use_for
5581           && !info->preserve_biv)
5582         remove_statement (SSA_NAME_DEF_STMT (info->iv->ssa_name), true);
5583     }
5584 }
5585
5586 /* Frees data allocated by the optimization of a single loop.  */
5587
5588 static void
5589 free_loop_data (struct ivopts_data *data)
5590 {
5591   unsigned i, j;
5592   bitmap_iterator bi;
5593   tree obj;
5594
5595   htab_empty (data->niters);
5596
5597   EXECUTE_IF_SET_IN_BITMAP (data->relevant, 0, i, bi)
5598     {
5599       struct version_info *info;
5600
5601       info = ver_info (data, i);
5602       if (info->iv)
5603         free (info->iv);
5604       info->iv = NULL;
5605       info->has_nonlin_use = false;
5606       info->preserve_biv = false;
5607       info->inv_id = 0;
5608     }
5609   bitmap_clear (data->relevant);
5610   bitmap_clear (data->important_candidates);
5611
5612   for (i = 0; i < n_iv_uses (data); i++)
5613     {
5614       struct iv_use *use = iv_use (data, i);
5615
5616       free (use->iv);
5617       BITMAP_FREE (use->related_cands);
5618       for (j = 0; j < use->n_map_members; j++)
5619         if (use->cost_map[j].depends_on)
5620           BITMAP_FREE (use->cost_map[j].depends_on);
5621       free (use->cost_map);
5622       free (use);
5623     }
5624   VEC_truncate (iv_use_p, data->iv_uses, 0);
5625
5626   for (i = 0; i < n_iv_cands (data); i++)
5627     {
5628       struct iv_cand *cand = iv_cand (data, i);
5629
5630       if (cand->iv)
5631         free (cand->iv);
5632       if (cand->depends_on)
5633         BITMAP_FREE (cand->depends_on);
5634       free (cand);
5635     }
5636   VEC_truncate (iv_cand_p, data->iv_candidates, 0);
5637
5638   if (data->version_info_size < num_ssa_names)
5639     {
5640       data->version_info_size = 2 * num_ssa_names;
5641       free (data->version_info);
5642       data->version_info = XCNEWVEC (struct version_info, data->version_info_size);
5643     }
5644
5645   data->max_inv_id = 0;
5646
5647   for (i = 0; VEC_iterate (tree, decl_rtl_to_reset, i, obj); i++)
5648     SET_DECL_RTL (obj, NULL_RTX);
5649
5650   VEC_truncate (tree, decl_rtl_to_reset, 0);
5651 }
5652
5653 /* Finalizes data structures used by the iv optimization pass.  LOOPS is the
5654    loop tree.  */
5655
5656 static void
5657 tree_ssa_iv_optimize_finalize (struct ivopts_data *data)
5658 {
5659   free_loop_data (data);
5660   free (data->version_info);
5661   BITMAP_FREE (data->relevant);
5662   BITMAP_FREE (data->important_candidates);
5663   htab_delete (data->niters);
5664
5665   VEC_free (tree, heap, decl_rtl_to_reset);
5666   VEC_free (iv_use_p, heap, data->iv_uses);
5667   VEC_free (iv_cand_p, heap, data->iv_candidates);
5668 }
5669
5670 /* Optimizes the LOOP.  Returns true if anything changed.  */
5671
5672 static bool
5673 tree_ssa_iv_optimize_loop (struct ivopts_data *data, struct loop *loop)
5674 {
5675   bool changed = false;
5676   struct iv_ca *iv_ca;
5677   edge exit;
5678
5679   data->current_loop = loop;
5680
5681   if (dump_file && (dump_flags & TDF_DETAILS))
5682     {
5683       fprintf (dump_file, "Processing loop %d\n", loop->num);
5684
5685       exit = single_dom_exit (loop);
5686       if (exit)
5687         {
5688           fprintf (dump_file, "  single exit %d -> %d, exit condition ",
5689                    exit->src->index, exit->dest->index);
5690           print_generic_expr (dump_file, last_stmt (exit->src), TDF_SLIM);
5691           fprintf (dump_file, "\n");
5692         }
5693
5694       fprintf (dump_file, "\n");
5695     }
5696
5697   /* For each ssa name determines whether it behaves as an induction variable
5698      in some loop.  */
5699   if (!find_induction_variables (data))
5700     goto finish;
5701
5702   /* Finds interesting uses (item 1).  */
5703   find_interesting_uses (data);
5704   if (n_iv_uses (data) > MAX_CONSIDERED_USES)
5705     goto finish;
5706
5707   /* Finds candidates for the induction variables (item 2).  */
5708   find_iv_candidates (data);
5709
5710   /* Calculates the costs (item 3, part 1).  */
5711   determine_use_iv_costs (data);
5712   determine_iv_costs (data);
5713   determine_set_costs (data);
5714
5715   /* Find the optimal set of induction variables (item 3, part 2).  */
5716   iv_ca = find_optimal_iv_set (data);
5717   if (!iv_ca)
5718     goto finish;
5719   changed = true;
5720
5721   /* Create the new induction variables (item 4, part 1).  */
5722   create_new_ivs (data, iv_ca);
5723   iv_ca_free (&iv_ca);
5724
5725   /* Rewrite the uses (item 4, part 2).  */
5726   rewrite_uses (data);
5727
5728   /* Remove the ivs that are unused after rewriting.  */
5729   remove_unused_ivs (data);
5730
5731   /* We have changed the structure of induction variables; it might happen
5732      that definitions in the scev database refer to some of them that were
5733      eliminated.  */
5734   scev_reset ();
5735
5736 finish:
5737   free_loop_data (data);
5738
5739   return changed;
5740 }
5741
5742 /* Main entry point.  Optimizes induction variables in LOOPS.  */
5743
5744 void
5745 tree_ssa_iv_optimize (struct loops *loops)
5746 {
5747   struct loop *loop;
5748   struct ivopts_data data;
5749
5750   tree_ssa_iv_optimize_init (&data);
5751
5752   /* Optimize the loops starting with the innermost ones.  */
5753   loop = loops->tree_root;
5754   while (loop->inner)
5755     loop = loop->inner;
5756
5757   /* Scan the loops, inner ones first.  */
5758   while (loop != loops->tree_root)
5759     {
5760       if (dump_file && (dump_flags & TDF_DETAILS))
5761         flow_loop_dump (loop, dump_file, NULL, 1);
5762
5763       tree_ssa_iv_optimize_loop (&data, loop);
5764
5765       if (loop->next)
5766         {
5767           loop = loop->next;
5768           while (loop->inner)
5769             loop = loop->inner;
5770         }
5771       else
5772         loop = loop->outer;
5773     }
5774
5775   tree_ssa_iv_optimize_finalize (&data);
5776 }