/* Perform various loop optimizations, including strength reduction.
   Copyright (C) 1987, 1988, 1989, 1991, 1992, 1993, 1994, 1995,
   1996, 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004, 2005
   Free Software Foundation, Inc.

This file is part of GCC.

GCC is free software; you can redistribute it and/or modify it under
the terms of the GNU General Public License as published by the Free
Software Foundation; either version 2, or (at your option) any later
version.

GCC is distributed in the hope that it will be useful, but WITHOUT ANY
WARRANTY; without even the implied warranty of MERCHANTABILITY or
FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
for more details.

You should have received a copy of the GNU General Public License
along with GCC; see the file COPYING.  If not, write to the Free
Software Foundation, 59 Temple Place - Suite 330, Boston, MA
02111-1307, USA.  */
/* This is the loop optimization pass of the compiler.
   It finds invariant computations within loops and moves them
   to the beginning of the loop.  Then it identifies basic and
   general induction variables.

   Basic induction variables (BIVs) are pseudo registers that are set
   within a loop only by incrementing or decrementing their value.
   General induction variables (GIVs) are pseudo registers whose value
   is a linear function of a basic induction variable.  BIVs are
   recognized by `basic_induction_var'; GIVs by `general_induction_var'.

   Once induction variables are identified, strength reduction is
   applied to the general induction variables, and induction variable
   elimination is applied to the basic induction variables.

   It also finds cases where a register is set within the loop by
   zero-extending a narrower value and changes these to zero the entire
   register once before the loop and merely copy the low part within
   the loop.

   Most of the complexity is in heuristics to decide when it is worth
   while to do these things.  */
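
/* For example, in a loop like

       for (i = 0; i < n; i++)
         a[i] = 0;

   the counter `i' is a biv (it is only ever incremented), and the
   address computation `a + i * 4' (assuming 4-byte elements) is a giv,
   a linear function of `i'.  Strength reduction keeps a pointer that
   starts at `a' and is bumped by 4 each iteration instead of redoing
   the multiply, and induction variable elimination can then rewrite
   the exit test in terms of that pointer, removing `i' entirely.  */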
46 #include "config.h"
47 #include "system.h"
48 #include "coretypes.h"
49 #include "tm.h"
50 #include "rtl.h"
51 #include "tm_p.h"
52 #include "function.h"
53 #include "expr.h"
54 #include "hard-reg-set.h"
55 #include "basic-block.h"
56 #include "insn-config.h"
57 #include "regs.h"
58 #include "recog.h"
59 #include "flags.h"
60 #include "real.h"
61 #include "cselib.h"
62 #include "except.h"
63 #include "toplev.h"
64 #include "predict.h"
65 #include "insn-flags.h"
66 #include "optabs.h"
67 #include "cfgloop.h"
68 #include "ggc.h"
/* Get the loop info pointer of a loop.  */
#define LOOP_INFO(LOOP) ((struct loop_info *) (LOOP)->aux)

/* Get a pointer to the loop movables structure.  */
#define LOOP_MOVABLES(LOOP) (&LOOP_INFO (LOOP)->movables)

/* Get a pointer to the loop registers structure.  */
#define LOOP_REGS(LOOP) (&LOOP_INFO (LOOP)->regs)

/* Get a pointer to the loop induction variables structure.  */
#define LOOP_IVS(LOOP) (&LOOP_INFO (LOOP)->ivs)
/* Get the luid of an insn.  Catch the error of trying to reference the LUID
   of an insn added during loop, since these don't have LUIDs.  */

#define INSN_LUID(INSN) \
  (gcc_assert (INSN_UID (INSN) < max_uid_for_loop), uid_luid[INSN_UID (INSN)])

#define REGNO_FIRST_LUID(REGNO) \
  (REGNO_FIRST_UID (REGNO) < max_uid_for_loop \
   ? uid_luid[REGNO_FIRST_UID (REGNO)] \
   : 0)
#define REGNO_LAST_LUID(REGNO) \
  (REGNO_LAST_UID (REGNO) < max_uid_for_loop \
   ? uid_luid[REGNO_LAST_UID (REGNO)] \
   : INT_MAX)
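
/* Note that the 0 and INT_MAX fallbacks above are deliberately
   conservative: a register whose first or last use is in an insn created
   during loop optimization (uid >= max_uid_for_loop) is treated as live
   from before the loop until after it, so tests such as LOOP_REG_GLOBAL_P
   below err on the safe side for such registers.  */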
97 /* A "basic induction variable" or biv is a pseudo reg that is set
98 (within this loop) only by incrementing or decrementing it. */
99 /* A "general induction variable" or giv is a pseudo reg whose
100 value is a linear function of a biv. */
102 /* Bivs are recognized by `basic_induction_var';
103 Givs by `general_induction_var'. */
/* An enum for the two different types of givs, those that are used
   as memory addresses and those that are calculated into registers.  */
enum g_types
{
  DEST_ADDR,
  DEST_REG
};
/* A `struct induction' is created for every instruction that sets
   an induction variable (either a biv or a giv).  */

struct induction
{
  rtx insn;                     /* The insn that sets a biv or giv */
  rtx new_reg;                  /* New register, containing strength reduced
                                   version of this giv.  */
  rtx src_reg;                  /* Biv from which this giv is computed.
                                   (If this is a biv, then this is the biv.)  */
  enum g_types giv_type;        /* Indicate whether DEST_ADDR or DEST_REG */
  rtx dest_reg;                 /* Destination register for insn: this is the
                                   register which was the biv or giv.
                                   For a biv, this equals src_reg.
                                   For a DEST_ADDR type giv, this is 0.  */
  rtx *location;                /* Place in the insn where this giv occurs.
                                   If GIV_TYPE is DEST_REG, this is 0.  */
                                /* For a biv, this is the place where add_val
                                   was found.  */
  enum machine_mode mode;       /* The mode of this biv or giv */
  rtx mem;                      /* For DEST_ADDR, the memory object.  */
  rtx mult_val;                 /* Multiplicative factor for src_reg.  */
  rtx add_val;                  /* Additive constant for that product.  */
  int benefit;                  /* Gain from eliminating this insn.  */
  rtx final_value;              /* If the giv is used outside the loop, and its
                                   final value could be calculated, it is put
                                   here, and the giv is made replaceable.  Set
                                   the giv to this value before the loop.  */
  unsigned combined_with;       /* The number of givs this giv has been
                                   combined with.  If nonzero, this giv
                                   cannot combine with any other giv.  */
  unsigned replaceable : 1;     /* 1 if we can substitute the strength-reduced
                                   variable for the original variable.
                                   0 means they must be kept separate and the
                                   new one must be copied into the old pseudo
                                   reg each time the old one is set.  */
  unsigned not_replaceable : 1; /* Used to prevent duplicating work.  This is
                                   1 if we know that the giv definitely can
                                   not be made replaceable, in which case we
                                   don't bother checking the variable again
                                   even if further info is available.
                                   Both this and the above can be zero.  */
  unsigned ignore : 1;          /* 1 prohibits further processing of giv */
  unsigned always_computable : 1; /* 1 if this value is computable every
                                     iteration.  */
  unsigned always_executed : 1; /* 1 if this set occurs each iteration.  */
  unsigned maybe_multiple : 1;  /* Only used for a biv and 1 if this biv
                                   update may be done multiple times per
                                   iteration.  */
  unsigned cant_derive : 1;     /* For giv's, 1 if this giv cannot derive
                                   another giv.  This occurs in many cases
                                   where a giv's lifetime spans an update to
                                   a biv.  */
  unsigned maybe_dead : 1;      /* 1 if this giv might be dead.  In that case,
                                   we won't use it to eliminate a biv, it
                                   would probably lose.  */
  unsigned auto_inc_opt : 1;    /* 1 if this giv had its increment output next
                                   to it to try to form an auto-inc address.  */
  unsigned shared : 1;
  unsigned no_const_addval : 1; /* 1 if add_val does not contain a const.  */
  int lifetime;                 /* Length of life of this giv */
  rtx derive_adjustment;        /* If nonzero, is an adjustment to be
                                   subtracted from add_val when this giv
                                   derives another.  This occurs when the
                                   giv spans a biv update by incrementation.  */
  rtx ext_dependent;            /* If nonzero, is a sign or zero extension
                                   of a biv on which this giv is dependent.  */
  struct induction *next_iv;    /* For givs, links together all givs that are
                                   based on the same biv.  For bivs, links
                                   together all biv entries that refer to the
                                   same biv register.  */
  struct induction *same;       /* For givs, if the giv has been combined with
                                   another giv, this points to the base giv.
                                   The base giv will have COMBINED_WITH nonzero.
                                   For bivs, if the biv has the same LOCATION
                                   as another biv, this points to the base
                                   biv.  */
  struct induction *same_insn;  /* If there are multiple identical givs in
                                   the same insn, then all but one have this
                                   field set, and they all point to the giv
                                   that doesn't have this field set.  */
  rtx last_use;                 /* For a giv made from a biv increment, this is
                                   a substitute for the lifetime information.  */
};
/* A `struct iv_class' is created for each biv.  */

struct iv_class
{
  unsigned int regno;           /* Pseudo reg which is the biv.  */
  int biv_count;                /* Number of insns setting this reg.  */
  struct induction *biv;        /* List of all insns that set this reg.  */
  int giv_count;                /* Number of DEST_REG givs computed from this
                                   biv.  The resulting count is only used in
                                   check_dbra_loop.  */
  struct induction *giv;        /* List of all insns that compute a giv
                                   from this reg.  */
  int total_benefit;            /* Sum of BENEFITs of all those givs.  */
  rtx initial_value;            /* Value of reg at loop start.  */
  rtx initial_test;             /* Test performed on BIV before loop.  */
  rtx final_value;              /* Value of reg at loop end, if known.  */
  struct iv_class *next;        /* Links all class structures together.  */
  rtx init_insn;                /* insn which initializes biv, 0 if none.  */
  rtx init_set;                 /* SET of INIT_INSN, if any.  */
  unsigned incremented : 1;     /* 1 if somewhere incremented/decremented */
  unsigned eliminable : 1;      /* 1 if plausible candidate for
                                   elimination.  */
  unsigned nonneg : 1;          /* 1 if we added a REG_NONNEG note for
                                   this.  */
  unsigned reversed : 1;        /* 1 if we reversed the loop that this
                                   biv controls.  */
  unsigned all_reduced : 1;     /* 1 if all givs using this biv have
                                   been reduced.  */
};
/* Definitions used by the basic induction variable discovery code.  */
enum iv_mode
{
  UNKNOWN_INDUCT,
  BASIC_INDUCT,
  NOT_BASIC_INDUCT,
  GENERAL_INDUCT
};
/* A `struct iv' is created for every register.  */

struct iv
{
  enum iv_mode type;
  union
  {
    struct iv_class *class;
    struct induction *info;
  } iv;
};
#define REG_IV_TYPE(ivs, n) ivs->regs[n].type
#define REG_IV_INFO(ivs, n) ivs->regs[n].iv.info
#define REG_IV_CLASS(ivs, n) ivs->regs[n].iv.class
struct loop_ivs
{
  /* Indexed by register number, contains pointer to `struct
     iv' if register is an induction variable.  */
  struct iv *regs;

  /* Size of regs array.  */
  unsigned int n_regs;

  /* The head of a list which links together (via the next field)
     every iv class for the current loop.  */
  struct iv_class *list;
};
typedef struct loop_mem_info
{
  rtx mem;                      /* The MEM itself.  */
  rtx reg;                      /* Corresponding pseudo, if any.  */
  int optimize;                 /* Nonzero if we can optimize access to this MEM.  */
} loop_mem_info;
struct loop_reg
{
  /* Number of times the reg is set during the loop being scanned.
     During code motion, a negative value indicates a reg that has
     been made a candidate; in particular -2 means that it is a
     candidate that we know is equal to a constant and -1 means that
     it is a candidate not known equal to a constant.  After code
     motion, regs moved have 0 (which is accurate now) while the
     failed candidates have the original number of times set.

     Therefore, at all times, == 0 indicates an invariant register;
     < 0 a conditionally invariant one.  */
  int set_in_loop;

  /* Original value of set_in_loop; same except that this value
     is not set negative for a reg whose sets have been made candidates
     and not set to 0 for a reg that is moved.  */
  int n_times_set;

  /* Contains the insn in which a register was used if it was used
     exactly once; contains const0_rtx if it was used more than once.  */
  rtx single_usage;

  /* Nonzero indicates that the register cannot be moved or strength
     reduced.  */
  char may_not_optimize;

  /* Nonzero means reg N has already been moved out of one loop.
     This reduces the desire to move it out of another.  */
  char moved_once;
};
struct loop_regs
{
  int num;                      /* Number of regs used in table.  */
  int size;                     /* Size of table.  */
  struct loop_reg *array;       /* Register usage info array.  */
  int multiple_uses;            /* Nonzero if a reg has multiple uses.  */
};
struct loop_movables
{
  /* Head of movable chain.  */
  struct movable *head;
  /* Last movable in chain.  */
  struct movable *last;
};
/* Information pertaining to a loop.  */

struct loop_info
{
  /* Nonzero if there is a subroutine call in the current loop.  */
  int has_call;
  /* Nonzero if there is a libcall in the current loop.  */
  int has_libcall;
  /* Nonzero if there is a non-constant call in the current loop.  */
  int has_nonconst_call;
  /* Nonzero if there is a prefetch instruction in the current loop.  */
  int has_prefetch;
  /* Nonzero if there is a volatile memory reference in the current
     loop.  */
  int has_volatile;
  /* Nonzero if there is a tablejump in the current loop.  */
  int has_tablejump;
  /* Nonzero if there are ways to leave the loop other than falling
     off the end.  */
  int has_multiple_exit_targets;
  /* Nonzero if there is an indirect jump in the current function.  */
  int has_indirect_jump;
  /* Register or constant initial loop value.  */
  rtx initial_value;
  /* Register or constant value used for comparison test.  */
  rtx comparison_value;
  /* Register or constant approximate final value.  */
  rtx final_value;
  /* Register or constant initial loop value with term common to
     final_value removed.  */
  rtx initial_equiv_value;
  /* Register or constant final loop value with term common to
     initial_value removed.  */
  rtx final_equiv_value;
  /* Register corresponding to iteration variable.  */
  rtx iteration_var;
  /* Constant loop increment.  */
  rtx increment;
  enum rtx_code comparison_code;
  /* Holds the number of loop iterations.  It is zero if the number
     could not be calculated.  Must be unsigned since the number of
     iterations can be as high as 2^wordsize - 1.  For loops with a
     wider iterator, this number will be zero if the number of loop
     iterations is too large for an unsigned integer to hold.  */
  unsigned HOST_WIDE_INT n_iterations;
  int used_count_register;
  /* The loop iterator induction variable.  */
  struct iv_class *iv;
  /* List of MEMs that are stored in this loop.  */
  rtx store_mems;
  /* Array of MEMs that are used (read or written) in this loop, but
     cannot be aliased by anything in this loop, except perhaps
     themselves.  In other words, if mems[i] is altered during
     the loop, it is altered by an expression that is rtx_equal_p to
     it.  */
  loop_mem_info *mems;
  /* The index of the next available slot in MEMS.  */
  int mems_idx;
  /* The number of elements allocated in MEMS.  */
  int mems_allocated;
  /* Nonzero if we don't know what MEMs were changed in the current
     loop.  This happens if the loop contains a call (in which case
     `has_call' will also be set) or if we store into more than
     NUM_STORES MEMs.  */
  int unknown_address_altered;
  /* The above doesn't count any readonly memory locations that are
     stored.  This does.  */
  int unknown_constant_address_altered;
  /* Count of memory write instructions discovered in the loop.  */
  int num_mem_sets;
  /* The insn where the first of these was found.  */
  rtx first_loop_store_insn;
  /* The chain of movable insns in loop.  */
  struct loop_movables movables;
  /* The registers used in the loop.  */
  struct loop_regs regs;
  /* The induction variable information in loop.  */
  struct loop_ivs ivs;
  /* Nonzero if call is in pre_header extended basic block.  */
  int pre_header_has_call;
};
/* Not really meaningful values, but at least something.  */
#ifndef SIMULTANEOUS_PREFETCHES
#define SIMULTANEOUS_PREFETCHES 3
#endif
#ifndef PREFETCH_BLOCK
#define PREFETCH_BLOCK 32
#endif
#ifndef HAVE_prefetch
#define HAVE_prefetch 0
#define CODE_FOR_prefetch 0
#define gen_prefetch(a,b,c) (abort(), NULL_RTX)
#endif
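
/* The gen_prefetch stub above is never supposed to be reached; it exists
   only so that this file compiles on targets without a prefetch
   instruction, and aborts if it is ever called.  */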
/* Give up the prefetch optimizations once we exceed a given threshold.
   It is unlikely that we would be able to optimize something in a loop
   with so many detected prefetches.  */
#define MAX_PREFETCHES 100
/* The number of prefetch blocks that are beneficial to fetch at once before
   a loop with a known (and low) iteration count.  */
#define PREFETCH_BLOCKS_BEFORE_LOOP_MAX 6
/* For very tiny loops it is not worthwhile to prefetch even before the loop,
   since it is likely that the data are already in the cache.  */
#define PREFETCH_BLOCKS_BEFORE_LOOP_MIN 2

/* Parameterize some prefetch heuristics so they can be turned on and off
   easily for performance testing on new architectures.  These can be
   defined in target-dependent files.  */

/* Prefetch is worthwhile only when loads/stores are dense.  */
#ifndef PREFETCH_ONLY_DENSE_MEM
#define PREFETCH_ONLY_DENSE_MEM 1
#endif

/* Define what we mean by "dense" loads and stores; this value divided by 256
   is the minimum fraction of memory references that are worth prefetching.  */
#ifndef PREFETCH_DENSE_MEM
#define PREFETCH_DENSE_MEM 220
#endif

/* Do not prefetch for a loop whose iteration count is known to be low.  */
#ifndef PREFETCH_NO_LOW_LOOPCNT
#define PREFETCH_NO_LOW_LOOPCNT 1
#endif

/* Define what we mean by a "low" iteration count.  */
#ifndef PREFETCH_LOW_LOOPCNT
#define PREFETCH_LOW_LOOPCNT 32
#endif

/* Do not prefetch for a loop that contains a function call; such a loop is
   probably not an internal loop.  */
#ifndef PREFETCH_NO_CALL
#define PREFETCH_NO_CALL 1
#endif

/* Do not prefetch accesses with an extreme stride.  */
#ifndef PREFETCH_NO_EXTREME_STRIDE
#define PREFETCH_NO_EXTREME_STRIDE 1
#endif

/* Define what we mean by an "extreme" stride.  */
#ifndef PREFETCH_EXTREME_STRIDE
#define PREFETCH_EXTREME_STRIDE 4096
#endif

/* Define a limit to how far apart indices can be and still be merged
   into a single prefetch.  */
#ifndef PREFETCH_EXTREME_DIFFERENCE
#define PREFETCH_EXTREME_DIFFERENCE 4096
#endif

/* Issue prefetch instructions before the loop to fetch data to be used
   in the first few loop iterations.  */
#ifndef PREFETCH_BEFORE_LOOP
#define PREFETCH_BEFORE_LOOP 1
#endif

/* Do not handle reversed order prefetches (negative stride).  */
#ifndef PREFETCH_NO_REVERSE_ORDER
#define PREFETCH_NO_REVERSE_ORDER 1
#endif

/* Prefetch even if the GIV is in conditional code.  */
#ifndef PREFETCH_CONDITIONAL
#define PREFETCH_CONDITIONAL 1
#endif
#define LOOP_REG_LIFETIME(LOOP, REGNO) \
  ((REGNO_LAST_LUID (REGNO) - REGNO_FIRST_LUID (REGNO)))

#define LOOP_REG_GLOBAL_P(LOOP, REGNO) \
  ((REGNO_LAST_LUID (REGNO) > INSN_LUID ((LOOP)->end) \
    || REGNO_FIRST_LUID (REGNO) < INSN_LUID ((LOOP)->start)))

#define LOOP_REGNO_NREGS(REGNO, SET_DEST) \
  ((REGNO) < FIRST_PSEUDO_REGISTER \
   ? (int) hard_regno_nregs[(REGNO)][GET_MODE (SET_DEST)] : 1)
/* Vector mapping INSN_UIDs to luids.
   The luids are like uids but increase monotonically always.
   We use them to see whether a jump comes from outside a given loop.  */

static int *uid_luid;

/* Indexed by INSN_UID, contains the ordinal giving the (innermost) loop
   number the insn is contained in.  */

static struct loop **uid_loop;

/* 1 + largest uid of any insn.  */

static int max_uid_for_loop;

/* Number of loops detected in current function.  Used as index to the
   next few tables.  */

static int max_loop_num;

/* Bound on pseudo register number before loop optimization.
   A pseudo has valid regscan info if its number is < max_reg_before_loop.  */
static unsigned int max_reg_before_loop;

/* The value to pass to the next call of reg_scan_update.  */
static int loop_max_reg;
/* During the analysis of a loop, a chain of `struct movable's
   is made to record all the movable insns found.
   Then the entire chain can be scanned to decide which to move.  */

struct movable
{
  rtx insn;                     /* A movable insn */
  rtx set_src;                  /* The expression this reg is set from.  */
  rtx set_dest;                 /* The destination of this SET.  */
  rtx dependencies;             /* When INSN is libcall, this is an EXPR_LIST
                                   of any registers used within the LIBCALL.  */
  int consec;                   /* Number of consecutive following insns
                                   that must be moved with this one.  */
  unsigned int regno;           /* The register it sets */
  short lifetime;               /* lifetime of that register;
                                   may be adjusted when matching movables
                                   that load the same value are found.  */
  short savings;                /* Number of insns we can move for this reg,
                                   including other movables that force this
                                   or match this one.  */
  ENUM_BITFIELD(machine_mode) savemode : 8; /* Nonzero means it is a mode for
                                   a low part that we should avoid changing when
                                   clearing the rest of the reg.  */
  unsigned int cond : 1;        /* 1 if only conditionally movable */
  unsigned int force : 1;       /* 1 means MUST move this insn */
  unsigned int global : 1;      /* 1 means reg is live outside this loop */
                                /* If PARTIAL is 1, GLOBAL means something different:
                                   that the reg is live outside the range from where it is set
                                   to the following label.  */
  unsigned int done : 1;        /* 1 inhibits further processing of this */

  unsigned int partial : 1;     /* 1 means this reg is used for zero-extending.
                                   In particular, moving it does not make it
                                   invariant.  */
  unsigned int move_insn : 1;   /* 1 means that we call emit_move_insn to
                                   load SRC, rather than copying INSN.  */
  unsigned int move_insn_first:1;/* Same as above, if this is necessary for the
                                    first insn of a consecutive sets group.  */
  unsigned int is_equiv : 1;    /* 1 means a REG_EQUIV is present on INSN.  */
  unsigned int insert_temp : 1; /* 1 means we copy to a new pseudo and replace
                                   the original insn with a copy from that
                                   pseudo, rather than deleting it.  */
  struct movable *match;        /* First entry for same value */
  struct movable *forces;       /* An insn that must be moved if this is */
  struct movable *next;
};
static FILE *loop_dump_stream;

/* Forward declarations.  */

static void invalidate_loops_containing_label (rtx);
static void find_and_verify_loops (rtx, struct loops *);
static void mark_loop_jump (rtx, struct loop *);
static void prescan_loop (struct loop *);
static int reg_in_basic_block_p (rtx, rtx);
static int consec_sets_invariant_p (const struct loop *, rtx, int, rtx);
static int labels_in_range_p (rtx, int);
static void count_one_set (struct loop_regs *, rtx, rtx, rtx *);
static void note_addr_stored (rtx, rtx, void *);
static void note_set_pseudo_multiple_uses (rtx, rtx, void *);
static int loop_reg_used_before_p (const struct loop *, rtx, rtx);
static rtx find_regs_nested (rtx, rtx);
static void scan_loop (struct loop*, int);
#if 0
static void replace_call_address (rtx, rtx, rtx);
#endif
static rtx skip_consec_insns (rtx, int);
static int libcall_benefit (rtx);
static rtx libcall_other_reg (rtx, rtx);
static void record_excess_regs (rtx, rtx, rtx *);
static void ignore_some_movables (struct loop_movables *);
static void force_movables (struct loop_movables *);
static void combine_movables (struct loop_movables *, struct loop_regs *);
static int num_unmoved_movables (const struct loop *);
static int regs_match_p (rtx, rtx, struct loop_movables *);
static int rtx_equal_for_loop_p (rtx, rtx, struct loop_movables *,
                                 struct loop_regs *);
static void add_label_notes (rtx, rtx);
static void move_movables (struct loop *loop, struct loop_movables *, int,
                           int);
static void loop_movables_add (struct loop_movables *, struct movable *);
static void loop_movables_free (struct loop_movables *);
static int count_nonfixed_reads (const struct loop *, rtx);
static void loop_bivs_find (struct loop *);
static void loop_bivs_init_find (struct loop *);
static void loop_bivs_check (struct loop *);
static void loop_givs_find (struct loop *);
static void loop_givs_check (struct loop *);
static int loop_biv_eliminable_p (struct loop *, struct iv_class *, int, int);
static int loop_giv_reduce_benefit (struct loop *, struct iv_class *,
                                    struct induction *, rtx);
static void loop_givs_dead_check (struct loop *, struct iv_class *);
static void loop_givs_reduce (struct loop *, struct iv_class *);
static void loop_givs_rescan (struct loop *, struct iv_class *, rtx *);
static void loop_ivs_free (struct loop *);
static void strength_reduce (struct loop *, int);
static void find_single_use_in_loop (struct loop_regs *, rtx, rtx);
static int valid_initial_value_p (rtx, rtx, int, rtx);
static void find_mem_givs (const struct loop *, rtx, rtx, int, int);
static void record_biv (struct loop *, struct induction *, rtx, rtx, rtx,
                        rtx, rtx *, int, int);
static void check_final_value (const struct loop *, struct induction *);
static void loop_ivs_dump (const struct loop *, FILE *, int);
static void loop_iv_class_dump (const struct iv_class *, FILE *, int);
static void loop_biv_dump (const struct induction *, FILE *, int);
static void loop_giv_dump (const struct induction *, FILE *, int);
static void record_giv (const struct loop *, struct induction *, rtx, rtx,
                        rtx, rtx, rtx, rtx, int, enum g_types, int, int,
                        rtx *);
static void update_giv_derive (const struct loop *, rtx);
static HOST_WIDE_INT get_monotonic_increment (struct iv_class *);
static bool biased_biv_fits_mode_p (const struct loop *, struct iv_class *,
                                    HOST_WIDE_INT, enum machine_mode,
                                    unsigned HOST_WIDE_INT);
static bool biv_fits_mode_p (const struct loop *, struct iv_class *,
                             HOST_WIDE_INT, enum machine_mode, bool);
static bool extension_within_bounds_p (const struct loop *, struct iv_class *,
                                       HOST_WIDE_INT, rtx);
static void check_ext_dependent_givs (const struct loop *, struct iv_class *);
static int basic_induction_var (const struct loop *, rtx, enum machine_mode,
                                rtx, rtx, rtx *, rtx *, rtx **);
static rtx simplify_giv_expr (const struct loop *, rtx, rtx *, int *);
static int general_induction_var (const struct loop *loop, rtx, rtx *, rtx *,
                                  rtx *, rtx *, int, int *, enum machine_mode);
static int consec_sets_giv (const struct loop *, int, rtx, rtx, rtx, rtx *,
                            rtx *, rtx *, rtx *);
static int check_dbra_loop (struct loop *, int);
static rtx express_from_1 (rtx, rtx, rtx);
static rtx combine_givs_p (struct induction *, struct induction *);
static int cmp_combine_givs_stats (const void *, const void *);
static void combine_givs (struct loop_regs *, struct iv_class *);
static int product_cheap_p (rtx, rtx);
static int maybe_eliminate_biv (const struct loop *, struct iv_class *, int,
                                int, int);
static int maybe_eliminate_biv_1 (const struct loop *, rtx, rtx,
                                  struct iv_class *, int, basic_block, rtx);
static int last_use_this_basic_block (rtx, rtx);
static void record_initial (rtx, rtx, void *);
static void update_reg_last_use (rtx, rtx);
static rtx next_insn_in_loop (const struct loop *, rtx);
static void loop_regs_scan (const struct loop *, int);
static int count_insns_in_loop (const struct loop *);
static int find_mem_in_note_1 (rtx *, void *);
static rtx find_mem_in_note (rtx);
static void load_mems (const struct loop *);
static int insert_loop_mem (rtx *, void *);
static int replace_loop_mem (rtx *, void *);
static void replace_loop_mems (rtx, rtx, rtx, int);
static int replace_loop_reg (rtx *, void *);
static void replace_loop_regs (rtx insn, rtx, rtx);
static void note_reg_stored (rtx, rtx, void *);
static void try_copy_prop (const struct loop *, rtx, unsigned int);
static void try_swap_copy_prop (const struct loop *, rtx, unsigned int);
static rtx check_insn_for_givs (struct loop *, rtx, int, int);
static rtx check_insn_for_bivs (struct loop *, rtx, int, int);
static rtx gen_add_mult (rtx, rtx, rtx, rtx);
static void loop_regs_update (const struct loop *, rtx);
static int iv_add_mult_cost (rtx, rtx, rtx, rtx);
static int loop_invariant_p (const struct loop *, rtx);
static rtx loop_insn_hoist (const struct loop *, rtx);
static void loop_iv_add_mult_emit_before (const struct loop *, rtx, rtx, rtx,
                                          rtx, basic_block, rtx);
static rtx loop_insn_emit_before (const struct loop *, basic_block,
                                  rtx, rtx);
static int loop_insn_first_p (rtx, rtx);
static rtx get_condition_for_loop (const struct loop *, rtx);
static void loop_iv_add_mult_sink (const struct loop *, rtx, rtx, rtx, rtx);
static void loop_iv_add_mult_hoist (const struct loop *, rtx, rtx, rtx, rtx);
static rtx extend_value_for_giv (struct induction *, rtx);
static rtx loop_insn_sink (const struct loop *, rtx);

static rtx loop_insn_emit_after (const struct loop *, basic_block, rtx, rtx);
static rtx loop_call_insn_emit_before (const struct loop *, basic_block,
                                       rtx, rtx);
static rtx loop_call_insn_hoist (const struct loop *, rtx);
static rtx loop_insn_sink_or_swim (const struct loop *, rtx);

static void loop_dump_aux (const struct loop *, FILE *, int);
static void loop_delete_insns (rtx, rtx);
static HOST_WIDE_INT remove_constant_addition (rtx *);
static rtx gen_load_of_final_value (rtx, rtx);
void debug_ivs (const struct loop *);
void debug_iv_class (const struct iv_class *);
void debug_biv (const struct induction *);
void debug_giv (const struct induction *);
void debug_loop (const struct loop *);
void debug_loops (const struct loops *);
typedef struct loop_replace_args
{
  rtx match;
  rtx replacement;
  rtx insn;
} loop_replace_args;
/* Nonzero iff INSN is between START and END, inclusive.  */
#define INSN_IN_RANGE_P(INSN, START, END) \
  (INSN_UID (INSN) < max_uid_for_loop \
   && INSN_LUID (INSN) >= INSN_LUID (START) \
   && INSN_LUID (INSN) <= INSN_LUID (END))
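
/* The INSN_UID bound must be checked first: INSN_LUID would trip its
   gcc_assert on an insn created during loop optimization, so such insns
   are simply treated as out of range here.  */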
/* Indirect_jump_in_function is computed once per function.  */
static int indirect_jump_in_function;
static int indirect_jump_in_function_p (rtx);

static int compute_luids (rtx, rtx, int);

static int biv_elimination_giv_has_0_offset (struct induction *,
                                             struct induction *, rtx);

/* Benefit penalty, if a giv is not replaceable, i.e. must emit an insn to
   copy the value of the strength reduced giv to its original register.  */
static int copy_cost;

/* Cost of using a register, to normalize the benefits of a giv.  */
static int reg_address_cost;
void
init_loop (void)
{
  rtx reg = gen_rtx_REG (word_mode, LAST_VIRTUAL_REGISTER + 1);

  reg_address_cost = address_cost (reg, SImode);

  copy_cost = COSTS_N_INSNS (1);
}
/* Compute the mapping from uids to luids.
   LUIDs are numbers assigned to insns, like uids,
   except that luids increase monotonically through the code.
   Start at insn START and stop just before END.  Assign LUIDs
   starting with PREV_LUID + 1.  Return the last assigned LUID + 1.  */
static int
compute_luids (rtx start, rtx end, int prev_luid)
{
  int i;
  rtx insn;

  for (insn = start, i = prev_luid; insn != end; insn = NEXT_INSN (insn))
    {
      if (INSN_UID (insn) >= max_uid_for_loop)
        continue;
      /* Don't assign luids to line-number NOTEs, so that the distance in
         luids between two insns is not affected by -g.  */
      if (!NOTE_P (insn)
          || NOTE_LINE_NUMBER (insn) <= 0)
        uid_luid[INSN_UID (insn)] = ++i;
      else
        /* Give a line number note the same luid as preceding insn.  */
        uid_luid[INSN_UID (insn)] = i;
    }

  return i + 1;
}
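
/* For example, if START heads a stream of insns with uids 7, 3 and 12,
   they receive luids PREV_LUID + 1, PREV_LUID + 2 and PREV_LUID + 3:
   luids increase in insn-stream order even though uids need not.  */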
/* Entry point of this file.  Perform loop optimization
   on the current function.  F is the first insn of the function
   and DUMPFILE is a stream for output of a trace of actions taken
   (or 0 if none should be output).  */

void
loop_optimize (rtx f, FILE *dumpfile, int flags)
{
  rtx insn;
  int i;
  struct loops loops_data;
  struct loops *loops = &loops_data;
  struct loop_info *loops_info;

  loop_dump_stream = dumpfile;

  init_recog_no_volatile ();

  max_reg_before_loop = max_reg_num ();
  loop_max_reg = max_reg_before_loop;

  regs_may_share = 0;

  /* Count the number of loops.  */

  max_loop_num = 0;
  for (insn = f; insn; insn = NEXT_INSN (insn))
    {
      if (NOTE_P (insn)
          && NOTE_LINE_NUMBER (insn) == NOTE_INSN_LOOP_BEG)
        max_loop_num++;
    }

  /* Don't waste time if no loops.  */
  if (max_loop_num == 0)
    return;

  loops->num = max_loop_num;

  /* Get size to use for tables indexed by uids.
     Leave some space for labels allocated by find_and_verify_loops.  */
  max_uid_for_loop = get_max_uid () + 1 + max_loop_num * 32;

  uid_luid = xcalloc (max_uid_for_loop, sizeof (int));
  uid_loop = xcalloc (max_uid_for_loop, sizeof (struct loop *));

  /* Allocate storage for array of loops.  */
  loops->array = xcalloc (loops->num, sizeof (struct loop));

  /* Find and process each loop.
     First, find them, and record them in order of their beginnings.  */
  find_and_verify_loops (f, loops);

  /* Allocate and initialize auxiliary loop information.  */
  loops_info = xcalloc (loops->num, sizeof (struct loop_info));
  for (i = 0; i < (int) loops->num; i++)
    loops->array[i].aux = loops_info + i;

  /* Now find all register lifetimes.  This must be done after
     find_and_verify_loops, because it might reorder the insns in the
     function.  */
  reg_scan (f, max_reg_before_loop);

  /* This must occur after reg_scan so that registers created by gcse
     will have entries in the register tables.

     We could have added a call to reg_scan after gcse_main in toplev.c,
     but moving this call to init_alias_analysis is more efficient.  */
  init_alias_analysis ();

  /* See if we went too far.  Note that get_max_uid already returns
     one more than the maximum uid of all insns.  */
  gcc_assert (get_max_uid () <= max_uid_for_loop);
  /* Now reset it to the actual size we need.  See above.  */
  max_uid_for_loop = get_max_uid ();

  /* find_and_verify_loops has already called compute_luids, but it
     might have rearranged code afterwards, so we need to recompute
     the luids now.  */
  compute_luids (f, NULL_RTX, 0);

  /* Don't leave gaps in uid_luid for insns that have been
     deleted.  It is possible that the first or last insn
     using some register has been deleted by cross-jumping.
     Make sure that uid_luid for that former insn's uid
     points to the general area where that insn used to be.  */
  for (i = 0; i < max_uid_for_loop; i++)
    {
      uid_luid[0] = uid_luid[i];
      if (uid_luid[0] != 0)
        break;
    }
  for (i = 0; i < max_uid_for_loop; i++)
    if (uid_luid[i] == 0)
      uid_luid[i] = uid_luid[i - 1];

  /* Determine if the function has indirect jump.  On some systems
     this prevents low overhead loop instructions from being used.  */
  indirect_jump_in_function = indirect_jump_in_function_p (f);

  /* Now scan the loops, last ones first, since this means inner ones are done
     before outer ones.  */
  for (i = max_loop_num - 1; i >= 0; i--)
    {
      struct loop *loop = &loops->array[i];

      if (! loop->invalid && loop->end)
        {
          scan_loop (loop, flags);
          ggc_collect ();
        }
    }

  end_alias_analysis ();

  /* Clean up.  */
  for (i = 0; i < (int) loops->num; i++)
    free (loops_info[i].mems);

  free (uid_luid);
  free (uid_loop);
  free (loops_info);
  free (loops->array);
}
/* Returns the next insn, in execution order, after INSN.  START and
   END are the NOTE_INSN_LOOP_BEG and NOTE_INSN_LOOP_END for the loop,
   respectively.  LOOP->TOP, if non-NULL, is the top of the loop in the
   insn-stream; it is used with loops that are entered near the
   bottom.  */

static rtx
next_insn_in_loop (const struct loop *loop, rtx insn)
{
  insn = NEXT_INSN (insn);

  if (insn == loop->end)
    {
      if (loop->top)
        /* Go to the top of the loop, and continue there.  */
        insn = loop->top;
      else
        /* We're done.  */
        insn = NULL_RTX;
    }

  if (insn == loop->scan_start)
    /* We're done.  */
    insn = NULL_RTX;

  return insn;
}
/* Find any register references hidden inside X and add them to
   the dependency list DEPS.  This is used to look inside CLOBBER (MEM
   when checking whether a PARALLEL can be pulled out of a loop.  */

static rtx
find_regs_nested (rtx deps, rtx x)
{
  enum rtx_code code = GET_CODE (x);
  if (code == REG)
    deps = gen_rtx_EXPR_LIST (VOIDmode, x, deps);
  else
    {
      const char *fmt = GET_RTX_FORMAT (code);
      int i, j;
      for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
        {
          if (fmt[i] == 'e')
            deps = find_regs_nested (deps, XEXP (x, i));
          else if (fmt[i] == 'E')
            for (j = 0; j < XVECLEN (x, i); j++)
              deps = find_regs_nested (deps, XVECEXP (x, i, j));
        }
    }
  return deps;
}
/* Optimize one loop described by LOOP.  */

/* ??? Could also move memory writes out of loops if the destination address
   is invariant, the source is invariant, the memory write is not volatile,
   and if we can prove that no read inside the loop can read this address
   before the write occurs.  If there is a read of this address after the
   write, then we can also mark the memory read as invariant.  */

static void
scan_loop (struct loop *loop, int flags)
{
  struct loop_info *loop_info = LOOP_INFO (loop);
  struct loop_regs *regs = LOOP_REGS (loop);
  int i;
  rtx loop_start = loop->start;
  rtx loop_end = loop->end;
  rtx p;
  /* 1 if we are scanning insns that could be executed zero times.  */
  int maybe_never = 0;
  /* 1 if we are scanning insns that might never be executed
     due to a subroutine call which might exit before they are reached.  */
  int call_passed = 0;
  /* Number of insns in the loop.  */
  int insn_count;
  int tem;
  rtx temp, update_start, update_end;
  /* The SET from an insn, if it is the only SET in the insn.  */
  rtx set, set1;
  /* Chain describing insns movable in current loop.  */
  struct loop_movables *movables = LOOP_MOVABLES (loop);
  /* Ratio of extra register life span we can justify
     for saving an instruction.  More if loop doesn't call subroutines
     since in that case saving an insn makes more difference
     and more registers are available.  */
  int threshold;
  int in_libcall;

  loop->top = 0;

  movables->head = 0;
  movables->last = 0;

  /* Determine whether this loop starts with a jump down to a test at
     the end.  This will occur for a small number of loops with a test
     that is too complex to duplicate in front of the loop.

     We search for the first insn or label in the loop, skipping NOTEs.
     However, we must be careful not to skip past a NOTE_INSN_LOOP_BEG
     (because we might have a loop executed only once that contains a
     loop which starts with a jump to its exit test) or a NOTE_INSN_LOOP_END
     (in case we have a degenerate loop).

     Note that if we mistakenly think that a loop is entered at the top
     when, in fact, it is entered at the exit test, the only effect will be
     slightly poorer optimization.  Making the opposite error can generate
     incorrect code.  Since very few loops now start with a jump to the
     exit test, the code here to detect that case is very conservative.  */

  for (p = NEXT_INSN (loop_start);
       p != loop_end
         && !LABEL_P (p) && ! INSN_P (p)
         && (!NOTE_P (p)
             || (NOTE_LINE_NUMBER (p) != NOTE_INSN_LOOP_BEG
                 && NOTE_LINE_NUMBER (p) != NOTE_INSN_LOOP_END));
       p = NEXT_INSN (p))
    ;

  loop->scan_start = p;
  /* If loop end is the end of the current function, then emit a
     NOTE_INSN_DELETED after loop_end and set loop->sink to the dummy
     note insn.  This is the position we use when sinking insns out of
     the loop.  */
  if (NEXT_INSN (loop->end) != 0)
    loop->sink = NEXT_INSN (loop->end);
  else
    loop->sink = emit_note_after (NOTE_INSN_DELETED, loop->end);

  /* Set up variables describing this loop.  */
  prescan_loop (loop);
  threshold = (loop_info->has_call ? 1 : 2) * (1 + n_non_fixed_regs);

  /* If loop has a jump before the first label,
     the true entry is the target of that jump.
     Start scan from there.
     But record in LOOP->TOP the place where the end-test jumps
     back to so we can scan that after the end of the loop.  */
  if (JUMP_P (p)
      /* Loop entry must be unconditional jump (and not a RETURN)  */
      && any_uncondjump_p (p)
      && JUMP_LABEL (p) != 0
      /* Check to see whether the jump actually
         jumps out of the loop (meaning it's no loop).
         This case can happen for things like
         do {..} while (0).  If this label was generated previously
         by loop, we can't tell anything about it and have to reject
         the loop.  */
      && INSN_IN_RANGE_P (JUMP_LABEL (p), loop_start, loop_end))
    {
      loop->top = next_label (loop->scan_start);
      loop->scan_start = JUMP_LABEL (p);
    }

  /* If LOOP->SCAN_START was an insn created by loop, we don't know its luid
     as required by loop_reg_used_before_p.  So skip such loops.  (This
     test may never be true, but it's best to play it safe.)

     Also, skip loops where we do not start scanning at a label.  This
     test also rejects loops starting with a JUMP_INSN that failed the
     test above.  */

  if (INSN_UID (loop->scan_start) >= max_uid_for_loop
      || !LABEL_P (loop->scan_start))
    {
      if (loop_dump_stream)
        fprintf (loop_dump_stream, "\nLoop from %d to %d is phony.\n\n",
                 INSN_UID (loop_start), INSN_UID (loop_end));
      return;
    }

  /* Allocate extra space for REGs that might be created by load_mems.
     We allocate a little extra slop as well, in the hopes that we
     won't have to reallocate the regs array.  */
  loop_regs_scan (loop, loop_info->mems_idx + 16);
  insn_count = count_insns_in_loop (loop);

  if (loop_dump_stream)
    fprintf (loop_dump_stream, "\nLoop from %d to %d: %d real insns.\n",
             INSN_UID (loop_start), INSN_UID (loop_end), insn_count);
  /* Scan through the loop finding insns that are safe to move.
     Set REGS->ARRAY[I].SET_IN_LOOP negative for the reg I being set, so that
     this reg will be considered invariant for subsequent insns.
     We consider whether subsequent insns use the reg
     in deciding whether it is worth actually moving.

     MAYBE_NEVER is nonzero if we have passed a conditional jump insn
     and therefore it is possible that the insns we are scanning
     would never be executed.  At such times, we must make sure
     that it is safe to execute the insn once instead of zero times.
     When MAYBE_NEVER is 0, all insns will be executed at least once
     so that is not a problem.  */
  for (in_libcall = 0, p = next_insn_in_loop (loop, loop->scan_start);
       p != NULL_RTX;
       p = next_insn_in_loop (loop, p))
    {
      if (in_libcall && INSN_P (p) && find_reg_note (p, REG_RETVAL, NULL_RTX))
        in_libcall--;
      if (NONJUMP_INSN_P (p))
        {
          /* Do not scan past an optimization barrier.  */
          if (GET_CODE (PATTERN (p)) == ASM_INPUT)
            break;
          temp = find_reg_note (p, REG_LIBCALL, NULL_RTX);
          if (temp)
            in_libcall++;
          if (! in_libcall
              && (set = single_set (p))
              && REG_P (SET_DEST (set))
#ifdef PIC_OFFSET_TABLE_REG_CALL_CLOBBERED
              && SET_DEST (set) != pic_offset_table_rtx
#endif
              && ! regs->array[REGNO (SET_DEST (set))].may_not_optimize)
            {
              int tem1 = 0;
              int tem2 = 0;
              int move_insn = 0;
              int insert_temp = 0;
              rtx src = SET_SRC (set);
              rtx dependencies = 0;

              /* Figure out what to use as a source of this insn.  If a
                 REG_EQUIV note is given or if a REG_EQUAL note with a
                 constant operand is specified, use it as the source and
                 mark that we should move this insn by calling
                 emit_move_insn rather than duplicating the insn.

                 Otherwise, only use the REG_EQUAL contents if a REG_RETVAL
                 note is present.  */
              temp = find_reg_note (p, REG_EQUIV, NULL_RTX);
              if (temp)
                src = XEXP (temp, 0), move_insn = 1;
              else
                {
                  temp = find_reg_note (p, REG_EQUAL, NULL_RTX);
                  if (temp && CONSTANT_P (XEXP (temp, 0)))
                    src = XEXP (temp, 0), move_insn = 1;
                  if (temp && find_reg_note (p, REG_RETVAL, NULL_RTX))
                    {
                      src = XEXP (temp, 0);
                      /* A libcall block can use regs that don't appear in
                         the equivalent expression.  To move the libcall,
                         we must move those regs too.  */
                      dependencies = libcall_other_reg (p, src);
                    }
                }

              /* For parallels, add any possible uses to the dependencies, as
                 we can't move the insn without resolving them first.
                 MEMs inside CLOBBERs may also reference registers; these
                 count as implicit uses.  */
              if (GET_CODE (PATTERN (p)) == PARALLEL)
                {
                  for (i = 0; i < XVECLEN (PATTERN (p), 0); i++)
                    {
                      rtx x = XVECEXP (PATTERN (p), 0, i);
                      if (GET_CODE (x) == USE)
                        dependencies
                          = gen_rtx_EXPR_LIST (VOIDmode, XEXP (x, 0),
                                               dependencies);
                      else if (GET_CODE (x) == CLOBBER
                               && MEM_P (XEXP (x, 0)))
                        dependencies = find_regs_nested (dependencies,
                                                         XEXP (XEXP (x, 0), 0));
                    }
                }

              if (/* The register is used in basic blocks other
                     than the one where it is set (meaning that
                     something after this point in the loop might
                     depend on its value before the set).  */
                  ! reg_in_basic_block_p (p, SET_DEST (set))
                  /* And the set is not guaranteed to be executed once
                     the loop starts, or the value before the set is
                     needed before the set occurs...

                     ??? Note we have quadratic behavior here, mitigated
                     by the fact that the previous test will often fail for
                     large loops.  Rather than re-scanning the entire loop
                     each time for register usage, we should build tables
                     of the register usage and use them here instead.  */
                  && (maybe_never
                      || loop_reg_used_before_p (loop, set, p)))
                /* It is unsafe to move the set.  However, it may be OK to
                   move the source into a new pseudo, and substitute a
                   reg-to-reg copy for the original insn.

                   This code used to consider it OK to move a set of a variable
                   which was not created by the user and not used in an exit
                   test.
                   That behavior is incorrect and was removed.  */
                insert_temp = 1;

              /* Don't try to optimize a MODE_CC set with a constant
                 source.  It probably will be combined with a conditional
                 jump.  */
              if (GET_MODE_CLASS (GET_MODE (SET_DEST (set))) == MODE_CC
                  && CONSTANT_P (src))
                ;
              /* Don't try to optimize a register that was made
                 by loop-optimization for an inner loop.
                 We don't know its life-span, so we can't compute
                 the benefit.  */
              else if (REGNO (SET_DEST (set)) >= max_reg_before_loop)
                ;
              /* Don't move the source and add a reg-to-reg copy:
                 - with -Os (this certainly increases size),
                 - if the mode doesn't support copy operations (obviously),
                 - if the source is already a reg (the motion will gain nothing),
                 - if the source is a legitimate constant (likewise).  */
              else if (insert_temp
                       && (optimize_size
                           || ! can_copy_p (GET_MODE (SET_SRC (set)))
                           || REG_P (SET_SRC (set))
                           || (CONSTANT_P (SET_SRC (set))
                               && LEGITIMATE_CONSTANT_P (SET_SRC (set)))))
                ;
              else if ((tem = loop_invariant_p (loop, src))
                       && (dependencies == 0
                           || (tem2
                               = loop_invariant_p (loop, dependencies)) != 0)
                       && (regs->array[REGNO (SET_DEST (set))].set_in_loop == 1
                           || (tem1
                               = consec_sets_invariant_p
                               (loop, SET_DEST (set),
                                regs->array[REGNO (SET_DEST (set))].set_in_loop,
                                p)))
                       /* If the insn can cause a trap (such as divide by zero),
                          can't move it unless it's guaranteed to be executed
                          once loop is entered.  Even a function call might
                          prevent the trap insn from being reached
                          (since it might exit!)  */
                       && ! ((maybe_never || call_passed)
                             && may_trap_p (src)))
                {
                  struct movable *m;
                  int regno = REGNO (SET_DEST (set));

                  /* A potential lossage is where we have a case where two insns
                     can be combined as long as they are both in the loop, but
                     we move one of them outside the loop.  For large loops,
                     this can lose.  The most common case of this is the address
                     of a function being called.

                     Therefore, if this register is marked as being used
                     exactly once if we are in a loop with calls
                     (a "large loop"), see if we can replace the usage of
                     this register with the source of this SET.  If we can,
                     delete this insn.

                     Don't do this if P has a REG_RETVAL note or if we have
                     SMALL_REGISTER_CLASSES and SET_SRC is a hard register.  */

                  if (loop_info->has_call
                      && regs->array[regno].single_usage != 0
                      && regs->array[regno].single_usage != const0_rtx
                      && REGNO_FIRST_UID (regno) == INSN_UID (p)
                      && (REGNO_LAST_UID (regno)
                          == INSN_UID (regs->array[regno].single_usage))
                      && regs->array[regno].set_in_loop == 1
                      && GET_CODE (SET_SRC (set)) != ASM_OPERANDS
                      && ! side_effects_p (SET_SRC (set))
                      && ! find_reg_note (p, REG_RETVAL, NULL_RTX)
                      && (! SMALL_REGISTER_CLASSES
                          || (! (REG_P (SET_SRC (set))
                                 && (REGNO (SET_SRC (set))
                                     < FIRST_PSEUDO_REGISTER))))
                      && regno >= FIRST_PSEUDO_REGISTER
                      /* This test is not redundant; SET_SRC (set) might be
                         a call-clobbered register and the life of REGNO
                         might span a call.  */
                      && ! modified_between_p (SET_SRC (set), p,
                                               regs->array[regno].single_usage)
                      && no_labels_between_p (p,
                                              regs->array[regno].single_usage)
                      && validate_replace_rtx (SET_DEST (set), SET_SRC (set),
                                               regs->array[regno].single_usage))
                    {
                      /* Replace any usage in a REG_EQUAL note.  Must copy
                         the new source, so that we don't get rtx sharing
                         between the SET_SOURCE and REG_NOTES of insn p.  */
                      REG_NOTES (regs->array[regno].single_usage)
                        = (replace_rtx
                           (REG_NOTES (regs->array[regno].single_usage),
                            SET_DEST (set), copy_rtx (SET_SRC (set))));

                      delete_insn (p);
                      for (i = 0; i < LOOP_REGNO_NREGS (regno, SET_DEST (set));
                           i++)
                        regs->array[regno+i].set_in_loop = 0;
                      continue;
                    }

                  m = xmalloc (sizeof (struct movable));
                  m->next = 0;
                  m->insn = p;
                  m->set_src = src;
                  m->dependencies = dependencies;
                  m->set_dest = SET_DEST (set);
                  m->force = 0;
                  m->consec
                    = regs->array[REGNO (SET_DEST (set))].set_in_loop - 1;
                  m->done = 0;
                  m->forces = 0;
                  m->partial = 0;
                  m->move_insn = move_insn;
                  m->move_insn_first = 0;
                  m->insert_temp = insert_temp;
                  m->is_equiv = (find_reg_note (p, REG_EQUIV, NULL_RTX) != 0);
                  m->savemode = VOIDmode;
                  m->regno = regno;
                  /* Set M->cond if either loop_invariant_p
                     or consec_sets_invariant_p returned 2
                     (only conditionally invariant).  */
                  m->cond = ((tem | tem1 | tem2) > 1);
                  m->global = LOOP_REG_GLOBAL_P (loop, regno);
                  m->match = 0;
                  m->lifetime = LOOP_REG_LIFETIME (loop, regno);
                  m->savings = regs->array[regno].n_times_set;
                  if (find_reg_note (p, REG_RETVAL, NULL_RTX))
                    m->savings += libcall_benefit (p);
                  for (i = 0; i < LOOP_REGNO_NREGS (regno, SET_DEST (set)); i++)
                    regs->array[regno+i].set_in_loop = move_insn ? -2 : -1;
                  /* Add M to the end of the chain MOVABLES.  */
                  loop_movables_add (movables, m);

                  if (m->consec > 0)
                    {
                      /* It is possible for the first instruction to have a
                         REG_EQUAL note but a non-invariant SET_SRC, so we must
                         remember the status of the first instruction in case
                         the last instruction doesn't have a REG_EQUAL note.  */
                      m->move_insn_first = m->move_insn;

                      /* Skip this insn, not checking REG_LIBCALL notes.  */
                      p = next_nonnote_insn (p);
                      /* Skip the consecutive insns, if there are any.  */
                      p = skip_consec_insns (p, m->consec);
                      /* Back up to the last insn of the consecutive group.  */
                      p = prev_nonnote_insn (p);

                      /* We must now reset m->move_insn, m->is_equiv, and
                         possibly m->set_src to correspond to the effects of
                         all the insns.  */
                      temp = find_reg_note (p, REG_EQUIV, NULL_RTX);
                      if (temp)
                        m->set_src = XEXP (temp, 0), m->move_insn = 1;
                      else
                        {
                          temp = find_reg_note (p, REG_EQUAL, NULL_RTX);
                          if (temp && CONSTANT_P (XEXP (temp, 0)))
                            m->set_src = XEXP (temp, 0), m->move_insn = 1;
                          else
                            m->move_insn = 0;
                        }
                      m->is_equiv
                        = (find_reg_note (p, REG_EQUIV, NULL_RTX) != 0);
                    }
                }
              /* If this register is always set within a STRICT_LOW_PART
                 or set to zero, then its high bytes are constant.
                 So clear them outside the loop and within the loop
                 just load the low bytes.
                 We must check that the machine has an instruction to do so.
                 Also, if the value loaded into the register
                 depends on the same register, this cannot be done.  */
              else if (SET_SRC (set) == const0_rtx
                       && NONJUMP_INSN_P (NEXT_INSN (p))
                       && (set1 = single_set (NEXT_INSN (p)))
                       && GET_CODE (set1) == SET
                       && (GET_CODE (SET_DEST (set1)) == STRICT_LOW_PART)
                       && (GET_CODE (XEXP (SET_DEST (set1), 0)) == SUBREG)
                       && (SUBREG_REG (XEXP (SET_DEST (set1), 0))
                           == SET_DEST (set))
                       && !reg_mentioned_p (SET_DEST (set), SET_SRC (set1)))
                {
                  int regno = REGNO (SET_DEST (set));
                  if (regs->array[regno].set_in_loop == 2)
                    {
                      struct movable *m;
                      m = xmalloc (sizeof (struct movable));
                      m->next = 0;
                      m->insn = p;
                      m->set_dest = SET_DEST (set);
                      m->dependencies = 0;
                      m->force = 0;
                      m->consec = 0;
                      m->done = 0;
                      m->forces = 0;
                      m->move_insn = 0;
                      m->move_insn_first = 0;
                      m->insert_temp = insert_temp;
                      m->partial = 1;
                      /* If the insn may not be executed on some cycles,
                         we can't clear the whole reg; clear just high part.
                         Not even if the reg is used only within this loop.
                         Consider this:
                         while (1)
                           while (s != t) {
                             if (foo ()) x = *s;
                             use (x);
                           }
                         Clearing x before the inner loop could clobber a value
                         being saved from the last time around the outer loop.
                         However, if the reg is not used outside this loop
                         and all uses of the register are in the same
                         basic block as the store, there is no problem.

                         If this insn was made by loop, we don't know its
                         INSN_LUID and hence must make a conservative
                         assumption.  */
                      m->global = (INSN_UID (p) >= max_uid_for_loop
                                   || LOOP_REG_GLOBAL_P (loop, regno)
                                   || (labels_in_range_p
                                       (p, REGNO_FIRST_LUID (regno))));
                      if (maybe_never && m->global)
                        m->savemode = GET_MODE (SET_SRC (set1));
                      else
                        m->savemode = VOIDmode;
                      m->regno = regno;
                      m->cond = 0;
                      m->match = 0;
                      m->lifetime = LOOP_REG_LIFETIME (loop, regno);
                      m->savings = 1;
                      for (i = 0;
                           i < LOOP_REGNO_NREGS (regno, SET_DEST (set));
                           i++)
                        regs->array[regno+i].set_in_loop = -1;
                      /* Add M to the end of the chain MOVABLES.  */
                      loop_movables_add (movables, m);
                    }
                }
            }
        }
      /* Past a call insn, we get to insns which might not be executed
         because the call might exit.  This matters for insns that trap.
         Constant and pure call insns always return, so they don't count.  */
      else if (CALL_P (p) && ! CONST_OR_PURE_CALL_P (p))
        call_passed = 1;
      /* Past a label or a jump, we get to insns for which we
         can't count on whether or how many times they will be
         executed during each iteration.  Therefore, we can
         only move out sets of trivial variables
         (those not used after the loop).  */
      /* Similar code appears twice in strength_reduce.  */
      else if ((LABEL_P (p) || JUMP_P (p))
               /* If we enter the loop in the middle, and scan around to the
                  beginning, don't set maybe_never for that.  This must be an
                  unconditional jump, otherwise the code at the top of the
                  loop might never be executed.  Unconditional jumps are
                  followed by a barrier then the loop_end.  */
               && ! (JUMP_P (p) && JUMP_LABEL (p) == loop->top
                     && NEXT_INSN (NEXT_INSN (p)) == loop_end
                     && any_uncondjump_p (p)))
        maybe_never = 1;
    }
  /* If one movable subsumes another, ignore that other.  */

  ignore_some_movables (movables);

  /* For each movable insn, see if the register it loads feeds, at the
     point where it dies, right into another conditionally movable insn.
     If so, record that the second insn "forces" the first one,
     since the second can be moved only if the first is.  */

  force_movables (movables);

  /* See if there are multiple movable insns that load the same value.
     If there are, make all but the first point at the first one
     through the `match' field, and add the priorities of them
     all together as the priority of the first.  */

  combine_movables (movables, regs);
1505 /* Now consider each movable insn to decide whether it is worth moving.
1506 Store 0 in regs->array[I].set_in_loop for each reg I that is moved.
1508 For machines with few registers this increases code size, so do not
1509 move movables when optimizing for code size on such machines.
1510 (The 18 below is the value for i386.) */
1512 if (!optimize_size
1513 || (reg_class_size[GENERAL_REGS] > 18 && !loop_info->has_call))
1515 move_movables (loop, movables, threshold, insn_count);
1517 /* Recalculate regs->array if move_movables has created new
1518 registers. */
1519 if (max_reg_num () > regs->num)
1521 loop_regs_scan (loop, 0);
1522 for (update_start = loop_start;
1523 PREV_INSN (update_start)
1524 && !LABEL_P (PREV_INSN (update_start));
1525 update_start = PREV_INSN (update_start))
1527 update_end = NEXT_INSN (loop_end);
1529 reg_scan_update (update_start, update_end, loop_max_reg);
1530 loop_max_reg = max_reg_num ();
1534 /* Candidates whose set_in_loop counts are still negative were not moved.
1535 Change regs->array[I].set_in_loop to indicate that those are not actually
1536 invariant. */
1537 for (i = 0; i < regs->num; i++)
1538 if (regs->array[i].set_in_loop < 0)
1539 regs->array[i].set_in_loop = regs->array[i].n_times_set;
1541 /* Now that we've moved some things out of the loop, we might be able to
1542 hoist even more memory references. */
1543 load_mems (loop);
1545 /* Recalculate regs->array if load_mems has created new registers. */
1546 if (max_reg_num () > regs->num)
1547 loop_regs_scan (loop, 0);
1549 for (update_start = loop_start;
1550 PREV_INSN (update_start)
1551 && !LABEL_P (PREV_INSN (update_start));
1552 update_start = PREV_INSN (update_start))
1554 update_end = NEXT_INSN (loop_end);
1556 reg_scan_update (update_start, update_end, loop_max_reg);
1557 loop_max_reg = max_reg_num ();
1559 if (flag_strength_reduce)
1561 if (update_end && LABEL_P (update_end))
1562 /* Ensure our label doesn't go away. */
1563 LABEL_NUSES (update_end)++;
1565 strength_reduce (loop, flags);
1567 reg_scan_update (update_start, update_end, loop_max_reg);
1568 loop_max_reg = max_reg_num ();
1570 if (update_end && LABEL_P (update_end)
1571 && --LABEL_NUSES (update_end) == 0)
1572 delete_related_insns (update_end);
1576 /* The movable information was needed above by strength reduction; free it now. */
1577 loop_movables_free (movables);
1579 free (regs->array);
1580 regs->array = 0;
1581 regs->num = 0;
1584 /* Add elements to *OUTPUT to record all the pseudo-regs
1585 mentioned in IN_THIS but not mentioned in NOT_IN_THIS. */
1587 static void
1588 record_excess_regs (rtx in_this, rtx not_in_this, rtx *output)
1590 enum rtx_code code;
1591 const char *fmt;
1592 int i;
1594 code = GET_CODE (in_this);
1596 switch (code)
1598 case PC:
1599 case CC0:
1600 case CONST_INT:
1601 case CONST_DOUBLE:
1602 case CONST:
1603 case SYMBOL_REF:
1604 case LABEL_REF:
1605 return;
1607 case REG:
1608 if (REGNO (in_this) >= FIRST_PSEUDO_REGISTER
1609 && ! reg_mentioned_p (in_this, not_in_this))
1610 *output = gen_rtx_EXPR_LIST (VOIDmode, in_this, *output);
1611 return;
1613 default:
1614 break;
1617 fmt = GET_RTX_FORMAT (code);
1618 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
1620 int j;
1622 switch (fmt[i])
1624 case 'E':
1625 for (j = 0; j < XVECLEN (in_this, i); j++)
1626 record_excess_regs (XVECEXP (in_this, i, j), not_in_this, output);
1627 break;
1629 case 'e':
1630 record_excess_regs (XEXP (in_this, i), not_in_this, output);
1631 break;
1636 /* Check what regs are referred to in the libcall block ending with INSN,
1637 aside from those mentioned in the equivalent value.
1638 If there are none, return 0.
1639 If there are one or more, return an EXPR_LIST containing all of them. */
1641 static rtx
1642 libcall_other_reg (rtx insn, rtx equiv)
1644 rtx note = find_reg_note (insn, REG_RETVAL, NULL_RTX);
1645 rtx p = XEXP (note, 0);
1646 rtx output = 0;
1648 /* First, find all the regs used in the libcall block
1649 that are not mentioned as inputs to the result. */
1651 while (p != insn)
1653 if (INSN_P (p))
1654 record_excess_regs (PATTERN (p), equiv, &output);
1655 p = NEXT_INSN (p);
1658 return output;
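/* Illustrative example (assumed): if a libcall block computes a value
   whose equivalent EQUIV is (mult:SI (reg 100) (reg 101)) but the
   block's insns also use a scratch (reg 102), libcall_other_reg returns
   an EXPR_LIST containing (reg 102), the only pseudo not mentioned in
   EQUIV.  */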
1661 /* Return 1 if all uses of REG
1662 are between INSN and the end of the basic block. */
1664 static int
1665 reg_in_basic_block_p (rtx insn, rtx reg)
1667 int regno = REGNO (reg);
1668 rtx p;
1670 if (REGNO_FIRST_UID (regno) != INSN_UID (insn))
1671 return 0;
1673 /* Search this basic block for the already recorded last use of the reg. */
1674 for (p = insn; p; p = NEXT_INSN (p))
1676 switch (GET_CODE (p))
1678 case NOTE:
1679 break;
1681 case INSN:
1682 case CALL_INSN:
1683 /* Ordinary insn: if this is the last use, we win. */
1684 if (REGNO_LAST_UID (regno) == INSN_UID (p))
1685 return 1;
1686 break;
1688 case JUMP_INSN:
1689 /* Jump insn: if this is the last use, we win. */
1690 if (REGNO_LAST_UID (regno) == INSN_UID (p))
1691 return 1;
1692 /* Otherwise, it's the end of the basic block, so we lose. */
1693 return 0;
1695 case CODE_LABEL:
1696 case BARRIER:
1697 /* It's the end of the basic block, so we lose. */
1698 return 0;
1700 default:
1701 break;
1705 /* The "last use" that was recorded can't be found after the first
1706 use. This can happen when the last use was deleted while
1707 processing an inner loop, this inner loop was then completely
1708 unrolled, and the outer loop is always exited after the inner loop,
1709 so that everything after the first use becomes a single basic block. */
1710 return 1;
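/* Illustrative example (assumed): if INSN contains the first reference
   of reg 100 and the recorded last use is an ordinary insn later in the
   same basic block (before any jump, label or barrier), the function
   returns 1.  A jump insn that is itself the last use also returns 1,
   since that use still lies within the block.  */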
1713 /* Compute the benefit of eliminating the insns in the block whose
1714 last insn is LAST. This may be a group of insns used to compute a
1715 value directly, or it may contain a library call. */
1717 static int
1718 libcall_benefit (rtx last)
1720 rtx insn;
1721 int benefit = 0;
1723 for (insn = XEXP (find_reg_note (last, REG_RETVAL, NULL_RTX), 0);
1724 insn != last; insn = NEXT_INSN (insn))
1726 if (CALL_P (insn))
1727 benefit += 10; /* Assume at least this many insns in a library
1728 routine. */
1729 else if (NONJUMP_INSN_P (insn)
1730 && GET_CODE (PATTERN (insn)) != USE
1731 && GET_CODE (PATTERN (insn)) != CLOBBER)
1732 benefit++;
1735 return benefit;
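/* Worked example for libcall_benefit (illustrative numbers only):

       (insn ...)       ; load the function address   -> +1
       (call_insn ...)  ; the call itself             -> +10
       (use ...)        ; USE insns are not counted
       (insn ...)       ; LAST, carries REG_RETVAL; excluded from the walk

   gives a benefit of 11.  */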
1738 /* Skip COUNT insns from INSN, counting library calls as 1 insn. */
1740 static rtx
1741 skip_consec_insns (rtx insn, int count)
1743 for (; count > 0; count--)
1745 rtx temp;
1747 /* If first insn of libcall sequence, skip to end. */
1748 /* Do this at start of loop, since INSN is guaranteed to
1749 be an insn here. */
1750 if (!NOTE_P (insn)
1751 && (temp = find_reg_note (insn, REG_LIBCALL, NULL_RTX)))
1752 insn = XEXP (temp, 0);
1755 insn = NEXT_INSN (insn);
1756 while (NOTE_P (insn));
1759 return insn;
1762 /* Ignore any movable whose insn falls within a libcall
1763 which is part of another movable.
1764 We make use of the fact that the movable for the libcall value
1765 was made later and so appears later on the chain. */
1767 static void
1768 ignore_some_movables (struct loop_movables *movables)
1770 struct movable *m, *m1;
1772 for (m = movables->head; m; m = m->next)
1774 /* Is this a movable for the value of a libcall? */
1775 rtx note = find_reg_note (m->insn, REG_RETVAL, NULL_RTX);
1776 if (note)
1778 rtx insn;
1779 /* Check for earlier movables inside that range,
1780 and mark them invalid. We cannot use LUIDs here because
1781 insns created by loop.c for prior loops don't have LUIDs.
1782 Rather than reject all such insns from movables, we just
1783 explicitly check each insn in the libcall (since invariant
1784 libcalls aren't that common). */
1785 for (insn = XEXP (note, 0); insn != m->insn; insn = NEXT_INSN (insn))
1786 for (m1 = movables->head; m1 != m; m1 = m1->next)
1787 if (m1->insn == insn)
1788 m1->done = 1;
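/* Illustrative example (assumed): for a libcall block

       A  (insn with REG_LIBCALL note pointing at C)
       B  (insn that was also recorded as a movable)
       C  (insn with REG_RETVAL note pointing at A; the libcall movable)

   the walk above visits A and B while processing C's movable and marks
   B's earlier movable done, so only the libcall value itself is moved.  */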
1793 /* For each movable insn, see if the reg that it loads
1794 is last used (dies) directly in another conditionally movable insn.
1795 If so, record that the second insn "forces" the first one,
1796 since the second can be moved only if the first is. */
1798 static void
1799 force_movables (struct loop_movables *movables)
1801 struct movable *m, *m1;
1803 for (m1 = movables->head; m1; m1 = m1->next)
1804 /* Omit this if moving just the (SET (REG) 0) of a zero-extend. */
1805 if (!m1->partial && !m1->done)
1807 int regno = m1->regno;
1808 for (m = m1->next; m; m = m->next)
1809 /* ??? Could this be a bug? What if CSE caused the
1810 register of M1 to be used after this insn?
1811 Since CSE does not update regno_last_uid,
1812 this insn M->insn might not be where it dies.
1813 But very likely this doesn't matter; what matters is
1814 that M's reg is computed from M1's reg. */
1815 if (INSN_UID (m->insn) == REGNO_LAST_UID (regno)
1816 && !m->done)
1817 break;
1818 if (m != 0 && m->set_src == m1->set_dest
1819 /* If m->consec, m->set_src isn't valid. */
1820 && m->consec == 0)
1821 m = 0;
1823 /* Increase the priority of moving the first insn
1824 since it permits the second to be moved as well.
1825 Likewise for insns already forced by the first insn. */
1826 if (m != 0)
1828 struct movable *m2;
1830 m->forces = m1;
1831 for (m2 = m1; m2; m2 = m2->forces)
1833 m2->lifetime += m->lifetime;
1834 m2->savings += m->savings;
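/* Illustrative example (assumed): if M1 conditionally loads an invariant
   and M is the insn where M1's reg dies,

       M1:  (set (reg 100) (mem (symbol_ref "a")))
       M:   (set (reg 101) (plus:SI (reg 100) (const_int 4)))

   then M->FORCES is set to M1 and M1's lifetime and savings grow by
   M's, making it more attractive to move M1 (and hence M).  A plain
   copy whose SET_SRC is exactly M1's reg is excluded just above.  */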
1840 /* Find invariant expressions that are equal and can be combined into
1841 one register. */
1843 static void
1844 combine_movables (struct loop_movables *movables, struct loop_regs *regs)
1846 struct movable *m;
1847 char *matched_regs = xmalloc (regs->num);
1848 enum machine_mode mode;
1850 /* Regs that are set more than once are not allowed to match
1851 or be matched. I'm no longer sure why not. */
1852 /* Only pseudo registers are allowed to match or be matched,
1853 since move_movables does not validate the change. */
1854 /* Perhaps testing m->consec_sets would be more appropriate here? */
1856 for (m = movables->head; m; m = m->next)
1857 if (m->match == 0 && regs->array[m->regno].n_times_set == 1
1858 && m->regno >= FIRST_PSEUDO_REGISTER
1859 && !m->insert_temp
1860 && !m->partial)
1862 struct movable *m1;
1863 int regno = m->regno;
1865 memset (matched_regs, 0, regs->num);
1866 matched_regs[regno] = 1;
1868 /* We want later insns to match the first one. Don't make the first
1869 one match any later ones. So start this loop at m->next. */
1870 for (m1 = m->next; m1; m1 = m1->next)
1871 if (m != m1 && m1->match == 0
1872 && !m1->insert_temp
1873 && regs->array[m1->regno].n_times_set == 1
1874 && m1->regno >= FIRST_PSEUDO_REGISTER
1875 /* A reg used outside the loop mustn't be eliminated. */
1876 && !m1->global
1877 /* A reg used for zero-extending mustn't be eliminated. */
1878 && !m1->partial
1879 && (matched_regs[m1->regno]
1882 /* Can combine regs with different modes loaded from the
1883 same constant only if the modes are the same or
1884 if both are integer modes with M wider or the same
1885 width as M1. The check for integer is redundant, but
1886 safe, since the only case of differing destination
1887 modes with equal sources is when both sources are
1888 VOIDmode, i.e., CONST_INT. */
1889 (GET_MODE (m->set_dest) == GET_MODE (m1->set_dest)
1890 || (GET_MODE_CLASS (GET_MODE (m->set_dest)) == MODE_INT
1891 && GET_MODE_CLASS (GET_MODE (m1->set_dest)) == MODE_INT
1892 && (GET_MODE_BITSIZE (GET_MODE (m->set_dest))
1893 >= GET_MODE_BITSIZE (GET_MODE (m1->set_dest)))))
1894 /* See if the source of M1 says it matches M. */
1895 && ((REG_P (m1->set_src)
1896 && matched_regs[REGNO (m1->set_src)])
1897 || rtx_equal_for_loop_p (m->set_src, m1->set_src,
1898 movables, regs))))
1899 && ((m->dependencies == m1->dependencies)
1900 || rtx_equal_p (m->dependencies, m1->dependencies)))
1902 m->lifetime += m1->lifetime;
1903 m->savings += m1->savings;
1904 m1->done = 1;
1905 m1->match = m;
1906 matched_regs[m1->regno] = 1;
1910 /* Now combine the regs used for zero-extension.
1911 This can be done for those not marked `global'
1912 provided their lives don't overlap. */
1914 for (mode = GET_CLASS_NARROWEST_MODE (MODE_INT); mode != VOIDmode;
1915 mode = GET_MODE_WIDER_MODE (mode))
1917 struct movable *m0 = 0;
1919 /* Combine all the registers for extension from mode MODE.
1920 Don't combine any that are used outside this loop. */
1921 for (m = movables->head; m; m = m->next)
1922 if (m->partial && ! m->global
1923 && mode == GET_MODE (SET_SRC (PATTERN (NEXT_INSN (m->insn)))))
1925 struct movable *m1;
1927 int first = REGNO_FIRST_LUID (m->regno);
1928 int last = REGNO_LAST_LUID (m->regno);
1930 if (m0 == 0)
1932 /* First one: don't check for overlap, just record it. */
1933 m0 = m;
1934 continue;
1937 /* Make sure they extend to the same mode.
1938 (Almost always true.) */
1939 if (GET_MODE (m->set_dest) != GET_MODE (m0->set_dest))
1940 continue;
1942 /* We already have one: check for overlap with those
1943 already combined together. */
1944 for (m1 = movables->head; m1 != m; m1 = m1->next)
1945 if (m1 == m0 || (m1->partial && m1->match == m0))
1946 if (! (REGNO_FIRST_LUID (m1->regno) > last
1947 || REGNO_LAST_LUID (m1->regno) < first))
1948 goto overlap;
1950 /* No overlap: we can combine this with the others. */
1951 m0->lifetime += m->lifetime;
1952 m0->savings += m->savings;
1953 m->done = 1;
1954 m->match = m0;
1956 overlap:
1961 /* Clean up. */
1962 free (matched_regs);
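/* Illustrative example (assumed): two movables that load equal values,

       M:   (set (reg 100) (const_int 42))
       M1:  (set (reg 101) (const_int 42))

   are combined by pointing M1->MATCH at M; move_movables will later
   replace reg 101 with reg 100 throughout the loop and delete M1's
   insn, so a single register holds the value.  */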
1965 /* Returns the number of movable instructions in LOOP that were not
1966 moved outside the loop. */
1968 static int
1969 num_unmoved_movables (const struct loop *loop)
1971 int num = 0;
1972 struct movable *m;
1974 for (m = LOOP_MOVABLES (loop)->head; m; m = m->next)
1975 if (!m->done)
1976 ++num;
1978 return num;
1982 /* Return 1 if regs X and Y will become the same if moved. */
1984 static int
1985 regs_match_p (rtx x, rtx y, struct loop_movables *movables)
1987 unsigned int xn = REGNO (x);
1988 unsigned int yn = REGNO (y);
1989 struct movable *mx, *my;
1991 for (mx = movables->head; mx; mx = mx->next)
1992 if (mx->regno == xn)
1993 break;
1995 for (my = movables->head; my; my = my->next)
1996 if (my->regno == yn)
1997 break;
1999 return (mx && my
2000 && ((mx->match == my->match && mx->match != 0)
2001 || mx->match == my
2002 || mx == my->match));
2005 /* Return 1 if X and Y are identical-looking rtx's.
2006 This is the Lisp function EQUAL for rtx arguments.
2008 If two registers are matching movables or a movable register and an
2009 equivalent constant, consider them equal. */
2011 static int
2012 rtx_equal_for_loop_p (rtx x, rtx y, struct loop_movables *movables,
2013 struct loop_regs *regs)
2015 int i;
2016 int j;
2017 struct movable *m;
2018 enum rtx_code code;
2019 const char *fmt;
2021 if (x == y)
2022 return 1;
2023 if (x == 0 || y == 0)
2024 return 0;
2026 code = GET_CODE (x);
2028 /* If we have a register and a constant, they may sometimes be
2029 equal. */
2030 if (REG_P (x) && regs->array[REGNO (x)].set_in_loop == -2
2031 && CONSTANT_P (y))
2033 for (m = movables->head; m; m = m->next)
2034 if (m->move_insn && m->regno == REGNO (x)
2035 && rtx_equal_p (m->set_src, y))
2036 return 1;
2038 else if (REG_P (y) && regs->array[REGNO (y)].set_in_loop == -2
2039 && CONSTANT_P (x))
2041 for (m = movables->head; m; m = m->next)
2042 if (m->move_insn && m->regno == REGNO (y)
2043 && rtx_equal_p (m->set_src, x))
2044 return 1;
2047 /* Otherwise, rtx's of different codes cannot be equal. */
2048 if (code != GET_CODE (y))
2049 return 0;
2051 /* (MULT:SI x y) and (MULT:HI x y) are NOT equivalent.
2052 (REG:SI x) and (REG:HI x) are NOT equivalent. */
2054 if (GET_MODE (x) != GET_MODE (y))
2055 return 0;
2057 /* These three types of rtx's can be compared nonrecursively. */
2058 if (code == REG)
2059 return (REGNO (x) == REGNO (y) || regs_match_p (x, y, movables));
2061 if (code == LABEL_REF)
2062 return XEXP (x, 0) == XEXP (y, 0);
2063 if (code == SYMBOL_REF)
2064 return XSTR (x, 0) == XSTR (y, 0);
2066 /* Compare the elements. If any pair of corresponding elements
2067 fails to match, return 0 for the whole thing. */
2069 fmt = GET_RTX_FORMAT (code);
2070 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
2072 switch (fmt[i])
2074 case 'w':
2075 if (XWINT (x, i) != XWINT (y, i))
2076 return 0;
2077 break;
2079 case 'i':
2080 if (XINT (x, i) != XINT (y, i))
2081 return 0;
2082 break;
2084 case 'E':
2085 /* Two vectors must have the same length. */
2086 if (XVECLEN (x, i) != XVECLEN (y, i))
2087 return 0;
2089 /* And the corresponding elements must match. */
2090 for (j = 0; j < XVECLEN (x, i); j++)
2091 if (rtx_equal_for_loop_p (XVECEXP (x, i, j), XVECEXP (y, i, j),
2092 movables, regs) == 0)
2093 return 0;
2094 break;
2096 case 'e':
2097 if (rtx_equal_for_loop_p (XEXP (x, i), XEXP (y, i), movables, regs)
2098 == 0)
2099 return 0;
2100 break;
2102 case 's':
2103 if (strcmp (XSTR (x, i), XSTR (y, i)))
2104 return 0;
2105 break;
2107 case 'u':
2108 /* These are just backpointers, so they don't matter. */
2109 break;
2111 case '0':
2112 break;
2114 /* It is believed that rtx's at this level will never
2115 contain anything but integers and other rtx's,
2116 except for within LABEL_REFs and SYMBOL_REFs. */
2117 default:
2118 gcc_unreachable ();
2121 return 1;
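/* Illustrative example (assumed): if (reg:SI 100) belongs to a movable
   with MOVE_INSN set, SET_SRC (const_int 42) and set_in_loop == -2,
   then

       rtx_equal_for_loop_p ((plus:SI (reg:SI 102) (reg:SI 100)),
                             (plus:SI (reg:SI 102) (const_int 42)), ...)

   returns 1: the register and its known constant value are treated as
   equal by the special cases above.  */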
2124 /* If X contains any LABEL_REF's, add REG_LABEL notes for them to all
2125 insns in INSNS which use the reference. LABEL_NUSES for CODE_LABEL
2126 references is incremented once for each added note. */
2128 static void
2129 add_label_notes (rtx x, rtx insns)
2131 enum rtx_code code = GET_CODE (x);
2132 int i, j;
2133 const char *fmt;
2134 rtx insn;
2136 if (code == LABEL_REF && !LABEL_REF_NONLOCAL_P (x))
2138 /* This code used to ignore labels that referred to dispatch tables to
2139 avoid flow generating (slightly) worse code.
2141 We no longer ignore such label references (see LABEL_REF handling in
2142 mark_jump_label for additional information). */
2143 for (insn = insns; insn; insn = NEXT_INSN (insn))
2144 if (reg_mentioned_p (XEXP (x, 0), insn))
2146 REG_NOTES (insn) = gen_rtx_INSN_LIST (REG_LABEL, XEXP (x, 0),
2147 REG_NOTES (insn));
2148 if (LABEL_P (XEXP (x, 0)))
2149 LABEL_NUSES (XEXP (x, 0))++;
2153 fmt = GET_RTX_FORMAT (code);
2154 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
2156 if (fmt[i] == 'e')
2157 add_label_notes (XEXP (x, i), insns);
2158 else if (fmt[i] == 'E')
2159 for (j = XVECLEN (x, i) - 1; j >= 0; j--)
2160 add_label_notes (XVECEXP (x, i, j), insns);
2164 /* Scan MOVABLES, and move the insns that deserve to be moved.
2165 If two matching movables are combined, replace one reg with the
2166 other throughout. */
2168 static void
2169 move_movables (struct loop *loop, struct loop_movables *movables,
2170 int threshold, int insn_count)
2172 struct loop_regs *regs = LOOP_REGS (loop);
2173 int nregs = regs->num;
2174 rtx new_start = 0;
2175 struct movable *m;
2176 rtx p;
2177 rtx loop_start = loop->start;
2178 rtx loop_end = loop->end;
2179 /* Map of pseudo-register replacements to handle combining
2180 when we move several insns that load the same value
2181 into different pseudo-registers. */
2182 rtx *reg_map = xcalloc (nregs, sizeof (rtx));
2183 char *already_moved = xcalloc (nregs, sizeof (char));
2185 for (m = movables->head; m; m = m->next)
2187 /* Describe this movable insn. */
2189 if (loop_dump_stream)
2191 fprintf (loop_dump_stream, "Insn %d: regno %d (life %d), ",
2192 INSN_UID (m->insn), m->regno, m->lifetime);
2193 if (m->consec > 0)
2194 fprintf (loop_dump_stream, "consec %d, ", m->consec);
2195 if (m->cond)
2196 fprintf (loop_dump_stream, "cond ");
2197 if (m->force)
2198 fprintf (loop_dump_stream, "force ");
2199 if (m->global)
2200 fprintf (loop_dump_stream, "global ");
2201 if (m->done)
2202 fprintf (loop_dump_stream, "done ");
2203 if (m->move_insn)
2204 fprintf (loop_dump_stream, "move-insn ");
2205 if (m->match)
2206 fprintf (loop_dump_stream, "matches %d ",
2207 INSN_UID (m->match->insn));
2208 if (m->forces)
2209 fprintf (loop_dump_stream, "forces %d ",
2210 INSN_UID (m->forces->insn));
2213 /* Ignore the insn if it's already done (it matched something else).
2214 Otherwise, see if it is now safe to move. */
2216 if (!m->done
2217 && (! m->cond
2218 || (1 == loop_invariant_p (loop, m->set_src)
2219 && (m->dependencies == 0
2220 || 1 == loop_invariant_p (loop, m->dependencies))
2221 && (m->consec == 0
2222 || 1 == consec_sets_invariant_p (loop, m->set_dest,
2223 m->consec + 1,
2224 m->insn))))
2225 && (! m->forces || m->forces->done))
2227 int regno;
2228 rtx p;
2229 int savings = m->savings;
2231 /* We have an insn that is safe to move.
2232 Compute its desirability. */
2234 p = m->insn;
2235 regno = m->regno;
2237 if (loop_dump_stream)
2238 fprintf (loop_dump_stream, "savings %d ", savings);
2240 if (regs->array[regno].moved_once && loop_dump_stream)
2241 fprintf (loop_dump_stream, "halved since already moved ");
2243 /* An insn MUST be moved if we already moved something else
2244 which is safe only if this one is moved too: that is,
2245 if already_moved[REGNO] is nonzero. */
2247 /* An insn is desirable to move if the new lifetime of the
2248 register is no more than THRESHOLD times the old lifetime.
2249 If it's not desirable, it means the loop is so big
2250 that moving won't speed things up much,
2251 and it is liable to make register usage worse. */
2253 /* It is also desirable to move if it can be moved at no
2254 extra cost because something else was already moved. */
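              /* Worked example with assumed numbers (illustrative only):
                 with THRESHOLD == 3, SAVINGS == 2 and LIFETIME == 10,
                 the product is 3 * 2 * 10 == 60, so the move is accepted
                 when INSN_COUNT <= 60; if the reg was already moved out
                 of another loop the bar doubles, requiring
                 INSN_COUNT <= 30.  */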
2256 if (already_moved[regno]
2257 || (threshold * savings * m->lifetime) >=
2258 (regs->array[regno].moved_once ? insn_count * 2 : insn_count)
2259 || (m->forces && m->forces->done
2260 && regs->array[m->forces->regno].n_times_set == 1))
2262 int count;
2263 struct movable *m1;
2264 rtx first = NULL_RTX;
2265 rtx newreg = NULL_RTX;
2267 if (m->insert_temp)
2268 newreg = gen_reg_rtx (GET_MODE (m->set_dest));
2270 /* Now move the insns that set the reg. */
2272 if (m->partial && m->match)
2274 rtx newpat, i1;
2275 rtx r1, r2;
2276 /* Find the end of this chain of matching regs.
2277 Thus, we load each reg in the chain from that one reg.
2278 And that reg is loaded with 0 directly,
2279 since it has ->match == 0. */
2280 for (m1 = m; m1->match; m1 = m1->match);
2281 newpat = gen_move_insn (SET_DEST (PATTERN (m->insn)),
2282 SET_DEST (PATTERN (m1->insn)));
2283 i1 = loop_insn_hoist (loop, newpat);
2285 /* Mark the moved, invariant reg as being allowed to
2286 share a hard reg with the other matching invariant. */
2287 REG_NOTES (i1) = REG_NOTES (m->insn);
2288 r1 = SET_DEST (PATTERN (m->insn));
2289 r2 = SET_DEST (PATTERN (m1->insn));
2290 regs_may_share
2291 = gen_rtx_EXPR_LIST (VOIDmode, r1,
2292 gen_rtx_EXPR_LIST (VOIDmode, r2,
2293 regs_may_share));
2294 delete_insn (m->insn);
2296 if (new_start == 0)
2297 new_start = i1;
2299 if (loop_dump_stream)
2300 fprintf (loop_dump_stream, " moved to %d", INSN_UID (i1));
2302 /* If we are to re-generate the item being moved with a
2303 new move insn, first delete what we have and then emit
2304 the move insn before the loop. */
2305 else if (m->move_insn)
2307 rtx i1, temp, seq;
2309 for (count = m->consec; count >= 0; count--)
2311 if (!NOTE_P (p))
2313 /* If this is the first insn of a library
2314 call sequence, something is very
2315 wrong. */
2316 gcc_assert (!find_reg_note
2317 (p, REG_LIBCALL, NULL_RTX));
2319 /* If this is the last insn of a libcall
2320 sequence, then delete every insn in the
2321 sequence except the last. The last insn
2322 is handled in the normal manner. */
2323 temp = find_reg_note (p, REG_RETVAL, NULL_RTX);
2325 if (temp)
2327 temp = XEXP (temp, 0);
2328 while (temp != p)
2329 temp = delete_insn (temp);
2333 temp = p;
2334 p = delete_insn (p);
2336 /* simplify_giv_expr expects that it can walk the insns
2337 at m->insn forwards and see this old sequence we are
2338 tossing here. delete_insn does preserve the next
2339 pointers, but when we skip over a NOTE we must fix
2340 it up. Otherwise that code walks into the non-deleted
2341 insn stream. */
2342 while (p && NOTE_P (p))
2343 p = NEXT_INSN (temp) = NEXT_INSN (p);
2345 if (m->insert_temp)
2347 /* Replace the original insn with a move from
2348 our newly created temp. */
2349 start_sequence ();
2350 emit_move_insn (m->set_dest, newreg);
2351 seq = get_insns ();
2352 end_sequence ();
2353 emit_insn_before (seq, p);
2357 start_sequence ();
2358 emit_move_insn (m->insert_temp ? newreg : m->set_dest,
2359 m->set_src);
2360 seq = get_insns ();
2361 end_sequence ();
2363 add_label_notes (m->set_src, seq);
2365 i1 = loop_insn_hoist (loop, seq);
2366 if (! find_reg_note (i1, REG_EQUAL, NULL_RTX))
2367 set_unique_reg_note (i1,
2368 m->is_equiv ? REG_EQUIV : REG_EQUAL,
2369 m->set_src);
2371 if (loop_dump_stream)
2372 fprintf (loop_dump_stream, " moved to %d", INSN_UID (i1));
2374 /* The more regs we move, the less we like moving them. */
2375 threshold -= 3;
2377 else
2379 for (count = m->consec; count >= 0; count--)
2381 rtx i1, temp;
2383 /* If first insn of libcall sequence, skip to end. */
2384 /* Do this at start of loop, since p is guaranteed to
2385 be an insn here. */
2386 if (!NOTE_P (p)
2387 && (temp = find_reg_note (p, REG_LIBCALL, NULL_RTX)))
2388 p = XEXP (temp, 0);
2390 /* If last insn of libcall sequence, move all
2391 insns except the last before the loop. The last
2392 insn is handled in the normal manner. */
2393 if (!NOTE_P (p)
2394 && (temp = find_reg_note (p, REG_RETVAL, NULL_RTX)))
2396 rtx fn_address = 0;
2397 rtx fn_reg = 0;
2398 rtx fn_address_insn = 0;
2400 first = 0;
2401 for (temp = XEXP (temp, 0); temp != p;
2402 temp = NEXT_INSN (temp))
2404 rtx body;
2405 rtx n;
2406 rtx next;
2408 if (NOTE_P (temp))
2409 continue;
2411 body = PATTERN (temp);
2413 /* Find the next insn after TEMP,
2414 not counting USE or NOTE insns. */
2415 for (next = NEXT_INSN (temp); next != p;
2416 next = NEXT_INSN (next))
2417 if (! (NONJUMP_INSN_P (next)
2418 && GET_CODE (PATTERN (next)) == USE)
2419 && !NOTE_P (next))
2420 break;
2422 /* If that is the call, this may be the insn
2423 that loads the function address.
2425 Extract the function address from the insn
2426 that loads it into a register.
2427 If this insn was cse'd, we get incorrect code.
2429 So emit a new move insn that copies the
2430 function address into the register that the
2431 call insn will use. flow.c will delete any
2432 redundant stores that we have created. */
2433 if (CALL_P (next)
2434 && GET_CODE (body) == SET
2435 && REG_P (SET_DEST (body))
2436 && (n = find_reg_note (temp, REG_EQUAL,
2437 NULL_RTX)))
2439 fn_reg = SET_SRC (body);
2440 if (!REG_P (fn_reg))
2441 fn_reg = SET_DEST (body);
2442 fn_address = XEXP (n, 0);
2443 fn_address_insn = temp;
2445 /* We have the call insn.
2446 If it uses the register we suspect it might,
2447 load it with the correct address directly. */
2448 if (CALL_P (temp)
2449 && fn_address != 0
2450 && reg_referenced_p (fn_reg, body))
2451 loop_insn_emit_after (loop, 0, fn_address_insn,
2452 gen_move_insn
2453 (fn_reg, fn_address));
2455 if (CALL_P (temp))
2457 i1 = loop_call_insn_hoist (loop, body);
2458 /* Because the USAGE information potentially
2459 contains objects other than hard registers
2460 we need to copy it. */
2461 if (CALL_INSN_FUNCTION_USAGE (temp))
2462 CALL_INSN_FUNCTION_USAGE (i1)
2463 = copy_rtx (CALL_INSN_FUNCTION_USAGE (temp));
2465 else
2466 i1 = loop_insn_hoist (loop, body);
2467 if (first == 0)
2468 first = i1;
2469 if (temp == fn_address_insn)
2470 fn_address_insn = i1;
2471 REG_NOTES (i1) = REG_NOTES (temp);
2472 REG_NOTES (temp) = NULL;
2473 delete_insn (temp);
2475 if (new_start == 0)
2476 new_start = first;
2478 if (m->savemode != VOIDmode)
2480 /* P sets REG to zero; but we should clear only
2481 the bits that are not covered by the mode
2482 m->savemode. */
2483 rtx reg = m->set_dest;
2484 rtx sequence;
2485 rtx tem;
2487 start_sequence ();
2488 tem = expand_simple_binop
2489 (GET_MODE (reg), AND, reg,
2490 GEN_INT ((((HOST_WIDE_INT) 1
2491 << GET_MODE_BITSIZE (m->savemode)))
2492 - 1),
2493 reg, 1, OPTAB_LIB_WIDEN);
2494 gcc_assert (tem);
2495 if (tem != reg)
2496 emit_move_insn (reg, tem);
2497 sequence = get_insns ();
2498 end_sequence ();
2499 i1 = loop_insn_hoist (loop, sequence);
2501 else if (CALL_P (p))
2503 i1 = loop_call_insn_hoist (loop, PATTERN (p));
2504 /* Because the USAGE information potentially
2505 contains objects other than hard registers
2506 we need to copy it. */
2507 if (CALL_INSN_FUNCTION_USAGE (p))
2508 CALL_INSN_FUNCTION_USAGE (i1)
2509 = copy_rtx (CALL_INSN_FUNCTION_USAGE (p));
2511 else if (count == m->consec && m->move_insn_first)
2513 rtx seq;
2514 /* The SET_SRC might not be invariant, so we must
2515 use the REG_EQUAL note. */
2516 start_sequence ();
2517 emit_move_insn (m->insert_temp ? newreg : m->set_dest,
2518 m->set_src);
2519 seq = get_insns ();
2520 end_sequence ();
2522 add_label_notes (m->set_src, seq);
2524 i1 = loop_insn_hoist (loop, seq);
2525 if (! find_reg_note (i1, REG_EQUAL, NULL_RTX))
2526 set_unique_reg_note (i1, m->is_equiv ? REG_EQUIV
2527 : REG_EQUAL, m->set_src);
2529 else if (m->insert_temp)
2531 rtx *reg_map2 = xcalloc (REGNO (newreg),
2532 sizeof(rtx));
2533 reg_map2 [m->regno] = newreg;
2535 i1 = loop_insn_hoist (loop, copy_rtx (PATTERN (p)));
2536 replace_regs (i1, reg_map2, REGNO (newreg), 1);
2537 free (reg_map2);
2539 else
2540 i1 = loop_insn_hoist (loop, PATTERN (p));
2542 if (REG_NOTES (i1) == 0)
2544 REG_NOTES (i1) = REG_NOTES (p);
2545 REG_NOTES (p) = NULL;
2547 /* If there is a REG_EQUAL note present whose value
2548 is not loop invariant, then delete it, since it
2549 may cause problems with later optimization passes.
2550 It is possible for cse to create such notes
2551 as a result of record_jump_cond. */
2553 if ((temp = find_reg_note (i1, REG_EQUAL, NULL_RTX))
2554 && ! loop_invariant_p (loop, XEXP (temp, 0)))
2555 remove_note (i1, temp);
2558 if (new_start == 0)
2559 new_start = i1;
2561 if (loop_dump_stream)
2562 fprintf (loop_dump_stream, " moved to %d",
2563 INSN_UID (i1));
2565 /* If library call, now fix the REG_NOTES that contain
2566 insn pointers, namely REG_LIBCALL on FIRST
2567 and REG_RETVAL on I1. */
2568 if ((temp = find_reg_note (i1, REG_RETVAL, NULL_RTX)))
2570 XEXP (temp, 0) = first;
2571 temp = find_reg_note (first, REG_LIBCALL, NULL_RTX);
2572 XEXP (temp, 0) = i1;
2575 temp = p;
2576 delete_insn (p);
2577 p = NEXT_INSN (p);
2579 /* simplify_giv_expr expects that it can walk the insns
2580 at m->insn forwards and see this old sequence we are
2581 tossing here. delete_insn does preserve the next
2582 pointers, but when we skip over a NOTE we must fix
2583 it up. Otherwise that code walks into the non-deleted
2584 insn stream. */
2585 while (p && NOTE_P (p))
2586 p = NEXT_INSN (temp) = NEXT_INSN (p);
2588 if (m->insert_temp)
2590 rtx seq;
2591 /* Replace the original insn with a move from
2592 our newly created temp. */
2593 start_sequence ();
2594 emit_move_insn (m->set_dest, newreg);
2595 seq = get_insns ();
2596 end_sequence ();
2597 emit_insn_before (seq, p);
2601 /* The more regs we move, the less we like moving them. */
2602 threshold -= 3;
2605 m->done = 1;
2607 if (!m->insert_temp)
2609 /* Any other movable that loads the same register
2610 MUST be moved. */
2611 already_moved[regno] = 1;
2613 /* This reg has been moved out of one loop. */
2614 regs->array[regno].moved_once = 1;
2616 /* The reg set here is now invariant. */
2617 if (! m->partial)
2619 int i;
2620 for (i = 0; i < LOOP_REGNO_NREGS (regno, m->set_dest); i++)
2621 regs->array[regno+i].set_in_loop = 0;
2624 /* Change the length-of-life info for the register
2625 to say it lives at least the full length of this loop.
2626 This will help guide optimizations in outer loops. */
2628 if (REGNO_FIRST_LUID (regno) > INSN_LUID (loop_start))
2629 /* This is the old insn before all the moved insns.
2630 We can't use the moved insn because it is out of range
2631 in uid_luid. Only the old insns have luids. */
2632 REGNO_FIRST_UID (regno) = INSN_UID (loop_start);
2633 if (REGNO_LAST_LUID (regno) < INSN_LUID (loop_end))
2634 REGNO_LAST_UID (regno) = INSN_UID (loop_end);
2637 /* Combine with this moved insn any other matching movables. */
2639 if (! m->partial)
2640 for (m1 = movables->head; m1; m1 = m1->next)
2641 if (m1->match == m)
2643 rtx temp;
2645 /* Schedule the reg loaded by M1
2646 for replacement so that it shares the reg of M.
2647 If the modes differ (only possible in restricted
2648 circumstances), make a SUBREG.
2650 Note this assumes that the target dependent files
2651 treat REG and SUBREG equally, including within
2652 GO_IF_LEGITIMATE_ADDRESS and in all the
2653 predicates since we never verify that replacing the
2654 original register with a SUBREG results in a
2655 recognizable insn. */
2656 if (GET_MODE (m->set_dest) == GET_MODE (m1->set_dest))
2657 reg_map[m1->regno] = m->set_dest;
2658 else
2659 reg_map[m1->regno]
2660 = gen_lowpart_common (GET_MODE (m1->set_dest),
2661 m->set_dest);
2663 /* Get rid of the matching insn
2664 and prevent further processing of it. */
2665 m1->done = 1;
2667 /* If library call, delete all insns. */
2668 if ((temp = find_reg_note (m1->insn, REG_RETVAL,
2669 NULL_RTX)))
2670 delete_insn_chain (XEXP (temp, 0), m1->insn);
2671 else
2672 delete_insn (m1->insn);
2674 /* Any other movable that loads the same register
2675 MUST be moved. */
2676 already_moved[m1->regno] = 1;
2678 /* The reg merged here is now invariant,
2679 if the reg it matches is invariant. */
2680 if (! m->partial)
2682 int i;
2683 for (i = 0;
2684 i < LOOP_REGNO_NREGS (regno, m1->set_dest);
2685 i++)
2686 regs->array[m1->regno+i].set_in_loop = 0;
2690 else if (loop_dump_stream)
2691 fprintf (loop_dump_stream, "not desirable");
2693 else if (loop_dump_stream && !m->match)
2694 fprintf (loop_dump_stream, "not safe");
2696 if (loop_dump_stream)
2697 fprintf (loop_dump_stream, "\n");
2700 if (new_start == 0)
2701 new_start = loop_start;
2703 /* Go through all the instructions in the loop, making
2704 all the register substitutions scheduled in REG_MAP. */
2705 for (p = new_start; p != loop_end; p = NEXT_INSN (p))
2706 if (INSN_P (p))
2708 replace_regs (PATTERN (p), reg_map, nregs, 0);
2709 replace_regs (REG_NOTES (p), reg_map, nregs, 0);
2710 INSN_CODE (p) = -1;
2713 /* Clean up. */
2714 free (reg_map);
2715 free (already_moved);
2719 static void
2720 loop_movables_add (struct loop_movables *movables, struct movable *m)
2722 if (movables->head == 0)
2723 movables->head = m;
2724 else
2725 movables->last->next = m;
2726 movables->last = m;
2730 static void
2731 loop_movables_free (struct loop_movables *movables)
2733 struct movable *m;
2734 struct movable *m_next;
2736 for (m = movables->head; m; m = m_next)
2738 m_next = m->next;
2739 free (m);
2743 #if 0
2744 /* Scan X and replace the address of any MEM in it with ADDR.
2745 REG is the address that MEM should have before the replacement. */
2747 static void
2748 replace_call_address (rtx x, rtx reg, rtx addr)
2750 enum rtx_code code;
2751 int i;
2752 const char *fmt;
2754 if (x == 0)
2755 return;
2756 code = GET_CODE (x);
2757 switch (code)
2759 case PC:
2760 case CC0:
2761 case CONST_INT:
2762 case CONST_DOUBLE:
2763 case CONST:
2764 case SYMBOL_REF:
2765 case LABEL_REF:
2766 case REG:
2767 return;
2769 case SET:
2770 /* Short cut for very common case. */
2771 replace_call_address (XEXP (x, 1), reg, addr);
2772 return;
2774 case CALL:
2775 /* Short cut for very common case. */
2776 replace_call_address (XEXP (x, 0), reg, addr);
2777 return;
2779 case MEM:
2780 /* If this MEM uses a reg other than the one we expected,
2781 something is wrong. */
2782 gcc_assert (XEXP (x, 0) == reg);
2783 XEXP (x, 0) = addr;
2784 return;
2786 default:
2787 break;
2790 fmt = GET_RTX_FORMAT (code);
2791 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
2793 if (fmt[i] == 'e')
2794 replace_call_address (XEXP (x, i), reg, addr);
2795 else if (fmt[i] == 'E')
2797 int j;
2798 for (j = 0; j < XVECLEN (x, i); j++)
2799 replace_call_address (XVECEXP (x, i, j), reg, addr);
2803 #endif
2805 /* Return the number of memory refs to addresses that vary
2806 in the rtx X. */
2808 static int
2809 count_nonfixed_reads (const struct loop *loop, rtx x)
2811 enum rtx_code code;
2812 int i;
2813 const char *fmt;
2814 int value;
2816 if (x == 0)
2817 return 0;
2819 code = GET_CODE (x);
2820 switch (code)
2822 case PC:
2823 case CC0:
2824 case CONST_INT:
2825 case CONST_DOUBLE:
2826 case CONST:
2827 case SYMBOL_REF:
2828 case LABEL_REF:
2829 case REG:
2830 return 0;
2832 case MEM:
2833 return ((loop_invariant_p (loop, XEXP (x, 0)) != 1)
2834 + count_nonfixed_reads (loop, XEXP (x, 0)));
2836 default:
2837 break;
2840 value = 0;
2841 fmt = GET_RTX_FORMAT (code);
2842 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
2844 if (fmt[i] == 'e')
2845 value += count_nonfixed_reads (loop, XEXP (x, i));
2846 if (fmt[i] == 'E')
2848 int j;
2849 for (j = 0; j < XVECLEN (x, i); j++)
2850 value += count_nonfixed_reads (loop, XVECEXP (x, i, j));
2853 return value;
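/* Illustrative example (assumed): for

       (mem:SI (plus:SI (reg:SI 100) (const_int 4)))

   where reg 100 is set inside the loop, the address fails
   loop_invariant_p and the function returns 1; were the address
   invariant, the result would be 0.  */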
2856 /* Scan a loop setting the elements `loops_enclosed',
2857 `has_call', `has_nonconst_call', `has_volatile', `has_tablejump',
2858 `unknown_address_altered', `unknown_constant_address_altered', and
2859 `num_mem_sets' in LOOP. Also, fill in the array `mems' and the
2860 list `store_mems' in LOOP. */
2862 static void
2863 prescan_loop (struct loop *loop)
2865 int level = 1;
2866 rtx insn;
2867 struct loop_info *loop_info = LOOP_INFO (loop);
2868 rtx start = loop->start;
2869 rtx end = loop->end;
2870 /* The label after END. Jumping here is just like falling off the
2871 end of the loop. We use next_nonnote_insn instead of next_label
2872 as a hedge against the (pathological) case where some actual insn
2873 might end up between the two. */
2874 rtx exit_target = next_nonnote_insn (end);
2876 loop_info->has_indirect_jump = indirect_jump_in_function;
2877 loop_info->pre_header_has_call = 0;
2878 loop_info->has_call = 0;
2879 loop_info->has_nonconst_call = 0;
2880 loop_info->has_prefetch = 0;
2881 loop_info->has_volatile = 0;
2882 loop_info->has_tablejump = 0;
2883 loop_info->has_multiple_exit_targets = 0;
2884 loop->level = 1;
2886 loop_info->unknown_address_altered = 0;
2887 loop_info->unknown_constant_address_altered = 0;
2888 loop_info->store_mems = NULL_RTX;
2889 loop_info->first_loop_store_insn = NULL_RTX;
2890 loop_info->mems_idx = 0;
2891 loop_info->num_mem_sets = 0;
2893 for (insn = start; insn && !LABEL_P (insn);
2894 insn = PREV_INSN (insn))
2896 if (CALL_P (insn))
2898 loop_info->pre_header_has_call = 1;
2899 break;
2903 for (insn = NEXT_INSN (start); insn != NEXT_INSN (end);
2904 insn = NEXT_INSN (insn))
2906 switch (GET_CODE (insn))
2908 case NOTE:
2909 if (NOTE_LINE_NUMBER (insn) == NOTE_INSN_LOOP_BEG)
2911 ++level;
2912 /* Count number of loops contained in this one. */
2913 loop->level++;
2915 else if (NOTE_LINE_NUMBER (insn) == NOTE_INSN_LOOP_END)
2916 --level;
2917 break;
2919 case CALL_INSN:
2920 if (! CONST_OR_PURE_CALL_P (insn))
2922 loop_info->unknown_address_altered = 1;
2923 loop_info->has_nonconst_call = 1;
2925 else if (pure_call_p (insn))
2926 loop_info->has_nonconst_call = 1;
2927 loop_info->has_call = 1;
2928 if (can_throw_internal (insn))
2929 loop_info->has_multiple_exit_targets = 1;
2930 break;
2932 case JUMP_INSN:
2933 if (! loop_info->has_multiple_exit_targets)
2935 rtx set = pc_set (insn);
2937 if (set)
2939 rtx src = SET_SRC (set);
2940 rtx label1, label2;
2942 if (GET_CODE (src) == IF_THEN_ELSE)
2944 label1 = XEXP (src, 1);
2945 label2 = XEXP (src, 2);
2947 else
2949 label1 = src;
2950 label2 = NULL_RTX;
2955 if (label1 && label1 != pc_rtx)
2957 if (GET_CODE (label1) != LABEL_REF)
2959 /* Something tricky. */
2960 loop_info->has_multiple_exit_targets = 1;
2961 break;
2963 else if (XEXP (label1, 0) != exit_target
2964 && LABEL_OUTSIDE_LOOP_P (label1))
2966 /* A jump outside the current loop. */
2967 loop_info->has_multiple_exit_targets = 1;
2968 break;
2972 label1 = label2;
2973 label2 = NULL_RTX;
2975 while (label1);
2977 else
2979 /* A return, or something tricky. */
2980 loop_info->has_multiple_exit_targets = 1;
2983 /* Fall through. */
2985 case INSN:
2986 if (volatile_refs_p (PATTERN (insn)))
2987 loop_info->has_volatile = 1;
2989 if (JUMP_P (insn)
2990 && (GET_CODE (PATTERN (insn)) == ADDR_DIFF_VEC
2991 || GET_CODE (PATTERN (insn)) == ADDR_VEC))
2992 loop_info->has_tablejump = 1;
2994 note_stores (PATTERN (insn), note_addr_stored, loop_info);
2995 if (! loop_info->first_loop_store_insn && loop_info->store_mems)
2996 loop_info->first_loop_store_insn = insn;
2998 if (flag_non_call_exceptions && can_throw_internal (insn))
2999 loop_info->has_multiple_exit_targets = 1;
3000 break;
3002 default:
3003 break;
3007 /* Now, rescan the loop, setting up the LOOP_MEMS array. */
3008 if (/* An exception thrown by a called function might land us
3009 anywhere. */
3010 ! loop_info->has_nonconst_call
3011 /* We don't want loads for MEMs moved to a location before the
3012 one at which their stack memory becomes allocated. (Note
3013 that this is not a problem for malloc, etc., since those
3014 require actual function calls.) */
3015 && ! current_function_calls_alloca
3016 /* There are ways to leave the loop other than falling off the
3017 end. */
3018 && ! loop_info->has_multiple_exit_targets)
3019 for (insn = NEXT_INSN (start); insn != NEXT_INSN (end);
3020 insn = NEXT_INSN (insn))
3021 for_each_rtx (&insn, insert_loop_mem, loop_info);
3023 /* BLKmode MEMs are added to LOOP_STORE_MEM as necessary so
3024 that loop_invariant_p and load_mems can use true_dependence
3025 to determine what is really clobbered. */
3026 if (loop_info->unknown_address_altered)
3028 rtx mem = gen_rtx_MEM (BLKmode, const0_rtx);
3030 loop_info->store_mems
3031 = gen_rtx_EXPR_LIST (VOIDmode, mem, loop_info->store_mems);
3033 if (loop_info->unknown_constant_address_altered)
3035 rtx mem = gen_rtx_MEM (BLKmode, const0_rtx);
3036 MEM_READONLY_P (mem) = 1;
3037 loop_info->store_mems
3038 = gen_rtx_EXPR_LIST (VOIDmode, mem, loop_info->store_mems);
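/* Illustrative note (an interpretation, not from the original comments):
   the (mem:BLK (const_int 0)) entries added above act as wildcard
   stores.  Since true_dependence treats a BLKmode MEM as conflicting
   with any load, once unknown_address_altered is set no MEM in the loop
   will be judged invariant; the read-only variant likewise invalidates
   loads from constant addresses.  */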
3042 /* Invalidate all loops containing LABEL. */
3044 static void
3045 invalidate_loops_containing_label (rtx label)
3047 struct loop *loop;
3048 for (loop = uid_loop[INSN_UID (label)]; loop; loop = loop->outer)
3049 loop->invalid = 1;
3052 /* Scan the function looking for loops. Record the start and end of each loop.
3053 Also mark as invalid any loops that contain a setjmp or are branched
3054 to from outside the loop. */
3056 static void
3057 find_and_verify_loops (rtx f, struct loops *loops)
3059 rtx insn;
3060 rtx label;
3061 int num_loops;
3062 struct loop *current_loop;
3063 struct loop *next_loop;
3064 struct loop *loop;
3066 num_loops = loops->num;
3068 compute_luids (f, NULL_RTX, 0);
3070 /* If there are jumps to undefined labels,
3071 treat them as jumps out of any/all loops.
3072 This also avoids writing past end of tables when there are no loops. */
3073 uid_loop[0] = NULL;
3075 /* Find boundaries of loops, mark which loops are contained within
3076 loops, and invalidate loops that have setjmp. */
3078 num_loops = 0;
3079 current_loop = NULL;
3080 for (insn = f; insn; insn = NEXT_INSN (insn))
3082 if (NOTE_P (insn))
3083 switch (NOTE_LINE_NUMBER (insn))
3085 case NOTE_INSN_LOOP_BEG:
3086 next_loop = loops->array + num_loops;
3087 next_loop->num = num_loops;
3088 num_loops++;
3089 next_loop->start = insn;
3090 next_loop->outer = current_loop;
3091 current_loop = next_loop;
3092 break;
3094 case NOTE_INSN_LOOP_END:
3095 gcc_assert (current_loop);
3097 current_loop->end = insn;
3098 current_loop = current_loop->outer;
3099 break;
3101 default:
3102 break;
3105 if (CALL_P (insn)
3106 && find_reg_note (insn, REG_SETJMP, NULL))
3108 /* In this case, we must invalidate our current loop and any
3109 enclosing loop. */
3110 for (loop = current_loop; loop; loop = loop->outer)
3112 loop->invalid = 1;
3113 if (loop_dump_stream)
3114 fprintf (loop_dump_stream,
3115 "\nLoop at %d ignored due to setjmp.\n",
3116 INSN_UID (loop->start));
3120 /* Note that this will mark the NOTE_INSN_LOOP_END note as being in the
3121 enclosing loop, but this doesn't matter. */
3122 uid_loop[INSN_UID (insn)] = current_loop;
3125 /* Any loop containing a label used in an initializer must be invalidated,
3126 because it can be jumped into from anywhere. */
3127 for (label = forced_labels; label; label = XEXP (label, 1))
3128 invalidate_loops_containing_label (XEXP (label, 0));
3130 /* Any loop containing a label used for an exception handler must be
3131 invalidated, because it can be jumped into from anywhere. */
3132 for_each_eh_label (invalidate_loops_containing_label);
3134 /* Now scan all insn's in the function. If any JUMP_INSN branches into a
3135 loop that it is not contained within, that loop is marked invalid.
3136 If any INSN or CALL_INSN uses a label's address, then the loop containing
3137 that label is marked invalid, because it could be jumped into from
3138 anywhere.
3140 Also look for blocks of code ending in an unconditional branch that
3141 exits the loop. If such a block is surrounded by a conditional
3142 branch around the block, move the block elsewhere (see below) and
3143 invert the jump to point to the code block. This may eliminate a
3144 label in our loop and will simplify processing by both us and a
3145 possible second cse pass. */
3147 for (insn = f; insn; insn = NEXT_INSN (insn))
3148 if (INSN_P (insn))
3150 struct loop *this_loop = uid_loop[INSN_UID (insn)];
3152 if (NONJUMP_INSN_P (insn) || CALL_P (insn))
3154 rtx note = find_reg_note (insn, REG_LABEL, NULL_RTX);
3155 if (note)
3156 invalidate_loops_containing_label (XEXP (note, 0));
3159 if (!JUMP_P (insn))
3160 continue;
3162 mark_loop_jump (PATTERN (insn), this_loop);
3164 /* See if this is an unconditional branch outside the loop. */
3165 if (this_loop
3166 && (GET_CODE (PATTERN (insn)) == RETURN
3167 || (any_uncondjump_p (insn)
3168 && onlyjump_p (insn)
3169 && (uid_loop[INSN_UID (JUMP_LABEL (insn))]
3170 != this_loop)))
3171 && get_max_uid () < max_uid_for_loop)
3173 rtx p;
3174 rtx our_next = next_real_insn (insn);
3175 rtx last_insn_to_move = NEXT_INSN (insn);
3176 struct loop *dest_loop;
3177 struct loop *outer_loop = NULL;
3179 /* Go backwards until we reach the start of the loop, a label,
3180 or a JUMP_INSN. */
3181 for (p = PREV_INSN (insn);
3182 !LABEL_P (p)
3183 && ! (NOTE_P (p)
3184 && NOTE_LINE_NUMBER (p) == NOTE_INSN_LOOP_BEG)
3185 && !JUMP_P (p);
3186 p = PREV_INSN (p))
3189 /* Check for the case where we have a jump to an inner nested
3190 loop, and do not perform the optimization in that case. */
3192 if (JUMP_LABEL (insn))
3194 dest_loop = uid_loop[INSN_UID (JUMP_LABEL (insn))];
3195 if (dest_loop)
3197 for (outer_loop = dest_loop; outer_loop;
3198 outer_loop = outer_loop->outer)
3199 if (outer_loop == this_loop)
3200 break;
3204 /* Make sure that the target of P is within the current loop. */
3206 if (JUMP_P (p) && JUMP_LABEL (p)
3207 && uid_loop[INSN_UID (JUMP_LABEL (p))] != this_loop)
3208 outer_loop = this_loop;
3210 /* If we stopped on a JUMP_INSN to the next insn after INSN,
3211 we have a block of code to try to move.
3213 We look backward and then forward from the target of INSN
3214 to find a BARRIER at the same loop depth as the target.
3215 If we find such a BARRIER, we make a new label for the start
3216 of the block, invert the jump in P and point it to that label,
3217 and move the block of code to the spot we found. */
3219 if (! outer_loop
3220 && JUMP_P (p)
3221 && JUMP_LABEL (p) != 0
3222 /* Just ignore jumps to labels that were never emitted.
3223 These always indicate compilation errors. */
3224 && INSN_UID (JUMP_LABEL (p)) != 0
3225 && any_condjump_p (p) && onlyjump_p (p)
3226 && next_real_insn (JUMP_LABEL (p)) == our_next
3227 /* If it's not safe to move the sequence, then we
3228 mustn't try. */
3229 && insns_safe_to_move_p (p, NEXT_INSN (insn),
3230 &last_insn_to_move))
3232 rtx target
3233 = JUMP_LABEL (insn) ? JUMP_LABEL (insn) : get_last_insn ();
3234 struct loop *target_loop = uid_loop[INSN_UID (target)];
3235 rtx loc, loc2;
3236 rtx tmp;
3238 /* Search for possible garbage past the conditional jumps
3239 and look for the last barrier. */
3240 for (tmp = last_insn_to_move;
3241 tmp && !LABEL_P (tmp); tmp = NEXT_INSN (tmp))
3242 if (BARRIER_P (tmp))
3243 last_insn_to_move = tmp;
3245 for (loc = target; loc; loc = PREV_INSN (loc))
3246 if (BARRIER_P (loc)
3247 /* Don't move things inside a tablejump. */
3248 && ((loc2 = next_nonnote_insn (loc)) == 0
3249 || !LABEL_P (loc2)
3250 || (loc2 = next_nonnote_insn (loc2)) == 0
3251 || !JUMP_P (loc2)
3252 || (GET_CODE (PATTERN (loc2)) != ADDR_VEC
3253 && GET_CODE (PATTERN (loc2)) != ADDR_DIFF_VEC))
3254 && uid_loop[INSN_UID (loc)] == target_loop)
3255 break;
3257 if (loc == 0)
3258 for (loc = target; loc; loc = NEXT_INSN (loc))
3259 if (BARRIER_P (loc)
3260 /* Don't move things inside a tablejump. */
3261 && ((loc2 = next_nonnote_insn (loc)) == 0
3262 || !LABEL_P (loc2)
3263 || (loc2 = next_nonnote_insn (loc2)) == 0
3264 || !JUMP_P (loc2)
3265 || (GET_CODE (PATTERN (loc2)) != ADDR_VEC
3266 && GET_CODE (PATTERN (loc2)) != ADDR_DIFF_VEC))
3267 && uid_loop[INSN_UID (loc)] == target_loop)
3268 break;
3270 if (loc)
3272 rtx cond_label = JUMP_LABEL (p);
3273 rtx new_label = get_label_after (p);
3275 /* Ensure our label doesn't go away. */
3276 LABEL_NUSES (cond_label)++;
3278 /* Verify that uid_loop is large enough and that
3279 we can invert P. */
3280 if (invert_jump (p, new_label, 1))
3282 rtx q, r;
3284 /* If no suitable BARRIER was found, create a suitable
3285 one before TARGET. Since TARGET is a fall through
3286 path, we'll need to insert a jump around our block
3287 and add a BARRIER before TARGET.
3289 This creates an extra unconditional jump outside
3290 the loop. However, the benefits of removing rarely
3291 executed instructions from inside the loop usually
3292 outweigh the cost of the extra unconditional jump
3293 outside the loop. */
3294 if (loc == 0)
3296 rtx temp;
3298 temp = gen_jump (JUMP_LABEL (insn));
3299 temp = emit_jump_insn_before (temp, target);
3300 JUMP_LABEL (temp) = JUMP_LABEL (insn);
3301 LABEL_NUSES (JUMP_LABEL (insn))++;
3302 loc = emit_barrier_before (target);
3305 /* Include the BARRIER after INSN and copy the
3306 block after LOC. */
3307 if (squeeze_notes (&new_label, &last_insn_to_move))
3308 abort ();
3309 reorder_insns (new_label, last_insn_to_move, loc);
3311 /* All those insns are now in TARGET_LOOP. */
3312 for (q = new_label;
3313 q != NEXT_INSN (last_insn_to_move);
3314 q = NEXT_INSN (q))
3315 uid_loop[INSN_UID (q)] = target_loop;
3317 /* The label jumped to by INSN is no longer a loop
3318 exit. Unless INSN does not have a label (e.g.,
3319 it is a RETURN insn), search loop->exit_labels
3320 to find its label_ref, and remove it. Also turn
3321 off LABEL_OUTSIDE_LOOP_P bit. */
3322 if (JUMP_LABEL (insn))
3324 for (q = 0, r = this_loop->exit_labels;
3326 q = r, r = LABEL_NEXTREF (r))
3327 if (XEXP (r, 0) == JUMP_LABEL (insn))
3329 LABEL_OUTSIDE_LOOP_P (r) = 0;
3330 if (q)
3331 LABEL_NEXTREF (q) = LABEL_NEXTREF (r);
3332 else
3333 this_loop->exit_labels = LABEL_NEXTREF (r);
3334 break;
3337 for (loop = this_loop; loop && loop != target_loop;
3338 loop = loop->outer)
3339 loop->exit_count--;
3341 /* If we didn't find it, then something is
3342 wrong. */
3343 gcc_assert (r);
3346 /* P is now a jump outside the loop, so it must be put
3347 in loop->exit_labels, and marked as such.
3348 The easiest way to do this is to just call
3349 mark_loop_jump again for P. */
3350 mark_loop_jump (PATTERN (p), this_loop);
3352 /* If INSN now jumps to the insn after it,
3353 delete INSN. */
3354 if (JUMP_LABEL (insn) != 0
3355 && (next_real_insn (JUMP_LABEL (insn))
3356 == next_real_insn (insn)))
3357 delete_related_insns (insn);
3360 /* Continue the loop after where the conditional
3361 branch used to jump, since the only branch insn
3362 in the block (if it still remains) is an inter-loop
3363 branch and hence needs no processing. */
3364 insn = NEXT_INSN (cond_label);
3366 if (--LABEL_NUSES (cond_label) == 0)
3367 delete_related_insns (cond_label);
3369 /* This loop will be continued with NEXT_INSN (insn). */
3370 insn = PREV_INSN (insn);
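/* Illustrative before/after for the block-moving transformation above
   (assumed shapes, not from the original sources):

       inside the loop:                after the transformation:
           if (cond) goto L1               if (!cond) goto L2
           <rarely executed block>         ...rest of loop...
           goto exit
       L1: ...rest of loop...          after a BARRIER outside the loop:
                                       L2: <rarely executed block>
                                           goto exit

   The conditional jump is inverted to target a new label on the
   relocated block, removing the block and often label L1 from the
   loop body.  */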
3377 /* If any label in X jumps to a loop different from LOOP and any of the
3378 loops it is contained in, mark the target loop invalid.
3380 For speed, we assume that X is part of a pattern of a JUMP_INSN. */
3382 static void
3383 mark_loop_jump (rtx x, struct loop *loop)
3385 struct loop *dest_loop;
3386 struct loop *outer_loop;
3387 int i;
3389 switch (GET_CODE (x))
3391 case PC:
3392 case USE:
3393 case CLOBBER:
3394 case REG:
3395 case MEM:
3396 case CONST_INT:
3397 case CONST_DOUBLE:
3398 case RETURN:
3399 return;
3401 case CONST:
3402 /* There could be a label reference in here. */
3403 mark_loop_jump (XEXP (x, 0), loop);
3404 return;
3406 case PLUS:
3407 case MINUS:
3408 case MULT:
3409 mark_loop_jump (XEXP (x, 0), loop);
3410 mark_loop_jump (XEXP (x, 1), loop);
3411 return;
3413 case LO_SUM:
3414 /* This may refer to a LABEL_REF or SYMBOL_REF. */
3415 mark_loop_jump (XEXP (x, 1), loop);
3416 return;
3418 case SIGN_EXTEND:
3419 case ZERO_EXTEND:
3420 mark_loop_jump (XEXP (x, 0), loop);
3421 return;
3423 case LABEL_REF:
3424 dest_loop = uid_loop[INSN_UID (XEXP (x, 0))];
3426 /* Link together all labels that branch outside the loop. This
3427 is used by final_[bg]iv_value and the loop unrolling code. Also
3428 mark this LABEL_REF so we know that this branch should predict
3429 false. */
3431 /* A check to make sure the label is not in an inner nested loop,
3432 since this does not count as a loop exit. */
3433 if (dest_loop)
3435 for (outer_loop = dest_loop; outer_loop;
3436 outer_loop = outer_loop->outer)
3437 if (outer_loop == loop)
3438 break;
3440 else
3441 outer_loop = NULL;
3443 if (loop && ! outer_loop)
3445 LABEL_OUTSIDE_LOOP_P (x) = 1;
3446 LABEL_NEXTREF (x) = loop->exit_labels;
3447 loop->exit_labels = x;
3449 for (outer_loop = loop;
3450 outer_loop && outer_loop != dest_loop;
3451 outer_loop = outer_loop->outer)
3452 outer_loop->exit_count++;
3455 /* If this is inside a loop, but not in the current loop or one enclosed
3456 by it, it invalidates at least one loop. */
3458 if (! dest_loop)
3459 return;
3461 /* We must invalidate every nested loop containing the target of this
3462 label, except those that also contain the jump insn. */
3464 for (; dest_loop; dest_loop = dest_loop->outer)
3466 /* Stop when we reach a loop that also contains the jump insn. */
3467 for (outer_loop = loop; outer_loop; outer_loop = outer_loop->outer)
3468 if (dest_loop == outer_loop)
3469 return;
3471 /* If we get here, we know we need to invalidate a loop. */
3472 if (loop_dump_stream && ! dest_loop->invalid)
3473 fprintf (loop_dump_stream,
3474 "\nLoop at %d ignored due to multiple entry points.\n",
3475 INSN_UID (dest_loop->start));
3477 dest_loop->invalid = 1;
3479 return;
3481 case SET:
3482 /* If this is not setting pc, ignore. */
3483 if (SET_DEST (x) == pc_rtx)
3484 mark_loop_jump (SET_SRC (x), loop);
3485 return;
3487 case IF_THEN_ELSE:
3488 mark_loop_jump (XEXP (x, 1), loop);
3489 mark_loop_jump (XEXP (x, 2), loop);
3490 return;
3492 case PARALLEL:
3493 case ADDR_VEC:
3494 for (i = 0; i < XVECLEN (x, 0); i++)
3495 mark_loop_jump (XVECEXP (x, 0, i), loop);
3496 return;
3498 case ADDR_DIFF_VEC:
3499 for (i = 0; i < XVECLEN (x, 1); i++)
3500 mark_loop_jump (XVECEXP (x, 1, i), loop);
3501 return;
3503 default:
3504 /* Strictly speaking this is not a jump into the loop, only a possible
3505 jump out of the loop. However, we have no way to link the destination
3506 of this jump onto the list of exit labels. To be safe we mark this
3507 loop and any containing loops as invalid. */
3508 if (loop)
3510 for (outer_loop = loop; outer_loop; outer_loop = outer_loop->outer)
3512 if (loop_dump_stream && ! outer_loop->invalid)
3513 fprintf (loop_dump_stream,
3514 "\nLoop at %d ignored due to unknown exit jump.\n",
3515 INSN_UID (outer_loop->start));
3516 outer_loop->invalid = 1;
3519 return;
3523 /* Return nonzero if there is a label in the range from
3524 insn INSN to and including the insn whose luid is END.
3525 INSN must have an assigned luid (i.e., it must not have
3526 been previously created by loop.c). */
3528 static int
3529 labels_in_range_p (rtx insn, int end)
3531 while (insn && INSN_LUID (insn) <= end)
3533 if (LABEL_P (insn))
3534 return 1;
3535 insn = NEXT_INSN (insn);
3538 return 0;
3541 /* Record that a memory reference X is being set. */
3543 static void
3544 note_addr_stored (rtx x, rtx y ATTRIBUTE_UNUSED,
3545 void *data ATTRIBUTE_UNUSED)
3547 struct loop_info *loop_info = data;
3549 if (x == 0 || !MEM_P (x))
3550 return;
3552 /* Count number of memory writes.
3553 This affects heuristics in strength_reduce. */
3554 loop_info->num_mem_sets++;
3556 /* BLKmode MEM means all memory is clobbered. */
3557 if (GET_MODE (x) == BLKmode)
3559 if (MEM_READONLY_P (x))
3560 loop_info->unknown_constant_address_altered = 1;
3561 else
3562 loop_info->unknown_address_altered = 1;
3564 return;
3567 loop_info->store_mems = gen_rtx_EXPR_LIST (VOIDmode, x,
3568 loop_info->store_mems);
3571 /* X is a value modified by an INSN that references a biv inside a loop
3572 exit test (i.e., X is somehow related to the value of the biv). If X
3573 is a pseudo that is used more than once, then the biv is (effectively)
3574 used more than once. DATA is a pointer to a loop_regs structure. */
3576 static void
3577 note_set_pseudo_multiple_uses (rtx x, rtx y ATTRIBUTE_UNUSED, void *data)
3579 struct loop_regs *regs = (struct loop_regs *) data;
3581 if (x == 0)
3582 return;
3584 while (GET_CODE (x) == STRICT_LOW_PART
3585 || GET_CODE (x) == SIGN_EXTRACT
3586 || GET_CODE (x) == ZERO_EXTRACT
3587 || GET_CODE (x) == SUBREG)
3588 x = XEXP (x, 0);
3590 if (!REG_P (x) || REGNO (x) < FIRST_PSEUDO_REGISTER)
3591 return;
3593 /* If we do not have usage information, or if we know the register
3594 is used more than once, note that fact for check_dbra_loop. */
3595 if (REGNO (x) >= max_reg_before_loop
3596 || ! regs->array[REGNO (x)].single_usage
3597 || regs->array[REGNO (x)].single_usage == const0_rtx)
3598 regs->multiple_uses = 1;
3601 /* Return nonzero if the rtx X is invariant over the current loop.
3603 The value is 2 if we refer to something only conditionally invariant.
3605 A memory ref is invariant if it is not volatile and does not conflict
3606 with anything stored in `loop_info->store_mems'. */
3608 static int
3609 loop_invariant_p (const struct loop *loop, rtx x)
3611 struct loop_info *loop_info = LOOP_INFO (loop);
3612 struct loop_regs *regs = LOOP_REGS (loop);
3613 int i;
3614 enum rtx_code code;
3615 const char *fmt;
3616 int conditional = 0;
3617 rtx mem_list_entry;
3619 if (x == 0)
3620 return 1;
3621 code = GET_CODE (x);
3622 switch (code)
3624 case CONST_INT:
3625 case CONST_DOUBLE:
3626 case SYMBOL_REF:
3627 case CONST:
3628 return 1;
3630 case LABEL_REF:
3631 return 1;
3633 case PC:
3634 case CC0:
3635 case UNSPEC_VOLATILE:
3636 return 0;
3638 case REG:
3639 if ((x == frame_pointer_rtx || x == hard_frame_pointer_rtx
3640 || x == arg_pointer_rtx || x == pic_offset_table_rtx)
3641 && ! current_function_has_nonlocal_goto)
3642 return 1;
3644 if (LOOP_INFO (loop)->has_call
3645 && REGNO (x) < FIRST_PSEUDO_REGISTER && call_used_regs[REGNO (x)])
3646 return 0;
3648 /* Out-of-range regs can occur when we are called from unrolling.
3649 These registers created by the unroller are set in the loop,
3650 hence are never invariant.
3651 Other out-of-range regs can be generated by load_mems; those that
3652 are written to in the loop are not invariant, while those that are
3653 not written to are invariant. It would be easy for load_mems
3654 to set n_times_set correctly for these registers; however, there
3655 is no easy way to distinguish them from registers created by the
3656 unroller. */
3658 if (REGNO (x) >= (unsigned) regs->num)
3659 return 0;
3661 if (regs->array[REGNO (x)].set_in_loop < 0)
3662 return 2;
3664 return regs->array[REGNO (x)].set_in_loop == 0;
3666 case MEM:
3667 /* Volatile memory references must be rejected. Do this before
3668 checking for read-only items, so that volatile read-only items
3669 will be rejected also. */
3670 if (MEM_VOLATILE_P (x))
3671 return 0;
3673 /* See if there is any dependence between a store and this load. */
3674 mem_list_entry = loop_info->store_mems;
3675 while (mem_list_entry)
3677 if (true_dependence (XEXP (mem_list_entry, 0), VOIDmode,
3678 x, rtx_varies_p))
3679 return 0;
3681 mem_list_entry = XEXP (mem_list_entry, 1);
3684 /* It's not invalidated by a store in memory
3685 but we must still verify the address is invariant. */
3686 break;
3688 case ASM_OPERANDS:
3689 /* Don't mess with insns declared volatile. */
3690 if (MEM_VOLATILE_P (x))
3691 return 0;
3692 break;
3694 default:
3695 break;
3698 fmt = GET_RTX_FORMAT (code);
3699 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
3701 if (fmt[i] == 'e')
3703 int tem = loop_invariant_p (loop, XEXP (x, i));
3704 if (tem == 0)
3705 return 0;
3706 if (tem == 2)
3707 conditional = 1;
3709 else if (fmt[i] == 'E')
3711 int j;
3712 for (j = 0; j < XVECLEN (x, i); j++)
3714 int tem = loop_invariant_p (loop, XVECEXP (x, i, j));
3715 if (tem == 0)
3716 return 0;
3717 if (tem == 2)
3718 conditional = 1;
3724 return 1 + conditional;
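/* Illustrative example (not from the original source): for a loop like

     x = 10;
     for (i = 0; i < n; i++)
       a[i] = x * 2;

   the rtx for `x * 2' is invariant, since `x' is never set within the
   loop, so loop_invariant_p returns 1.  It returns 2 when the value
   depends on a register whose set_in_loop count is negative, i.e. one
   that is only conditionally invariant.  */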
3727 /* Return nonzero if all the insns in the loop that set REG
3728 are INSN and the immediately following insns,
3729 and if each of those insns sets REG in an invariant way
3730 (not counting uses of REG in them).
3732 The value is 2 if some of these insns are only conditionally invariant.
3734 We assume that INSN itself is the first set of REG
3735 and that its source is invariant. */
3737 static int
3738 consec_sets_invariant_p (const struct loop *loop, rtx reg, int n_sets,
3739 rtx insn)
3741 struct loop_regs *regs = LOOP_REGS (loop);
3742 rtx p = insn;
3743 unsigned int regno = REGNO (reg);
3744 rtx temp;
3745 /* Number of sets we have to insist on finding after INSN. */
3746 int count = n_sets - 1;
3747 int old = regs->array[regno].set_in_loop;
3748 int value = 0;
3749 int this;
3751 /* If N_SETS hit the limit, we can't rely on its value. */
3752 if (n_sets == 127)
3753 return 0;
3755 regs->array[regno].set_in_loop = 0;
3757 while (count > 0)
3759 enum rtx_code code;
3760 rtx set;
3762 p = NEXT_INSN (p);
3763 code = GET_CODE (p);
3765 /* If library call, skip to end of it. */
3766 if (code == INSN && (temp = find_reg_note (p, REG_LIBCALL, NULL_RTX)))
3767 p = XEXP (temp, 0);
3769 this = 0;
3770 if (code == INSN
3771 && (set = single_set (p))
3772 && REG_P (SET_DEST (set))
3773 && REGNO (SET_DEST (set)) == regno)
3775 this = loop_invariant_p (loop, SET_SRC (set));
3776 if (this != 0)
3777 value |= this;
3778 else if ((temp = find_reg_note (p, REG_EQUAL, NULL_RTX)))
3780 /* If this is a libcall, then any invariant REG_EQUAL note is OK.
3781 If this is an ordinary insn, then only CONSTANT_P REG_EQUAL
3782 notes are OK. */
3783 this = (CONSTANT_P (XEXP (temp, 0))
3784 || (find_reg_note (p, REG_RETVAL, NULL_RTX)
3785 && loop_invariant_p (loop, XEXP (temp, 0))));
3786 if (this != 0)
3787 value |= this;
3790 if (this != 0)
3791 count--;
3792 else if (code != NOTE)
3794 regs->array[regno].set_in_loop = old;
3795 return 0;
3799 regs->array[regno].set_in_loop = old;
3800 /* If loop_invariant_p ever returned 2, we return 2. */
3801 return 1 + (value & 2);
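/* Illustrative example (not from the original source): a register
   initialized by a short group of consecutive insns, e.g.

     (set (reg 100) (symbol_ref "table"))
     (set (reg 100) (plus (reg 100) (const_int 16)))

   where every source is invariant (uses of the register itself do not
   count, since its set_in_loop count is temporarily zeroed), satisfies
   consec_sets_invariant_p, so the whole group is movable together.  */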
3804 /* Look at all uses (not sets) of registers in X. For each, if it is
3805 the single use, set USAGE[REGNO] to INSN; if there was a previous use in
3806 a different insn, set USAGE[REGNO] to const0_rtx. */
3808 static void
3809 find_single_use_in_loop (struct loop_regs *regs, rtx insn, rtx x)
3811 enum rtx_code code = GET_CODE (x);
3812 const char *fmt = GET_RTX_FORMAT (code);
3813 int i, j;
3815 if (code == REG)
3816 regs->array[REGNO (x)].single_usage
3817 = (regs->array[REGNO (x)].single_usage != 0
3818 && regs->array[REGNO (x)].single_usage != insn)
3819 ? const0_rtx : insn;
3821 else if (code == SET)
3823 /* Don't count SET_DEST if it is a REG; otherwise count things
3824 in SET_DEST because if a register is partially modified, it won't
3825 show up as a potential movable so we don't care how USAGE is set
3826 for it. */
3827 if (!REG_P (SET_DEST (x)))
3828 find_single_use_in_loop (regs, insn, SET_DEST (x));
3829 find_single_use_in_loop (regs, insn, SET_SRC (x));
3831 else
3832 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
3834 if (fmt[i] == 'e' && XEXP (x, i) != 0)
3835 find_single_use_in_loop (regs, insn, XEXP (x, i));
3836 else if (fmt[i] == 'E')
3837 for (j = XVECLEN (x, i) - 1; j >= 0; j--)
3838 find_single_use_in_loop (regs, insn, XVECEXP (x, i, j));
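/* Illustrative note (not from the original source): after the scan,
   regs->array[R].single_usage is the unique insn that uses pseudo R,
   const0_rtx if R is used by two or more insns, or 0 if no use of R
   was seen.  note_set_pseudo_multiple_uses above relies on this
   distinction.  */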
3842 /* Count and record any set in X which is contained in INSN. Update
3843 REGS->array[I].MAY_NOT_OPTIMIZE and LAST_SET for any register I set
3844 in X. */
3846 static void
3847 count_one_set (struct loop_regs *regs, rtx insn, rtx x, rtx *last_set)
3849 if (GET_CODE (x) == CLOBBER && REG_P (XEXP (x, 0)))
3850 /* Don't move a reg that has an explicit clobber.
3851 It's not worth the pain to try to do it correctly. */
3852 regs->array[REGNO (XEXP (x, 0))].may_not_optimize = 1;
3854 if (GET_CODE (x) == SET || GET_CODE (x) == CLOBBER)
3856 rtx dest = SET_DEST (x);
3857 while (GET_CODE (dest) == SUBREG
3858 || GET_CODE (dest) == ZERO_EXTRACT
3859 || GET_CODE (dest) == STRICT_LOW_PART)
3860 dest = XEXP (dest, 0);
3861 if (REG_P (dest))
3863 int i;
3864 int regno = REGNO (dest);
3865 for (i = 0; i < LOOP_REGNO_NREGS (regno, dest); i++)
3867 /* If this is the first setting of this reg
3868 in current basic block, and it was set before,
3869 it must be set in two basic blocks, so it cannot
3870 be moved out of the loop. */
3871 if (regs->array[regno].set_in_loop > 0
3872 && last_set[regno] == 0)
3873 regs->array[regno+i].may_not_optimize = 1;
3874 /* If this is not first setting in current basic block,
3875 see if reg was used in between previous one and this.
3876 If so, neither one can be moved. */
3877 if (last_set[regno] != 0
3878 && reg_used_between_p (dest, last_set[regno], insn))
3879 regs->array[regno+i].may_not_optimize = 1;
3880 if (regs->array[regno+i].set_in_loop < 127)
3881 ++regs->array[regno+i].set_in_loop;
3882 last_set[regno+i] = insn;
3888 /* Given a loop that is bounded by LOOP->START and LOOP->END and that
3889 is entered at LOOP->SCAN_START, return 1 if the register set in SET
3890 contained in insn INSN is used by any insn that precedes INSN in
3891 cyclic order starting from the loop entry point.
3893 We don't want to use INSN_LUID here because if we restrict INSN to those
3894 that have a valid INSN_LUID, it means we cannot move an invariant out
3895 from an inner loop past two loops. */
3897 static int
3898 loop_reg_used_before_p (const struct loop *loop, rtx set, rtx insn)
3900 rtx reg = SET_DEST (set);
3901 rtx p;
3903 /* Scan forward checking for register usage. If we hit INSN, we
3904 are done. Otherwise, if we hit LOOP->END, wrap around to LOOP->START. */
3905 for (p = loop->scan_start; p != insn; p = NEXT_INSN (p))
3907 if (INSN_P (p) && reg_overlap_mentioned_p (reg, PATTERN (p)))
3908 return 1;
3910 if (p == loop->end)
3911 p = loop->start;
3914 return 0;
3918 /* Information we collect about arrays that we might want to prefetch. */
3919 struct prefetch_info
3921 struct iv_class *class; /* Class this prefetch is based on. */
3922 struct induction *giv; /* GIV this prefetch is based on. */
3923 rtx base_address; /* Start prefetching from this address plus
3924 index. */
3925 HOST_WIDE_INT index;
3926 HOST_WIDE_INT stride; /* Prefetch stride in bytes in each
3927 iteration. */
3928 unsigned int bytes_accessed; /* Sum of sizes of all accesses to this
3929 prefetch area in one iteration. */
3930 unsigned int total_bytes; /* Total bytes loop will access in this block.
3931 This is set only for loops with known
3932 iteration counts and is 0xffffffff
3933 otherwise. */
3934 int prefetch_in_loop; /* Number of prefetch insns in loop. */
3935 int prefetch_before_loop; /* Number of prefetch insns before loop. */
3936 unsigned int write : 1; /* 1 for read/write prefetches. */
3939 /* Data used by check_store function. */
3940 struct check_store_data
3942 rtx mem_address;
3943 int mem_write;
3946 static void check_store (rtx, rtx, void *);
3947 static void emit_prefetch_instructions (struct loop *);
3948 static int rtx_equal_for_prefetch_p (rtx, rtx);
3950 /* Set mem_write when mem_address is found. Used as callback to
3951 note_stores. */
3952 static void
3953 check_store (rtx x, rtx pat ATTRIBUTE_UNUSED, void *data)
3955 struct check_store_data *d = (struct check_store_data *) data;
3957 if ((MEM_P (x)) && rtx_equal_p (d->mem_address, XEXP (x, 0)))
3958 d->mem_write = 1;
3961 /* Like rtx_equal_p, but attempts to swap commutative operands. This is
3962 important to get some addresses combined. Later more sophisticated
3963 transformations can be added when necessary.
3965 ??? The same trick of swapping operands is done at several other places.
3966 It would be nice to develop some common way to handle this. */
3968 static int
3969 rtx_equal_for_prefetch_p (rtx x, rtx y)
3971 int i;
3972 int j;
3973 enum rtx_code code = GET_CODE (x);
3974 const char *fmt;
3976 if (x == y)
3977 return 1;
3978 if (code != GET_CODE (y))
3979 return 0;
3981 if (COMMUTATIVE_ARITH_P (x))
3983 return ((rtx_equal_for_prefetch_p (XEXP (x, 0), XEXP (y, 0))
3984 && rtx_equal_for_prefetch_p (XEXP (x, 1), XEXP (y, 1)))
3985 || (rtx_equal_for_prefetch_p (XEXP (x, 0), XEXP (y, 1))
3986 && rtx_equal_for_prefetch_p (XEXP (x, 1), XEXP (y, 0))));
3989 /* Compare the elements. If any pair of corresponding elements fails to
3990 match, return 0 for the whole thing. */
3992 fmt = GET_RTX_FORMAT (code);
3993 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
3995 switch (fmt[i])
3997 case 'w':
3998 if (XWINT (x, i) != XWINT (y, i))
3999 return 0;
4000 break;
4002 case 'i':
4003 if (XINT (x, i) != XINT (y, i))
4004 return 0;
4005 break;
4007 case 'E':
4008 /* Two vectors must have the same length. */
4009 if (XVECLEN (x, i) != XVECLEN (y, i))
4010 return 0;
4012 /* And the corresponding elements must match. */
4013 for (j = 0; j < XVECLEN (x, i); j++)
4014 if (rtx_equal_for_prefetch_p (XVECEXP (x, i, j),
4015 XVECEXP (y, i, j)) == 0)
4016 return 0;
4017 break;
4019 case 'e':
4020 if (rtx_equal_for_prefetch_p (XEXP (x, i), XEXP (y, i)) == 0)
4021 return 0;
4022 break;
4024 case 's':
4025 if (strcmp (XSTR (x, i), XSTR (y, i)))
4026 return 0;
4027 break;
4029 case 'u':
4030 /* These are just backpointers, so they don't matter. */
4031 break;
4033 case '0':
4034 break;
4036 /* It is believed that rtx's at this level will never
4037 contain anything but integers and other rtx's,
4038 except for within LABEL_REFs and SYMBOL_REFs. */
4039 default:
4040 gcc_unreachable ();
4043 return 1;
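/* Illustrative example (not from the original source): because PLUS is
   commutative, the addresses

     (plus (reg 100) (reg 101))  and  (plus (reg 101) (reg 100))

   compare equal here, although plain rtx_equal_p would distinguish
   them; this lets the corresponding prefetches be combined.  */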
4046 /* Remove constant addition value from the expression X (when present)
4047 and return it. */
4049 static HOST_WIDE_INT
4050 remove_constant_addition (rtx *x)
4052 HOST_WIDE_INT addval = 0;
4053 rtx exp = *x;
4055 /* Avoid clobbering a shared CONST expression. */
4056 if (GET_CODE (exp) == CONST)
4058 if (GET_CODE (XEXP (exp, 0)) == PLUS
4059 && GET_CODE (XEXP (XEXP (exp, 0), 0)) == SYMBOL_REF
4060 && GET_CODE (XEXP (XEXP (exp, 0), 1)) == CONST_INT)
4062 *x = XEXP (XEXP (exp, 0), 0);
4063 return INTVAL (XEXP (XEXP (exp, 0), 1));
4065 return 0;
4068 if (GET_CODE (exp) == CONST_INT)
4070 addval = INTVAL (exp);
4071 *x = const0_rtx;
4074 /* For a PLUS expression, recurse on both operands. */
4075 else if (GET_CODE (exp) == PLUS)
4077 addval += remove_constant_addition (&XEXP (exp, 0));
4078 addval += remove_constant_addition (&XEXP (exp, 1));
4080 /* If recursion reduced an operand to zero, remove the
4081 redundant zero from the expression. */
4082 if (XEXP (exp, 0) == const0_rtx)
4083 *x = XEXP (exp, 1);
4084 else if (XEXP (exp, 1) == const0_rtx)
4085 *x = XEXP (exp, 0);
4088 return addval;
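/* Illustrative example (not from the original source): given
   *X == (plus (reg 100) (const_int 8)), the function returns 8 and
   rewrites *X to (reg 100).  Given the shared expression
   (const (plus (symbol_ref "a") (const_int 4))), it returns 4 and
   points *X at the SYMBOL_REF without modifying the CONST itself.  */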
4091 /* Attempt to identify accesses to arrays that are most likely to cause cache
4092 misses, and emit prefetch instructions a few prefetch blocks forward.
4094 To detect the arrays we use the GIV information that was collected by the
4095 strength reduction pass.
4097 The prefetch instructions are generated after the GIV information is done
4098 and before the strength reduction process. The new GIVs are injected into
4099 the strength reduction tables, so the prefetch addresses are optimized as
4100 well.
4102 GIVs are split into base address, stride, and constant addition values.
4103 GIVs with the same address, stride and close addition values are combined
4104 into a single prefetch. Also writes to GIVs are detected, so that prefetch
4105 for write instructions can be used for the block we write to, on machines
4106 that support write prefetches.
4108 Several heuristics are used to determine when to prefetch. They are
4109 controlled by defined symbols that can be overridden for each target. */
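/* Illustrative example (not from the original source): in a loop like

     for (i = 0; i < n; i++)
       sum += p[4 * i + 3];

   the address giv decomposes into base address `p', a stride of
   4 * sizeof (*p) bytes per iteration, and a small constant addition;
   givs that differ only in the constant part are merged into a single
   prefetch stream below.  */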
4111 static void
4112 emit_prefetch_instructions (struct loop *loop)
4114 int num_prefetches = 0;
4115 int num_real_prefetches = 0;
4116 int num_real_write_prefetches = 0;
4117 int num_prefetches_before = 0;
4118 int num_write_prefetches_before = 0;
4119 int ahead = 0;
4120 int i;
4121 struct iv_class *bl;
4122 struct induction *iv;
4123 struct prefetch_info info[MAX_PREFETCHES];
4124 struct loop_ivs *ivs = LOOP_IVS (loop);
4126 if (!HAVE_prefetch || PREFETCH_BLOCK == 0)
4127 return;
4129 /* Consider only loops without calls. When a call is executed, the loop
4130 is probably slow enough that the memory latency is hidden anyway. */
4131 if (PREFETCH_NO_CALL && LOOP_INFO (loop)->has_call)
4133 if (loop_dump_stream)
4134 fprintf (loop_dump_stream, "Prefetch: ignoring loop: has call.\n");
4136 return;
4139 /* Don't prefetch in loops known to have few iterations. */
4140 if (PREFETCH_NO_LOW_LOOPCNT
4141 && LOOP_INFO (loop)->n_iterations
4142 && LOOP_INFO (loop)->n_iterations <= PREFETCH_LOW_LOOPCNT)
4144 if (loop_dump_stream)
4145 fprintf (loop_dump_stream,
4146 "Prefetch: ignoring loop: not enough iterations.\n");
4147 return;
4150 /* Search all induction variables and pick those interesting for the prefetch
4151 machinery. */
4152 for (bl = ivs->list; bl; bl = bl->next)
4154 struct induction *biv = bl->biv, *biv1;
4155 int basestride = 0;
4157 biv1 = biv;
4159 /* Expect all BIVs to be executed in each iteration. This makes our
4160 analysis more conservative. */
4161 while (biv1)
4163 /* Discard non-constant additions that we can't handle well yet, and
4164 BIVs that are executed multiple times; such BIVs ought to be
4165 handled in the nested loop. We accept not_every_iteration BIVs,
4166 since these only result in larger strides and make our
4167 heuristics more conservative. */
4168 if (GET_CODE (biv1->add_val) != CONST_INT)
4170 if (loop_dump_stream)
4172 fprintf (loop_dump_stream,
4173 "Prefetch: ignoring biv %d: non-constant addition at insn %d:",
4174 REGNO (biv1->src_reg), INSN_UID (biv1->insn));
4175 print_rtl (loop_dump_stream, biv1->add_val);
4176 fprintf (loop_dump_stream, "\n");
4178 break;
4181 if (biv1->maybe_multiple)
4183 if (loop_dump_stream)
4185 fprintf (loop_dump_stream,
4186 "Prefetch: ignoring biv %d: maybe_multiple at insn %i:",
4187 REGNO (biv1->src_reg), INSN_UID (biv1->insn));
4188 print_rtl (loop_dump_stream, biv1->add_val);
4189 fprintf (loop_dump_stream, "\n");
4191 break;
4194 basestride += INTVAL (biv1->add_val);
4195 biv1 = biv1->next_iv;
4198 if (biv1 || !basestride)
4199 continue;
4201 for (iv = bl->giv; iv; iv = iv->next_iv)
4203 rtx address;
4204 rtx temp;
4205 HOST_WIDE_INT index = 0;
4206 int add = 1;
4207 HOST_WIDE_INT stride = 0;
4208 int stride_sign = 1;
4209 struct check_store_data d;
4210 const char *ignore_reason = NULL;
4211 int size = GET_MODE_SIZE (GET_MODE (iv));
4213 /* See whether an induction variable is interesting to us and if
4214 not, report the reason. */
4215 if (iv->giv_type != DEST_ADDR)
4216 ignore_reason = "giv is not a destination address";
4218 /* We are interested only in constant stride memory references
4219 in order to be able to compute density easily. */
4220 else if (GET_CODE (iv->mult_val) != CONST_INT)
4221 ignore_reason = "stride is not constant";
4223 else
4225 stride = INTVAL (iv->mult_val) * basestride;
4226 if (stride < 0)
4228 stride = -stride;
4229 stride_sign = -1;
4232 /* On some targets, reversed order prefetches are not
4233 worthwhile. */
4234 if (PREFETCH_NO_REVERSE_ORDER && stride_sign < 0)
4235 ignore_reason = "reversed order stride";
4237 /* Prefetch of accesses with an extreme stride might not be
4238 worthwhile, either. */
4239 else if (PREFETCH_NO_EXTREME_STRIDE
4240 && stride > PREFETCH_EXTREME_STRIDE)
4241 ignore_reason = "extreme stride";
4243 /* Ignore GIVs with varying add values; we can't predict the
4244 value for the next iteration. */
4245 else if (!loop_invariant_p (loop, iv->add_val))
4246 ignore_reason = "giv has varying add value";
4248 /* Ignore GIVs in the nested loops; they ought to have been
4249 handled already. */
4250 else if (iv->maybe_multiple)
4251 ignore_reason = "giv is in nested loop";
4254 if (ignore_reason != NULL)
4256 if (loop_dump_stream)
4257 fprintf (loop_dump_stream,
4258 "Prefetch: ignoring giv at %d: %s.\n",
4259 INSN_UID (iv->insn), ignore_reason);
4260 continue;
4263 /* Determine the pointer to the basic array we are examining. It is
4264 the sum of the BIV's initial value and the GIV's add_val. */
4265 address = copy_rtx (iv->add_val);
4266 temp = copy_rtx (bl->initial_value);
4268 address = simplify_gen_binary (PLUS, Pmode, temp, address);
4269 index = remove_constant_addition (&address);
4271 d.mem_write = 0;
4272 d.mem_address = *iv->location;
4274 /* When the GIV is not always executed, we might be better off by
4275 not dirtying the cache pages. */
4276 if (PREFETCH_CONDITIONAL || iv->always_executed)
4277 note_stores (PATTERN (iv->insn), check_store, &d);
4278 else
4280 if (loop_dump_stream)
4281 fprintf (loop_dump_stream, "Prefetch: Ignoring giv at %d: %s\n",
4282 INSN_UID (iv->insn), "in conditional code.");
4283 continue;
4286 /* Attempt to find another prefetch to the same array and see if we
4287 can merge this one. */
4288 for (i = 0; i < num_prefetches; i++)
4289 if (rtx_equal_for_prefetch_p (address, info[i].base_address)
4290 && stride == info[i].stride)
4292 /* If both access the same array (the same location with only a
4293 small difference in constant indexes), merge the prefetches.
4294 Just issue the later one; the earlier one will be covered by the
4295 prefetch done on a previous iteration.
4296 The artificial threshold should not be too small,
4297 but also not bigger than the small portion of memory usually
4298 traversed by a single loop. */
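/* Illustrative example (not from the original source): accesses such
   as a[i] and a[i + 2] share a base address and stride, so prefetching
   only the one with the larger constant index is enough; the other
   falls within cache lines already prefetched.  */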
4299 if (index >= info[i].index
4300 && index - info[i].index < PREFETCH_EXTREME_DIFFERENCE)
4302 info[i].write |= d.mem_write;
4303 info[i].bytes_accessed += size;
4304 info[i].index = index;
4305 info[i].giv = iv;
4306 info[i].class = bl;
4307 info[i].base_address = address;
4308 add = 0;
4309 break;
4312 if (index < info[i].index
4313 && info[i].index - index < PREFETCH_EXTREME_DIFFERENCE)
4315 info[i].write |= d.mem_write;
4316 info[i].bytes_accessed += size;
4317 add = 0;
4318 break;
4322 /* Merging failed. */
4323 if (add)
4325 info[num_prefetches].giv = iv;
4326 info[num_prefetches].class = bl;
4327 info[num_prefetches].index = index;
4328 info[num_prefetches].stride = stride;
4329 info[num_prefetches].base_address = address;
4330 info[num_prefetches].write = d.mem_write;
4331 info[num_prefetches].bytes_accessed = size;
4332 num_prefetches++;
4333 if (num_prefetches >= MAX_PREFETCHES)
4335 if (loop_dump_stream)
4336 fprintf (loop_dump_stream,
4337 "Maximal number of prefetches exceeded.\n");
4338 return;
4344 for (i = 0; i < num_prefetches; i++)
4346 int density;
4348 /* Attempt to calculate the total number of bytes fetched by all
4349 iterations of the loop. Avoid overflow. */
4350 if (LOOP_INFO (loop)->n_iterations
4351 && ((unsigned HOST_WIDE_INT) (0xffffffff / info[i].stride)
4352 >= LOOP_INFO (loop)->n_iterations))
4353 info[i].total_bytes = info[i].stride * LOOP_INFO (loop)->n_iterations;
4354 else
4355 info[i].total_bytes = 0xffffffff;
4357 density = info[i].bytes_accessed * 100 / info[i].stride;
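/* Illustrative example (not from the original source): an iteration
   that accesses 4 bytes while advancing by a 16-byte stride has
   density 4 * 100 / 16 == 25 (percent).  */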
4359 /* Prefetch might be worthwhile only when the loads/stores are dense. */
4360 if (PREFETCH_ONLY_DENSE_MEM)
4361 if (density * 256 > PREFETCH_DENSE_MEM * 100
4362 && (info[i].total_bytes / PREFETCH_BLOCK
4363 >= PREFETCH_BLOCKS_BEFORE_LOOP_MIN))
4365 info[i].prefetch_before_loop = 1;
4366 info[i].prefetch_in_loop
4367 = (info[i].total_bytes / PREFETCH_BLOCK
4368 > PREFETCH_BLOCKS_BEFORE_LOOP_MAX);
4370 else
4372 info[i].prefetch_in_loop = 0, info[i].prefetch_before_loop = 0;
4373 if (loop_dump_stream)
4374 fprintf (loop_dump_stream,
4375 "Prefetch: ignoring giv at %d: %d%% density is too low.\n",
4376 INSN_UID (info[i].giv->insn), density);
4378 else
4379 info[i].prefetch_in_loop = 1, info[i].prefetch_before_loop = 1;
4381 /* Find how many prefetch instructions we'll use within the loop. */
4382 if (info[i].prefetch_in_loop != 0)
4384 info[i].prefetch_in_loop = ((info[i].stride + PREFETCH_BLOCK - 1)
4385 / PREFETCH_BLOCK);
4386 num_real_prefetches += info[i].prefetch_in_loop;
4387 if (info[i].write)
4388 num_real_write_prefetches += info[i].prefetch_in_loop;
4392 /* Determine how many iterations ahead to prefetch within the loop, based
4393 on how many prefetches we currently expect to do within the loop. */
4394 if (num_real_prefetches != 0)
4396 if ((ahead = SIMULTANEOUS_PREFETCHES / num_real_prefetches) == 0)
4398 if (loop_dump_stream)
4399 fprintf (loop_dump_stream,
4400 "Prefetch: ignoring prefetches within loop: ahead is zero; %d < %d\n",
4401 SIMULTANEOUS_PREFETCHES, num_real_prefetches);
4402 num_real_prefetches = 0, num_real_write_prefetches = 0;
4405 /* We'll also use AHEAD to determine how many prefetch instructions to
4406 emit before a loop, so don't leave it zero. */
4407 if (ahead == 0)
4408 ahead = PREFETCH_BLOCKS_BEFORE_LOOP_MAX;
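/* Illustrative example (not from the original source): with
   SIMULTANEOUS_PREFETCHES == 3 and two prefetch insns per iteration,
   AHEAD is 3 / 2 == 1, i.e. data is prefetched one iteration in
   advance.  */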
4410 for (i = 0; i < num_prefetches; i++)
4412 /* Update if we've decided not to prefetch anything within the loop. */
4413 if (num_real_prefetches == 0)
4414 info[i].prefetch_in_loop = 0;
4416 /* Find how many prefetch instructions we'll use before the loop. */
4417 if (info[i].prefetch_before_loop != 0)
4419 int n = info[i].total_bytes / PREFETCH_BLOCK;
4420 if (n > ahead)
4421 n = ahead;
4422 info[i].prefetch_before_loop = n;
4423 num_prefetches_before += n;
4424 if (info[i].write)
4425 num_write_prefetches_before += n;
4428 if (loop_dump_stream)
4430 if (info[i].prefetch_in_loop == 0
4431 && info[i].prefetch_before_loop == 0)
4432 continue;
4433 fprintf (loop_dump_stream, "Prefetch insn: %d",
4434 INSN_UID (info[i].giv->insn));
4435 fprintf (loop_dump_stream,
4436 "; in loop: %d; before: %d; %s\n",
4437 info[i].prefetch_in_loop,
4438 info[i].prefetch_before_loop,
4439 info[i].write ? "read/write" : "read only");
4440 fprintf (loop_dump_stream,
4441 " density: %d%%; bytes_accessed: %u; total_bytes: %u\n",
4442 (int) (info[i].bytes_accessed * 100 / info[i].stride),
4443 info[i].bytes_accessed, info[i].total_bytes);
4444 fprintf (loop_dump_stream, " index: " HOST_WIDE_INT_PRINT_DEC
4445 "; stride: " HOST_WIDE_INT_PRINT_DEC "; address: ",
4446 info[i].index, info[i].stride);
4447 print_rtl (loop_dump_stream, info[i].base_address);
4448 fprintf (loop_dump_stream, "\n");
4452 if (num_real_prefetches + num_prefetches_before > 0)
4454 /* Record that this loop uses prefetch instructions. */
4455 LOOP_INFO (loop)->has_prefetch = 1;
4457 if (loop_dump_stream)
4459 fprintf (loop_dump_stream, "Real prefetches needed within loop: %d (write: %d)\n",
4460 num_real_prefetches, num_real_write_prefetches);
4461 fprintf (loop_dump_stream, "Real prefetches needed before loop: %d (write: %d)\n",
4462 num_prefetches_before, num_write_prefetches_before);
4466 for (i = 0; i < num_prefetches; i++)
4468 int y;
4470 for (y = 0; y < info[i].prefetch_in_loop; y++)
4472 rtx loc = copy_rtx (*info[i].giv->location);
4473 rtx insn;
4474 int bytes_ahead = PREFETCH_BLOCK * (ahead + y);
4475 rtx before_insn = info[i].giv->insn;
4476 rtx prev_insn = PREV_INSN (info[i].giv->insn);
4477 rtx seq;
4479 /* We can save some effort by offsetting the address on
4480 architectures with offsettable memory references. */
4481 if (offsettable_address_p (0, VOIDmode, loc))
4482 loc = plus_constant (loc, bytes_ahead);
4483 else
4485 rtx reg = gen_reg_rtx (Pmode);
4486 loop_iv_add_mult_emit_before (loop, loc, const1_rtx,
4487 GEN_INT (bytes_ahead), reg,
4488 0, before_insn);
4489 loc = reg;
4492 start_sequence ();
4493 /* Make sure the address operand is valid for prefetch. */
4494 if (! (*insn_data[(int)CODE_FOR_prefetch].operand[0].predicate)
4495 (loc, insn_data[(int)CODE_FOR_prefetch].operand[0].mode))
4496 loc = force_reg (Pmode, loc);
4497 emit_insn (gen_prefetch (loc, GEN_INT (info[i].write),
4498 GEN_INT (3)));
4499 seq = get_insns ();
4500 end_sequence ();
4501 emit_insn_before (seq, before_insn);
4503 /* Check all insns emitted and record the new GIV
4504 information. */
4505 insn = NEXT_INSN (prev_insn);
4506 while (insn != before_insn)
4508 insn = check_insn_for_givs (loop, insn,
4509 info[i].giv->always_executed,
4510 info[i].giv->maybe_multiple);
4511 insn = NEXT_INSN (insn);
4515 if (PREFETCH_BEFORE_LOOP)
4517 /* Emit insns before the loop to fetch the first cache lines or,
4518 if we're not prefetching within the loop, everything we expect
4519 to need. */
4520 for (y = 0; y < info[i].prefetch_before_loop; y++)
4522 rtx reg = gen_reg_rtx (Pmode);
4523 rtx loop_start = loop->start;
4524 rtx init_val = info[i].class->initial_value;
4525 rtx add_val = simplify_gen_binary (PLUS, Pmode,
4526 info[i].giv->add_val,
4527 GEN_INT (y * PREFETCH_BLOCK));
4529 /* Functions called by loop_iv_add_mult_emit_before expect a
4530 non-constant INIT_VAL to have the same mode as REG, which
4531 in this case we know to be Pmode. */
4532 if (GET_MODE (init_val) != Pmode && !CONSTANT_P (init_val))
4534 rtx seq;
4536 start_sequence ();
4537 init_val = convert_to_mode (Pmode, init_val, 0);
4538 seq = get_insns ();
4539 end_sequence ();
4540 loop_insn_emit_before (loop, 0, loop_start, seq);
4542 loop_iv_add_mult_emit_before (loop, init_val,
4543 info[i].giv->mult_val,
4544 add_val, reg, 0, loop_start);
4545 emit_insn_before (gen_prefetch (reg, GEN_INT (info[i].write),
4546 GEN_INT (3)),
4547 loop_start);
4552 return;
4555 /* Communication with routines called via `note_stores'. */
4557 static rtx note_insn;
4559 /* Dummy register to have nonzero DEST_REG for DEST_ADDR type givs. */
4561 static rtx addr_placeholder;
4563 /* ??? Unfinished optimizations, and possible future optimizations,
4564 for the strength reduction code. */
4566 /* ??? The interaction of biv elimination, and recognition of 'constant'
4567 bivs, may cause problems. */
4569 /* ??? Add heuristics so that DEST_ADDR strength reduction does not cause
4570 performance problems.
4572 Perhaps don't eliminate things that can be combined with an addressing
4573 mode. Find all givs that have the same biv, mult_val, and add_val;
4574 then for each giv, check to see if its only use dies in a following
4575 memory address. If so, generate a new memory address and check to see
4576 if it is valid. If it is valid, then store the modified memory address,
4577 otherwise, mark the giv as not done so that it will get its own iv. */
4579 /* ??? Could try to optimize branches when it is known that a biv is always
4580 positive. */
4582 /* ??? When replacing a biv in a compare insn, we should replace it with the
4583 closest giv so that an optimized branch can still be recognized by the
4584 combiner, e.g. the VAX acb insn. */
4586 /* ??? Many of the checks involving uid_luid could be simplified if regscan
4587 was rerun in loop_optimize whenever a register was added or moved.
4588 Also, some of the optimizations could be a little less conservative. */
4590 /* Searches the insns between INSN and LOOP->END. Returns 1 if there
4591 is a backward branch in that range that branches to somewhere between
4592 LOOP->START and INSN. Returns 0 otherwise. */
4594 /* ??? This is a quadratic algorithm. It could be rewritten to be linear.
4595 In practice this is not a problem, because the function is seldom called
4596 and uses a negligible amount of CPU time on average. */
4598 static int
4599 back_branch_in_range_p (const struct loop *loop, rtx insn)
4601 rtx p, q, target_insn;
4602 rtx loop_start = loop->start;
4603 rtx loop_end = loop->end;
4604 rtx orig_loop_end = loop->end;
4606 /* Stop before we get to the backward branch at the end of the loop. */
4607 loop_end = prev_nonnote_insn (loop_end);
4608 if (BARRIER_P (loop_end))
4609 loop_end = PREV_INSN (loop_end);
4611 /* In case INSN has been deleted, search forward for the first
4612 non-deleted insn following it. */
4613 while (INSN_DELETED_P (insn))
4614 insn = NEXT_INSN (insn);
4616 /* Check for the case where insn is the last insn in the loop. Deal
4617 with the case where INSN was a deleted loop test insn, in which case
4618 it will now be the NOTE_LOOP_END. */
4619 if (insn == loop_end || insn == orig_loop_end)
4620 return 0;
4622 for (p = NEXT_INSN (insn); p != loop_end; p = NEXT_INSN (p))
4624 if (JUMP_P (p))
4626 target_insn = JUMP_LABEL (p);
4628 /* Search from loop_start to insn, to see if one of them is
4629 the target_insn. We can't use INSN_LUID comparisons here,
4630 since insn may not have an LUID entry. */
4631 for (q = loop_start; q != insn; q = NEXT_INSN (q))
4632 if (q == target_insn)
4633 return 1;
4637 return 0;
4640 /* Scan the loop body and call FNCALL for each insn. In addition to the
4641 LOOP and INSN parameters, MAYBE_MULTIPLE and NOT_EVERY_ITERATION are
4642 passed to the callback.
4644 NOT_EVERY_ITERATION is 1 if current insn is not known to be executed at
4645 least once for every loop iteration except for the last one.
4647 MAYBE_MULTIPLE is 1 if current insn may be executed more than once for every
4648 loop iteration. */
4650 typedef rtx (*loop_insn_callback) (struct loop *, rtx, int, int);
4651 static void
4652 for_each_insn_in_loop (struct loop *loop, loop_insn_callback fncall)
4654 int not_every_iteration = 0;
4655 int maybe_multiple = 0;
4656 int past_loop_latch = 0;
4657 bool exit_test_is_entry = false;
4658 rtx p;
4660 /* If loop_scan_start points to the loop exit test, the loop body
4661 cannot be counted on to run on every iteration, and we have to
4662 be wary of subversive use of gotos inside expression
4663 statements. */
4664 if (prev_nonnote_insn (loop->scan_start) != prev_nonnote_insn (loop->start))
4666 exit_test_is_entry = true;
4667 maybe_multiple = back_branch_in_range_p (loop, loop->scan_start);
4670 /* Scan through loop and update NOT_EVERY_ITERATION and MAYBE_MULTIPLE. */
4671 for (p = next_insn_in_loop (loop, loop->scan_start);
4672 p != NULL_RTX;
4673 p = next_insn_in_loop (loop, p))
4675 p = fncall (loop, p, not_every_iteration, maybe_multiple);
4677 /* Past CODE_LABEL, we get to insns that may be executed multiple
4678 times. The only way we can be sure that they can't is if every
4679 jump insn between here and the end of the loop either
4680 returns, exits the loop, is a jump to a location that is still
4681 behind the label, or is a jump to the loop start. */
4683 if (LABEL_P (p))
4685 rtx insn = p;
4687 maybe_multiple = 0;
4689 while (1)
4691 insn = NEXT_INSN (insn);
4692 if (insn == loop->scan_start)
4693 break;
4694 if (insn == loop->end)
4696 if (loop->top != 0)
4697 insn = loop->top;
4698 else
4699 break;
4700 if (insn == loop->scan_start)
4701 break;
4704 if (JUMP_P (insn)
4705 && GET_CODE (PATTERN (insn)) != RETURN
4706 && (!any_condjump_p (insn)
4707 || (JUMP_LABEL (insn) != 0
4708 && JUMP_LABEL (insn) != loop->scan_start
4709 && !loop_insn_first_p (p, JUMP_LABEL (insn)))))
4711 maybe_multiple = 1;
4712 break;
4717 /* Past a jump, we get to insns for which we can't count
4718 on whether they will be executed during each iteration. */
4719 /* This code appears twice in strength_reduce. There is also similar
4720 code in scan_loop. */
4721 if (JUMP_P (p)
4722 /* If we enter the loop in the middle, and scan around to the
4723 beginning, don't set not_every_iteration for that.
4724 This can be any kind of jump, since we want to know if insns
4725 will be executed if the loop is executed. */
4726 && (exit_test_is_entry
4727 || !(JUMP_LABEL (p) == loop->top
4728 && ((NEXT_INSN (NEXT_INSN (p)) == loop->end
4729 && any_uncondjump_p (p))
4730 || (NEXT_INSN (p) == loop->end
4731 && any_condjump_p (p))))))
4733 rtx label = 0;
4735 /* If this is a jump outside the loop, then it also doesn't
4736 matter. Check to see if the target of this branch is on the
4737 loop->exits_labels list. */
4739 for (label = loop->exit_labels; label; label = LABEL_NEXTREF (label))
4740 if (XEXP (label, 0) == JUMP_LABEL (p))
4741 break;
4743 if (!label)
4744 not_every_iteration = 1;
4747 /* Note if we pass a loop latch. If we do, then we cannot clear
4748 NOT_EVERY_ITERATION below when we pass the last CODE_LABEL in
4749 a loop since a jump before the last CODE_LABEL may have started
4750 a new loop iteration.
4752 Note that LOOP_TOP is only set for rotated loops and we need
4753 this check for all loops, so compare against the CODE_LABEL
4754 which immediately follows LOOP_START. */
4755 if (JUMP_P (p)
4756 && JUMP_LABEL (p) == NEXT_INSN (loop->start))
4757 past_loop_latch = 1;
4759 /* Unlike in the code motion pass where MAYBE_NEVER indicates that
4760 an insn may never be executed, NOT_EVERY_ITERATION indicates whether
4761 or not an insn is known to be executed each iteration of the
4762 loop, whether or not any iterations are known to occur.
4764 Therefore, if we have just passed a label and have no more labels
4765 between here and the test insn of the loop, and we have not passed
4766 a jump to the top of the loop, then we know these insns will be
4767 executed each iteration. */
4769 if (not_every_iteration
4770 && !past_loop_latch
4771 && LABEL_P (p)
4772 && no_labels_between_p (p, loop->end))
4773 not_every_iteration = 0;
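/* Illustrative note (not from the original source): insns following a
   conditional jump within the body, e.g. the code after
   "if (c) continue;", are passed with NOT_EVERY_ITERATION == 1, while
   insns after a CODE_LABEL that can be reached more than once per
   iteration are passed with MAYBE_MULTIPLE == 1.  */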
4777 static void
4778 loop_bivs_find (struct loop *loop)
4780 struct loop_regs *regs = LOOP_REGS (loop);
4781 struct loop_ivs *ivs = LOOP_IVS (loop);
4782 /* Temporary list pointers for traversing ivs->list. */
4783 struct iv_class *bl, **backbl;
4785 ivs->list = 0;
4787 for_each_insn_in_loop (loop, check_insn_for_bivs);
4789 /* Scan ivs->list to remove all regs that proved not to be bivs.
4790 Make a sanity check against regs->n_times_set. */
4791 for (backbl = &ivs->list, bl = *backbl; bl; bl = bl->next)
4793 if (REG_IV_TYPE (ivs, bl->regno) != BASIC_INDUCT
4794 /* Above happens if register modified by subreg, etc. */
4795 /* Make sure it is not recognized as a basic induction var: */
4796 || regs->array[bl->regno].n_times_set != bl->biv_count
4797 /* If never incremented, it is an invariant that we decided not to
4798 move, so leave it alone. */
4799 || ! bl->incremented)
4801 if (loop_dump_stream)
4802 fprintf (loop_dump_stream, "Biv %d: discarded, %s\n",
4803 bl->regno,
4804 (REG_IV_TYPE (ivs, bl->regno) != BASIC_INDUCT
4805 ? "not induction variable"
4806 : (! bl->incremented ? "never incremented"
4807 : "count error")));
4809 REG_IV_TYPE (ivs, bl->regno) = NOT_BASIC_INDUCT;
4810 *backbl = bl->next;
4812 else
4814 backbl = &bl->next;
4816 if (loop_dump_stream)
4817 fprintf (loop_dump_stream, "Biv %d: verified\n", bl->regno);
4823 /* Determine how BIVs are initialized by looking through the
4824 pre-header extended basic block. */
4825 static void
4826 loop_bivs_init_find (struct loop *loop)
4828 struct loop_ivs *ivs = LOOP_IVS (loop);
4829 /* Temporary list pointers for traversing ivs->list. */
4830 struct iv_class *bl;
4831 int call_seen;
4832 rtx p;
4834 /* Find initial value for each biv by searching backwards from loop_start,
4835 halting at first label. Also record any test condition. */
4837 call_seen = 0;
4838 for (p = loop->start; p && !LABEL_P (p); p = PREV_INSN (p))
4840 rtx test;
4842 note_insn = p;
4844 if (CALL_P (p))
4845 call_seen = 1;
4847 if (INSN_P (p))
4848 note_stores (PATTERN (p), record_initial, ivs);
4850 /* Record any test of a biv that branches around the loop if there is
4851 no store between it and the start of the loop. We only care about
4852 tests with constants and registers, and only certain of those. */
4853 if (JUMP_P (p)
4854 && JUMP_LABEL (p) != 0
4855 && next_real_insn (JUMP_LABEL (p)) == next_real_insn (loop->end)
4856 && (test = get_condition_for_loop (loop, p)) != 0
4857 && REG_P (XEXP (test, 0))
4858 && REGNO (XEXP (test, 0)) < max_reg_before_loop
4859 && (bl = REG_IV_CLASS (ivs, REGNO (XEXP (test, 0)))) != 0
4860 && valid_initial_value_p (XEXP (test, 1), p, call_seen, loop->start)
4861 && bl->init_insn == 0)
4863 /* If an NE test, we have an initial value! */
4864 if (GET_CODE (test) == NE)
4866 bl->init_insn = p;
4867 bl->init_set = gen_rtx_SET (VOIDmode,
4868 XEXP (test, 0), XEXP (test, 1));
4870 else
4871 bl->initial_test = test;
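/* Illustrative example (not from the original source): given a
   pre-header sequence such as

     if (i != 0)
       goto past_loop;

   the NE test implies i == 0 whenever the loop is entered through the
   fall-through edge, so i's initial value is recorded as 0.  */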
4877 /* Look at each biv and see if we can say anything better about its
4878 initial value from any initializing insns set up above. (This is done
4879 in two passes to avoid missing SETs in a PARALLEL.) */
4880 static void
4881 loop_bivs_check (struct loop *loop)
4883 struct loop_ivs *ivs = LOOP_IVS (loop);
4884 /* Temporary list pointers for traversing ivs->list. */
4885 struct iv_class *bl;
4886 struct iv_class **backbl;
4888 for (backbl = &ivs->list; (bl = *backbl); backbl = &bl->next)
4890 rtx src;
4891 rtx note;
4893 if (! bl->init_insn)
4894 continue;
4896 /* If INIT_INSN has a REG_EQUAL or REG_EQUIV note and the value
4897 is a constant, use that value. */
4898 if (((note = find_reg_note (bl->init_insn, REG_EQUAL, 0)) != NULL
4899 && CONSTANT_P (XEXP (note, 0)))
4900 || ((note = find_reg_note (bl->init_insn, REG_EQUIV, 0)) != NULL
4901 && CONSTANT_P (XEXP (note, 0))))
4902 src = XEXP (note, 0);
4903 else
4904 src = SET_SRC (bl->init_set);
4906 if (loop_dump_stream)
4907 fprintf (loop_dump_stream,
4908 "Biv %d: initialized at insn %d: initial value ",
4909 bl->regno, INSN_UID (bl->init_insn));
4911 if ((GET_MODE (src) == GET_MODE (regno_reg_rtx[bl->regno])
4912 || GET_MODE (src) == VOIDmode)
4913 && valid_initial_value_p (src, bl->init_insn,
4914 LOOP_INFO (loop)->pre_header_has_call,
4915 loop->start))
4917 bl->initial_value = src;
4919 if (loop_dump_stream)
4921 print_simple_rtl (loop_dump_stream, src);
4922 fputc ('\n', loop_dump_stream);
4925 /* If we can't make it a giv,
4926 let the biv keep its initial value of "itself". */
4927 else if (loop_dump_stream)
4928 fprintf (loop_dump_stream, "is complex\n");
4933 /* Search the loop for general induction variables. */
4935 static void
4936 loop_givs_find (struct loop* loop)
4938 for_each_insn_in_loop (loop, check_insn_for_givs);
4942 /* For each giv for which we still don't know whether or not it is
4943 replaceable, check to see if it is replaceable because its final value
4944 can be calculated. */
4946 static void
4947 loop_givs_check (struct loop *loop)
4949 struct loop_ivs *ivs = LOOP_IVS (loop);
4950 struct iv_class *bl;
4952 for (bl = ivs->list; bl; bl = bl->next)
4954 struct induction *v;
4956 for (v = bl->giv; v; v = v->next_iv)
4957 if (! v->replaceable && ! v->not_replaceable)
4958 check_final_value (loop, v);
4962 /* Try to generate the simplest rtx for the expression
4963 (PLUS (MULT mult1 mult2) add1). This is used to calculate the initial
4964 value of giv's. */
4966 static rtx
4967 fold_rtx_mult_add (rtx mult1, rtx mult2, rtx add1, enum machine_mode mode)
4969 rtx temp, mult_res;
4970 rtx result;
4972 /* The modes must all be the same. This should always be true. For now,
4973 check to make sure. */
4974 gcc_assert (GET_MODE (mult1) == mode || GET_MODE (mult1) == VOIDmode);
4975 gcc_assert (GET_MODE (mult2) == mode || GET_MODE (mult2) == VOIDmode);
4976 gcc_assert (GET_MODE (add1) == mode || GET_MODE (add1) == VOIDmode);
4978 /* Ensure that if at least one of mult1/mult2 is constant, then mult2
4979 will be a constant. */
4980 if (GET_CODE (mult1) == CONST_INT)
4982 temp = mult2;
4983 mult2 = mult1;
4984 mult1 = temp;
4987 mult_res = simplify_binary_operation (MULT, mode, mult1, mult2);
4988 if (! mult_res)
4989 mult_res = gen_rtx_MULT (mode, mult1, mult2);
4991 /* Again, put the constant second. */
4992 if (GET_CODE (add1) == CONST_INT)
4994 temp = add1;
4995 add1 = mult_res;
4996 mult_res = temp;
4999 result = simplify_binary_operation (PLUS, mode, add1, mult_res);
5000 if (! result)
5001 result = gen_rtx_PLUS (mode, add1, mult_res);
5003 return result;
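/* Illustrative example (not from the original source):
   fold_rtx_mult_add (const_int 3, const_int 4, const_int 5, SImode)
   folds to (const_int 17); with mult1 == (reg 100) it instead yields
   (plus (mult (reg 100) (const_int 4)) (const_int 5)).  */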
5006 /* Search the list of induction structs for the biv BL, trying to calculate
5007 the total increment value for one iteration of the loop as a constant.
5009 Returns the increment value as an rtx, simplified as much as possible,
5010 if it can be calculated. Otherwise, returns 0. */
5012 static rtx
5013 biv_total_increment (const struct iv_class *bl)
5015 struct induction *v;
5016 rtx result;
5018 /* For increment, must check every instruction that sets it. Each
5019 instruction must be executed only once each time through the loop.
5020 To verify this, we check that the insn is always executed, and that
5021 there are no backward branches after the insn that branch to before it.
5022 Also, the insn must have a mult_val of one (to make sure it really is
5023 an increment). */
5025 result = const0_rtx;
5026 for (v = bl->biv; v; v = v->next_iv)
5028 if (v->always_computable && v->mult_val == const1_rtx
5029 && ! v->maybe_multiple
5030 && SCALAR_INT_MODE_P (v->mode))
5032 /* If we have already counted it, skip it. */
5033 if (v->same)
5034 continue;
5036 result = fold_rtx_mult_add (result, const1_rtx, v->add_val, v->mode);
5038 else
5039 return 0;
5042 return result;
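/* Illustrative example (not from the original source): a biv that is
   unconditionally incremented twice per iteration, by 4 and then by 8,
   has a total increment of (const_int 12); if any increment is
   conditional or has a nonunit mult_val, 0 is returned instead.  */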
5045 /* Try to prove that the register is dead after the loop exits. Trace every
5046 loop exit looking for an insn that will always be executed, which sets
5047 the register to some value, and appears before the first use of the register
5048 is found. If successful, then return 1, otherwise return 0. */
5050 /* ?? Could be made more intelligent in the handling of jumps, so that
5051 it can search past if statements and other similar structures. */
5053 static int
5054 reg_dead_after_loop (const struct loop *loop, rtx reg)
5056 rtx insn, label;
5057 int jump_count = 0;
5058 int label_count = 0;
5060 /* In addition to checking all exits of this loop, we must also check
5061 all exits of inner nested loops that would exit this loop. We don't
5062 have any way to identify those, so we just give up if there are any
5063 such inner loop exits. */
5065 for (label = loop->exit_labels; label; label = LABEL_NEXTREF (label))
5066 label_count++;
5068 if (label_count != loop->exit_count)
5069 return 0;
5071 /* HACK: Must also search the loop fall through exit, create a label_ref
5072 here which points to the loop->end, and append the loop->exit_labels
5073 list to it. */
5074 label = gen_rtx_LABEL_REF (VOIDmode, loop->end);
5075 LABEL_NEXTREF (label) = loop->exit_labels;
5077 for (; label; label = LABEL_NEXTREF (label))
5079 /* Succeed if we find an insn which sets the biv or if we reach the end
5080 of the function. Fail if we find an insn that uses the biv, or if we
5081 come to a conditional jump. */
5083 insn = NEXT_INSN (XEXP (label, 0));
5084 while (insn)
5086 if (INSN_P (insn))
5088 rtx set, note;
5090 if (reg_referenced_p (reg, PATTERN (insn)))
5091 return 0;
5093 note = find_reg_equal_equiv_note (insn);
5094 if (note && reg_overlap_mentioned_p (reg, XEXP (note, 0)))
5095 return 0;
5097 set = single_set (insn);
5098 if (set && rtx_equal_p (SET_DEST (set), reg))
5099 break;
5101 if (JUMP_P (insn))
5103 if (GET_CODE (PATTERN (insn)) == RETURN)
5104 break;
5105 else if (!any_uncondjump_p (insn)
5106 /* Prevent infinite loop following infinite loops. */
5107 || jump_count++ > 20)
5108 return 0;
5109 else
5110 insn = JUMP_LABEL (insn);
5114 insn = NEXT_INSN (insn);
5118 /* Success, the register is dead on all loop exits. */
5119 return 1;
5122 /* Try to calculate the final value of the biv, the value it will have at
5123 the end of the loop. If we can do it, return that value. */
5125 static rtx
5126 final_biv_value (const struct loop *loop, struct iv_class *bl)
5128 unsigned HOST_WIDE_INT n_iterations = LOOP_INFO (loop)->n_iterations;
5129 rtx increment, tem;
5131 /* ??? This only works for MODE_INT biv's. Reject all others for now. */
5133 if (GET_MODE_CLASS (bl->biv->mode) != MODE_INT)
5134 return 0;
5136 /* The final value for reversed bivs must be calculated differently than
5137 for ordinary bivs. In this case, there is already an insn after the
5138 loop which sets this biv's final value (if necessary), and there are
5139 no other loop exits, so we can return any value. */
5140 if (bl->reversed)
5142 if (loop_dump_stream)
5143 fprintf (loop_dump_stream,
5144 "Final biv value for %d, reversed biv.\n", bl->regno);
5146 return const0_rtx;
5149 /* Try to calculate the final value as initial value + (number of iterations
5150 * increment). For this to work, increment must be invariant, the only
5151 exit from the loop must be the fall through at the bottom (otherwise
5152 it may not have its final value when the loop exits), and the initial
5153 value of the biv must be invariant. */
5155 if (n_iterations != 0
5156 && ! loop->exit_count
5157 && loop_invariant_p (loop, bl->initial_value))
5159 increment = biv_total_increment (bl);
5161 if (increment && loop_invariant_p (loop, increment))
5163 /* We can calculate the loop exit value; emit insns after the loop
5164 end to calculate this value into a temporary register in
5165 case it is needed later. */
5167 tem = gen_reg_rtx (bl->biv->mode);
5168 record_base_value (REGNO (tem), bl->biv->add_val, 0);
5169 loop_iv_add_mult_sink (loop, increment, GEN_INT (n_iterations),
5170 bl->initial_value, tem);
5172 if (loop_dump_stream)
5173 fprintf (loop_dump_stream,
5174 "Final biv value for %d, calculated.\n", bl->regno);
5176 return tem;
5180 /* Check to see if the biv is dead at all loop exits. */
5181 if (reg_dead_after_loop (loop, bl->biv->src_reg))
5183 if (loop_dump_stream)
5184 fprintf (loop_dump_stream,
5185 "Final biv value for %d, biv dead after loop exit.\n",
5186 bl->regno);
5188 return const0_rtx;
5191 return 0;
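/* Illustrative example (not from the original source): for
   "for (i = 0; i < 100; i++)" with a known iteration count of 100,
   a single fall-through exit, and an invariant initial value, the
   final value is computed as 0 + 100 * 1 == 100 and materialized in
   a fresh pseudo after the loop end.  */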
5194 /* Return nonzero if it is possible to eliminate the biv BL provided
5195 all givs are reduced. This is possible if either the reg is not
5196 used outside the loop, or we can compute what its final value will
5197 be. */
5199 static int
5200 loop_biv_eliminable_p (struct loop *loop, struct iv_class *bl,
5201 int threshold, int insn_count)
5203 /* For architectures with a decrement_and_branch_until_zero insn,
5204 don't do this if we put a REG_NONNEG note on the endtest for this
5205 biv. */
5207 #ifdef HAVE_decrement_and_branch_until_zero
5208 if (bl->nonneg)
5210 if (loop_dump_stream)
5211 fprintf (loop_dump_stream,
5212 "Cannot eliminate nonneg biv %d.\n", bl->regno);
5213 return 0;
5215 #endif
5217 /* Check whether the biv is used outside the loop or has a final value.
5218 Compare against bl->init_insn rather than loop->start. We aren't
5219 concerned with any uses of the biv between init_insn and
5220 loop->start since these won't be affected by the value of the biv
5221 elsewhere in the function, so long as init_insn doesn't use the
5222 biv itself. */
5224 if ((REGNO_LAST_LUID (bl->regno) < INSN_LUID (loop->end)
5225 && bl->init_insn
5226 && INSN_UID (bl->init_insn) < max_uid_for_loop
5227 && REGNO_FIRST_LUID (bl->regno) >= INSN_LUID (bl->init_insn)
5228 && ! reg_mentioned_p (bl->biv->dest_reg, SET_SRC (bl->init_set)))
5229 || (bl->final_value = final_biv_value (loop, bl)))
5230 return maybe_eliminate_biv (loop, bl, 0, threshold, insn_count);
5232 if (loop_dump_stream)
5234 fprintf (loop_dump_stream,
5235 "Cannot eliminate biv %d.\n",
5236 bl->regno);
5237 fprintf (loop_dump_stream,
5238 "First use: insn %d, last use: insn %d.\n",
5239 REGNO_FIRST_UID (bl->regno),
5240 REGNO_LAST_UID (bl->regno));
5242 return 0;
5246 /* Reduce each giv of BL that we have decided to reduce. */
5248 static void
5249 loop_givs_reduce (struct loop *loop, struct iv_class *bl)
5251 struct induction *v;
5253 for (v = bl->giv; v; v = v->next_iv)
5255 struct induction *tv;
5256 if (! v->ignore && v->same == 0)
5258 int auto_inc_opt = 0;
5260 /* If the code for derived givs immediately below has already
5261 allocated a new_reg, we must keep it. */
5262 if (! v->new_reg)
5263 v->new_reg = gen_reg_rtx (v->mode);
5265 #ifdef AUTO_INC_DEC
5266 /* If the target has auto-increment addressing modes, and
5267 this is an address giv, then try to put the increment
5268 immediately after its use, so that flow can create an
5269 auto-increment addressing mode. */
5270 /* Don't do this for loops entered at the bottom, to avoid
5271 this invalid transformation:
5272 jmp L; -> jmp L;
5273 TOP: TOP:
5274 use giv use giv
5275 L: inc giv
5276 inc biv L:
5277 test biv test giv
5278 cbr TOP cbr TOP
5280 if (v->giv_type == DEST_ADDR && bl->biv_count == 1
5281 && bl->biv->always_executed && ! bl->biv->maybe_multiple
5282 /* We don't handle reversed biv's because bl->biv->insn
5283 does not have a valid INSN_LUID. */
5284 && ! bl->reversed
5285 && v->always_executed && ! v->maybe_multiple
5286 && INSN_UID (v->insn) < max_uid_for_loop
5287 && !loop->top)
5289 /* If other giv's have been combined with this one, then
5290 this will work only if all uses of the other giv's occur
5291 before this giv's insn. This is difficult to check.
5293 We simplify this by looking for the common case where
5294 there is one DEST_REG giv, and this giv's insn is the
5295 last use of the dest_reg of that DEST_REG giv. If the
5296 increment occurs after the address giv, then we can
5297 perform the optimization. (Otherwise, the increment
5298 would have to go before other_giv, and we would not be
5299 able to combine it with the address giv to get an
5300 auto-inc address.) */
5301 if (v->combined_with)
5303 struct induction *other_giv = 0;
5305 for (tv = bl->giv; tv; tv = tv->next_iv)
5306 if (tv->same == v)
5308 if (other_giv)
5309 break;
5310 else
5311 other_giv = tv;
5313 if (! tv && other_giv
5314 && REGNO (other_giv->dest_reg) < max_reg_before_loop
5315 && (REGNO_LAST_UID (REGNO (other_giv->dest_reg))
5316 == INSN_UID (v->insn))
5317 && INSN_LUID (v->insn) < INSN_LUID (bl->biv->insn))
5318 auto_inc_opt = 1;
5320 /* Check for case where increment is before the address
5321 giv. Do this test in "loop order". */
5322 else if ((INSN_LUID (v->insn) > INSN_LUID (bl->biv->insn)
5323 && (INSN_LUID (v->insn) < INSN_LUID (loop->scan_start)
5324 || (INSN_LUID (bl->biv->insn)
5325 > INSN_LUID (loop->scan_start))))
5326 || (INSN_LUID (v->insn) < INSN_LUID (loop->scan_start)
5327 && (INSN_LUID (loop->scan_start)
5328 < INSN_LUID (bl->biv->insn))))
5329 auto_inc_opt = -1;
5330 else
5331 auto_inc_opt = 1;
5333 #ifdef HAVE_cc0
5335 rtx prev;
5337 /* We can't put an insn immediately after one setting
5338 cc0, or immediately before one using cc0. */
5339 if ((auto_inc_opt == 1 && sets_cc0_p (PATTERN (v->insn)))
5340 || (auto_inc_opt == -1
5341 && (prev = prev_nonnote_insn (v->insn)) != 0
5342 && INSN_P (prev)
5343 && sets_cc0_p (PATTERN (prev))))
5344 auto_inc_opt = 0;
5346 #endif
5348 if (auto_inc_opt)
5349 v->auto_inc_opt = 1;
5351 #endif
5353 /* For each place where the biv is incremented, add an insn
5354 to increment the new, reduced reg for the giv. */
5355 for (tv = bl->biv; tv; tv = tv->next_iv)
5357 rtx insert_before;
5359 /* Skip if location is the same as a previous one. */
5360 if (tv->same)
5361 continue;
5362 if (! auto_inc_opt)
5363 insert_before = NEXT_INSN (tv->insn);
5364 else if (auto_inc_opt == 1)
5365 insert_before = NEXT_INSN (v->insn);
5366 else
5367 insert_before = v->insn;
5369 if (tv->mult_val == const1_rtx)
5370 loop_iv_add_mult_emit_before (loop, tv->add_val, v->mult_val,
5371 v->new_reg, v->new_reg,
5372 0, insert_before);
5373 else /* tv->mult_val == const0_rtx */
5374 /* A multiply is acceptable here
5375 since this is presumed to be seldom executed. */
5376 loop_iv_add_mult_emit_before (loop, tv->add_val, v->mult_val,
5377 v->add_val, v->new_reg,
5378 0, insert_before);
5381 /* Add code at loop start to initialize giv's reduced reg. */
5383 loop_iv_add_mult_hoist (loop,
5384 extend_value_for_giv (v, bl->initial_value),
5385 v->mult_val, v->add_val, v->new_reg);
5391 /* Check for givs whose first use is their definition and whose
5392 last use is the definition of another giv. If so, it is likely
5393 dead and should not be used to derive another giv nor to
5394 eliminate a biv. */
5396 static void
5397 loop_givs_dead_check (struct loop *loop ATTRIBUTE_UNUSED, struct iv_class *bl)
5399 struct induction *v;
5401 for (v = bl->giv; v; v = v->next_iv)
5403 if (v->ignore
5404 || (v->same && v->same->ignore))
5405 continue;
5407 if (v->giv_type == DEST_REG
5408 && REGNO_FIRST_UID (REGNO (v->dest_reg)) == INSN_UID (v->insn))
5410 struct induction *v1;
5412 for (v1 = bl->giv; v1; v1 = v1->next_iv)
5413 if (REGNO_LAST_UID (REGNO (v->dest_reg)) == INSN_UID (v1->insn))
5414 v->maybe_dead = 1;
5420 static void
5421 loop_givs_rescan (struct loop *loop, struct iv_class *bl, rtx *reg_map)
5423 struct induction *v;
5425 for (v = bl->giv; v; v = v->next_iv)
5427 if (v->same && v->same->ignore)
5428 v->ignore = 1;
5430 if (v->ignore)
5431 continue;
5433 /* Update expression if this was combined, in case other giv was
5434 replaced. */
5435 if (v->same)
5436 v->new_reg = replace_rtx (v->new_reg,
5437 v->same->dest_reg, v->same->new_reg);
5439 /* See if this register is known to be a pointer to something. If
5440 so, see if we can find the alignment. First see if there is a
5441 destination register that is a pointer. If so, this shares the
5442 alignment too. Next see if we can deduce anything from the
5443 computational information. If not, and this is a DEST_ADDR
5444 giv, at least we know that it's a pointer, though we don't know
5445 the alignment. */
5446 if (REG_P (v->new_reg)
5447 && v->giv_type == DEST_REG
5448 && REG_POINTER (v->dest_reg))
5449 mark_reg_pointer (v->new_reg,
5450 REGNO_POINTER_ALIGN (REGNO (v->dest_reg)));
5451 else if (REG_P (v->new_reg)
5452 && REG_POINTER (v->src_reg))
5454 unsigned int align = REGNO_POINTER_ALIGN (REGNO (v->src_reg));
5456 if (align == 0
5457 || GET_CODE (v->add_val) != CONST_INT
5458 || INTVAL (v->add_val) % (align / BITS_PER_UNIT) != 0)
5459 align = 0;
5461 mark_reg_pointer (v->new_reg, align);
5463 else if (REG_P (v->new_reg)
5464 && REG_P (v->add_val)
5465 && REG_POINTER (v->add_val))
5467 unsigned int align = REGNO_POINTER_ALIGN (REGNO (v->add_val));
5469 if (align == 0 || GET_CODE (v->mult_val) != CONST_INT
5470 || INTVAL (v->mult_val) % (align / BITS_PER_UNIT) != 0)
5471 align = 0;
5473 mark_reg_pointer (v->new_reg, align);
5475 else if (REG_P (v->new_reg) && v->giv_type == DEST_ADDR)
5476 mark_reg_pointer (v->new_reg, 0);
5478 if (v->giv_type == DEST_ADDR)
5480 /* Store reduced reg as the address in the memref where we found
5481 this giv. */
5482 if (validate_change_maybe_volatile (v->insn, v->location,
5483 v->new_reg))
5484 /* Yay, it worked! */;
5485 /* Not replaceable; emit an insn to set the original
5486 giv reg from the reduced giv. */
5487 else if (REG_P (*v->location))
5488 loop_insn_emit_before (loop, 0, v->insn,
5489 gen_move_insn (*v->location,
5490 v->new_reg));
5491 else if (GET_CODE (*v->location) == PLUS
5492 && REG_P (XEXP (*v->location, 0))
5493 && CONSTANT_P (XEXP (*v->location, 1)))
5494 loop_insn_emit_before (loop, 0, v->insn,
5495 gen_move_insn (XEXP (*v->location, 0),
5496 gen_rtx_MINUS
5497 (GET_MODE (*v->location),
5498 v->new_reg,
5499 XEXP (*v->location, 1))));
5500 else
5502 /* If it wasn't a reg, create a pseudo and use that. */
5503 rtx reg, seq;
5504 start_sequence ();
5505 reg = force_reg (v->mode, *v->location);
5506 seq = get_insns ();
5507 end_sequence ();
5508 loop_insn_emit_before (loop, 0, v->insn, seq);
5509 if (!validate_change_maybe_volatile (v->insn, v->location, reg))
5510 gcc_unreachable ();
5513 else if (v->replaceable)
5515 reg_map[REGNO (v->dest_reg)] = v->new_reg;
5517 else
5519 rtx original_insn = v->insn;
5520 rtx note;
5522 /* Not replaceable; emit an insn to set the original giv reg from
5523 the reduced giv, same as above. */
5524 v->insn = loop_insn_emit_after (loop, 0, original_insn,
5525 gen_move_insn (v->dest_reg,
5526 v->new_reg));
5528 /* The original insn may have a REG_EQUAL note. This note is
5529 now incorrect and may result in invalid substitutions later.
5530 The original insn is dead, but may be part of a libcall
5531 sequence, which doesn't seem worth the bother of handling. */
5532 note = find_reg_note (original_insn, REG_EQUAL, NULL_RTX);
5533 if (note)
5534 remove_note (original_insn, note);
5537 /* When a loop is reversed, givs which depend on the reversed
5538 biv, and which are live outside the loop, must be set to their
5539 correct final value. This insn is only needed if the giv is
5540 not replaceable. The correct final value is the same as the
5541 value that the giv starts the reversed loop with. */
5542 if (bl->reversed && ! v->replaceable)
5543 loop_iv_add_mult_sink (loop,
5544 extend_value_for_giv (v, bl->initial_value),
5545 v->mult_val, v->add_val, v->dest_reg);
5546 else if (v->final_value)
5547 loop_insn_sink_or_swim (loop,
5548 gen_load_of_final_value (v->dest_reg,
5549 v->final_value));
5551 if (loop_dump_stream)
5553 fprintf (loop_dump_stream, "giv at %d reduced to ",
5554 INSN_UID (v->insn));
5555 print_simple_rtl (loop_dump_stream, v->new_reg);
5556 fprintf (loop_dump_stream, "\n");
5562 static int
5563 loop_giv_reduce_benefit (struct loop *loop ATTRIBUTE_UNUSED,
5564 struct iv_class *bl, struct induction *v,
5565 rtx test_reg)
5567 int add_cost;
5568 int benefit;
5570 benefit = v->benefit;
5571 PUT_MODE (test_reg, v->mode);
5572 add_cost = iv_add_mult_cost (bl->biv->add_val, v->mult_val,
5573 test_reg, test_reg);
5575 /* Reduce benefit if not replaceable, since we will insert a
5576 move-insn to replace the insn that calculates this giv. Don't do
5577 this unless the giv is a user variable, since it will often be
5578 marked non-replaceable because of the duplication of the exit
5579 code outside the loop. In such a case, the copies we insert are
5580 dead and will be deleted. So they don't have a cost. Similar
5581 situations exist. */
5582 /* ??? The new final_[bg]iv_value code does a much better job of
5583 finding replaceable giv's, and hence this code may no longer be
5584 necessary. */
5585 if (! v->replaceable && ! bl->eliminable
5586 && REG_USERVAR_P (v->dest_reg))
5587 benefit -= copy_cost;
5589 /* Decrease the benefit to count the add-insns that we will insert
5590 to increment the reduced reg for the giv. ??? This can
5591 overestimate the run-time cost of the additional insns, e.g. if
5592 there are multiple basic blocks that increment the biv, but only
5593 one of these blocks is executed during each iteration. There is
5594 no good way to detect cases like this with the current structure
5595 of the loop optimizer. This code is more accurate for
5596 determining code size than run-time benefits. */
5597 benefit -= add_cost * bl->biv_count;
5599 /* Decide whether to strength-reduce this giv or to leave the code
5600 unchanged (recompute it from the biv each time it is used). This
5601 decision can be made independently for each giv. */
5603 #ifdef AUTO_INC_DEC
5604 /* Attempt to guess whether autoincrement will handle some of the
5605 new add insns; if so, increase BENEFIT (undo the subtraction of
5606 add_cost that was done above). */
5607 if (v->giv_type == DEST_ADDR
5608 /* Increasing the benefit is risky, since this is only a guess.
5609 Avoid increasing register pressure in cases where there would
5610 be no other benefit from reducing this giv. */
5611 && benefit > 0
5612 && GET_CODE (v->mult_val) == CONST_INT)
5614 int size = GET_MODE_SIZE (GET_MODE (v->mem));
5616 if (HAVE_POST_INCREMENT
5617 && INTVAL (v->mult_val) == size)
5618 benefit += add_cost * bl->biv_count;
5619 else if (HAVE_PRE_INCREMENT
5620 && INTVAL (v->mult_val) == size)
5621 benefit += add_cost * bl->biv_count;
5622 else if (HAVE_POST_DECREMENT
5623 && -INTVAL (v->mult_val) == size)
5624 benefit += add_cost * bl->biv_count;
5625 else if (HAVE_PRE_DECREMENT
5626 && -INTVAL (v->mult_val) == size)
5627 benefit += add_cost * bl->biv_count;
5629 #endif
5631 return benefit;
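/* Worked example (editor's note, with made-up numbers): for a
   DEST_ADDR giv with benefit 6, add_cost 2 and biv_count 2, the
   subtraction above yields 6 - 2*2 = 2.  If the target has
   POST_INCREMENT and mult_val equals the size of the accessed
   mode, the 4 is added back and the benefit is 6 again.  */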
5635 /* Free IV structures for LOOP. */
5637 static void
5638 loop_ivs_free (struct loop *loop)
5640 struct loop_ivs *ivs = LOOP_IVS (loop);
5641 struct iv_class *iv = ivs->list;
5643 free (ivs->regs);
5645 while (iv)
5647 struct iv_class *next = iv->next;
5648 struct induction *induction;
5649 struct induction *next_induction;
5651 for (induction = iv->biv; induction; induction = next_induction)
5653 next_induction = induction->next_iv;
5654 free (induction);
5656 for (induction = iv->giv; induction; induction = next_induction)
5658 next_induction = induction->next_iv;
5659 free (induction);
5662 free (iv);
5663 iv = next;
5667 /* Look back before LOOP->START for the insn that sets REG and return
5668 the equivalent constant if there is a REG_EQUAL note otherwise just
5669 the SET_SRC of REG. */
5671 static rtx
5672 loop_find_equiv_value (const struct loop *loop, rtx reg)
5674 rtx loop_start = loop->start;
5675 rtx insn, set;
5676 rtx ret;
5678 ret = reg;
5679 for (insn = PREV_INSN (loop_start); insn; insn = PREV_INSN (insn))
5681 if (LABEL_P (insn))
5682 break;
5684 else if (INSN_P (insn) && reg_set_p (reg, insn))
5686 /* We found the last insn before the loop that sets the register.
5687 If it sets the entire register, and has a REG_EQUAL note,
5688 then use the value of the REG_EQUAL note. */
5689 if ((set = single_set (insn))
5690 && (SET_DEST (set) == reg))
5692 rtx note = find_reg_note (insn, REG_EQUAL, NULL_RTX);
5694 /* Only use the REG_EQUAL note if it is a constant.
5695 Other things, divide in particular, will cause
5696 problems later if we use them. */
5697 if (note && GET_CODE (XEXP (note, 0)) != EXPR_LIST
5698 && CONSTANT_P (XEXP (note, 0)))
5699 ret = XEXP (note, 0);
5700 else
5701 ret = SET_SRC (set);
5703 /* We cannot do this if it changes between the
5704 assignment and loop start though. */
5705 if (modified_between_p (ret, insn, loop_start))
5706 ret = reg;
5708 break;
5711 return ret;
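/* Hypothetical example (editor's note; register numbers made up):
   if the last insn before the loop setting REG is
     (set (reg 60) (plus (reg 61) (const_int 4)))
   with a REG_EQUAL note of (const_int 100), and nothing modifies
   the values before loop->start, then (const_int 100) is returned;
   without the note the SET_SRC,
   (plus (reg 61) (const_int 4)), would be returned instead.  */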
5714 /* Find and return register term common to both expressions OP0 and
5715 OP1 or NULL_RTX if no such term exists. Each expression must be a
5716 REG or a PLUS of a REG. */
5718 static rtx
5719 find_common_reg_term (rtx op0, rtx op1)
5721 if ((REG_P (op0) || GET_CODE (op0) == PLUS)
5722 && (REG_P (op1) || GET_CODE (op1) == PLUS))
5724 rtx op00;
5725 rtx op01;
5726 rtx op10;
5727 rtx op11;
5729 if (GET_CODE (op0) == PLUS)
5730 op01 = XEXP (op0, 1), op00 = XEXP (op0, 0);
5731 else
5732 op01 = const0_rtx, op00 = op0;
5734 if (GET_CODE (op1) == PLUS)
5735 op11 = XEXP (op1, 1), op10 = XEXP (op1, 0);
5736 else
5737 op11 = const0_rtx, op10 = op1;
5739 /* Find and return common register term if present. */
5740 if (REG_P (op00) && (op00 == op10 || op00 == op11))
5741 return op00;
5742 else if (REG_P (op01) && (op01 == op10 || op01 == op11))
5743 return op01;
5746 /* No common register term found. */
5747 return NULL_RTX;
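/* Hypothetical example (editor's note; assumes the usual sharing
   of REG rtxes for a pseudo): with
     op0 = (plus (reg 70) (const_int 8)) and op1 = (reg 70)
   the decomposition gives op00 = (reg 70), op01 = (const_int 8),
   op10 = (reg 70), op11 = (const_int 0), so (reg 70) is returned
   as the common register term.  */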
5750 /* Determine the loop iterator and calculate the number of loop
5751 iterations. Returns the exact number of loop iterations if it can
5752 be calculated, otherwise returns zero. */
5754 static unsigned HOST_WIDE_INT
5755 loop_iterations (struct loop *loop)
5757 struct loop_info *loop_info = LOOP_INFO (loop);
5758 struct loop_ivs *ivs = LOOP_IVS (loop);
5759 rtx comparison, comparison_value;
5760 rtx iteration_var, initial_value, increment, final_value;
5761 enum rtx_code comparison_code;
5762 HOST_WIDE_INT inc;
5763 unsigned HOST_WIDE_INT abs_inc;
5764 unsigned HOST_WIDE_INT abs_diff;
5765 int off_by_one;
5766 int increment_dir;
5767 int unsigned_p, compare_dir, final_larger;
5768 rtx last_loop_insn;
5769 struct iv_class *bl;
5771 loop_info->n_iterations = 0;
5772 loop_info->initial_value = 0;
5773 loop_info->initial_equiv_value = 0;
5774 loop_info->comparison_value = 0;
5775 loop_info->final_value = 0;
5776 loop_info->final_equiv_value = 0;
5777 loop_info->increment = 0;
5778 loop_info->iteration_var = 0;
5779 loop_info->iv = 0;
5781 /* We used to use prev_nonnote_insn here, but that fails because it might
5782 accidentally get the branch for a contained loop if the branch for this
5783 loop was deleted. We can only trust branches immediately before the
5784 loop_end. */
5785 last_loop_insn = PREV_INSN (loop->end);
5787 /* ??? We should probably try harder to find the jump insn
5788 at the end of the loop. The following code assumes that
5789 the last loop insn is a jump to the top of the loop. */
5790 if (!JUMP_P (last_loop_insn))
5792 if (loop_dump_stream)
5793 fprintf (loop_dump_stream,
5794 "Loop iterations: No final conditional branch found.\n");
5795 return 0;
5798 /* If there is more than a single jump to the top of the loop
5799 we cannot (easily) determine the iteration count. */
5800 if (LABEL_NUSES (JUMP_LABEL (last_loop_insn)) > 1)
5802 if (loop_dump_stream)
5803 fprintf (loop_dump_stream,
5804 "Loop iterations: Loop has multiple back edges.\n");
5805 return 0;
5808 /* Find the iteration variable. If the last insn is a conditional
5809 branch, and the insn before tests a register value, make that the
5810 iteration variable. */
5812 comparison = get_condition_for_loop (loop, last_loop_insn);
5813 if (comparison == 0)
5815 if (loop_dump_stream)
5816 fprintf (loop_dump_stream,
5817 "Loop iterations: No final comparison found.\n");
5818 return 0;
5821 /* ??? Get_condition may switch position of induction variable and
5822 invariant register when it canonicalizes the comparison. */
5824 comparison_code = GET_CODE (comparison);
5825 iteration_var = XEXP (comparison, 0);
5826 comparison_value = XEXP (comparison, 1);
5828 if (!REG_P (iteration_var))
5830 if (loop_dump_stream)
5831 fprintf (loop_dump_stream,
5832 "Loop iterations: Comparison not against register.\n");
5833 return 0;
5836 /* The only new registers that are created before loop iterations
5837 are givs made from biv increments or registers created by
5838 load_mems. In the latter case, it is possible that try_copy_prop
5839 will propagate a new pseudo into the old iteration register but
5840 this will be marked by having the REG_USERVAR_P bit set. */
5842 gcc_assert ((unsigned) REGNO (iteration_var) < ivs->n_regs
5843 || REG_USERVAR_P (iteration_var));
5845 /* Determine the initial value of the iteration variable, and the amount
5846 that it is incremented each loop. Use the tables constructed by
5847 the strength reduction pass to calculate these values. */
5849 /* Clear the result values, in case no answer can be found. */
5850 initial_value = 0;
5851 increment = 0;
5853 /* The iteration variable can be either a giv or a biv. Check to see
5854 which it is, and compute the variable's initial value, and increment
5855 value if possible. */
5857 /* If this is a new register, can't handle it since we don't have any
5858 reg_iv_type entry for it. */
5859 if ((unsigned) REGNO (iteration_var) >= ivs->n_regs)
5861 if (loop_dump_stream)
5862 fprintf (loop_dump_stream,
5863 "Loop iterations: No reg_iv_type entry for iteration var.\n");
5864 return 0;
5867 /* Reject iteration variables larger than the host wide int size, since they
5868 could result in a number of iterations greater than the range of our
5869 `unsigned HOST_WIDE_INT' variable loop_info->n_iterations. */
5870 else if ((GET_MODE_BITSIZE (GET_MODE (iteration_var))
5871 > HOST_BITS_PER_WIDE_INT))
5873 if (loop_dump_stream)
5874 fprintf (loop_dump_stream,
5875 "Loop iterations: Iteration var rejected because mode too large.\n");
5876 return 0;
5878 else if (GET_MODE_CLASS (GET_MODE (iteration_var)) != MODE_INT)
5880 if (loop_dump_stream)
5881 fprintf (loop_dump_stream,
5882 "Loop iterations: Iteration var not an integer.\n");
5883 return 0;
5886 /* Try swapping the comparison to identify a suitable iv. */
5887 if (REG_IV_TYPE (ivs, REGNO (iteration_var)) != BASIC_INDUCT
5888 && REG_IV_TYPE (ivs, REGNO (iteration_var)) != GENERAL_INDUCT
5889 && REG_P (comparison_value)
5890 && REGNO (comparison_value) < ivs->n_regs)
5892 rtx temp = comparison_value;
5893 comparison_code = swap_condition (comparison_code);
5894 comparison_value = iteration_var;
5895 iteration_var = temp;
5898 if (REG_IV_TYPE (ivs, REGNO (iteration_var)) == BASIC_INDUCT)
5900 gcc_assert (REGNO (iteration_var) < ivs->n_regs);
5902 /* Grab initial value, only useful if it is a constant. */
5903 bl = REG_IV_CLASS (ivs, REGNO (iteration_var));
5904 initial_value = bl->initial_value;
5905 if (!bl->biv->always_executed || bl->biv->maybe_multiple)
5907 if (loop_dump_stream)
5908 fprintf (loop_dump_stream,
5909 "Loop iterations: Basic induction var not set once in each iteration.\n");
5910 return 0;
5913 increment = biv_total_increment (bl);
5915 else if (REG_IV_TYPE (ivs, REGNO (iteration_var)) == GENERAL_INDUCT)
5917 HOST_WIDE_INT offset = 0;
5918 struct induction *v = REG_IV_INFO (ivs, REGNO (iteration_var));
5919 rtx biv_initial_value;
5921 gcc_assert (REGNO (v->src_reg) < ivs->n_regs);
5923 if (!v->always_executed || v->maybe_multiple)
5925 if (loop_dump_stream)
5926 fprintf (loop_dump_stream,
5927 "Loop iterations: General induction var not set once in each iteration.\n");
5928 return 0;
5931 bl = REG_IV_CLASS (ivs, REGNO (v->src_reg));
5933 /* Increment value is mult_val times the increment value of the biv. */
5935 increment = biv_total_increment (bl);
5936 if (increment)
5938 struct induction *biv_inc;
5940 increment = fold_rtx_mult_add (v->mult_val,
5941 extend_value_for_giv (v, increment),
5942 const0_rtx, v->mode);
5943 /* The caller assumes that one full increment has occurred at the
5944 first loop test. But that's not true when the biv is incremented
5945 after the giv is set (which is the usual case), e.g.:
5946 i = 6; do {;} while (i++ < 9).
5947 Therefore, we bias the initial value by subtracting the amount of
5948 the increment that occurs between the giv set and the giv test. */
5949 for (biv_inc = bl->biv; biv_inc; biv_inc = biv_inc->next_iv)
5951 if (loop_insn_first_p (v->insn, biv_inc->insn))
5953 if (REG_P (biv_inc->add_val))
5955 if (loop_dump_stream)
5956 fprintf (loop_dump_stream,
5957 "Loop iterations: Basic induction var add_val is REG %d.\n",
5958 REGNO (biv_inc->add_val));
5959 return 0;
5962 /* If we have already counted it, skip it. */
5963 if (biv_inc->same)
5964 continue;
5966 offset -= INTVAL (biv_inc->add_val);
5970 if (loop_dump_stream)
5971 fprintf (loop_dump_stream,
5972 "Loop iterations: Giv iterator, initial value bias %ld.\n",
5973 (long) offset);
5975 /* Initial value is mult_val times the biv's initial value plus
5976 add_val. Only useful if it is a constant. */
5977 biv_initial_value = extend_value_for_giv (v, bl->initial_value);
5978 initial_value
5979 = fold_rtx_mult_add (v->mult_val,
5980 plus_constant (biv_initial_value, offset),
5981 v->add_val, v->mode);
5983 else
5985 if (loop_dump_stream)
5986 fprintf (loop_dump_stream,
5987 "Loop iterations: Not basic or general induction var.\n");
5988 return 0;
5991 if (initial_value == 0)
5992 return 0;
5994 unsigned_p = 0;
5995 off_by_one = 0;
5996 switch (comparison_code)
5998 case LEU:
5999 unsigned_p = 1;
6000 case LE:
6001 compare_dir = 1;
6002 off_by_one = 1;
6003 break;
6004 case GEU:
6005 unsigned_p = 1;
6006 case GE:
6007 compare_dir = -1;
6008 off_by_one = -1;
6009 break;
6010 case EQ:
6011 /* Cannot determine loop iterations with this case. */
6012 compare_dir = 0;
6013 break;
6014 case LTU:
6015 unsigned_p = 1;
6016 case LT:
6017 compare_dir = 1;
6018 break;
6019 case GTU:
6020 unsigned_p = 1;
6021 case GT:
6022 compare_dir = -1;
6023 break;
6024 case NE:
6025 compare_dir = 0;
6026 break;
6027 default:
6028 gcc_unreachable ();
6031 /* If the comparison value is an invariant register, then try to find
6032 its value from the insns before the start of the loop. */
6034 final_value = comparison_value;
6035 if (REG_P (comparison_value)
6036 && loop_invariant_p (loop, comparison_value))
6038 final_value = loop_find_equiv_value (loop, comparison_value);
6040 /* If we don't get an invariant final value, we are better
6041 off with the original register. */
6042 if (! loop_invariant_p (loop, final_value))
6043 final_value = comparison_value;
6046 /* Calculate the approximate final value of the induction variable
6047 (on the last successful iteration). The exact final value
6048 depends on the branch operator, and increment sign. It will be
6049 wrong if the iteration variable is not incremented by one each
6050 time through the loop and (comparison_value + off_by_one -
6051 initial_value) % increment != 0.
6052 ??? Note that the final_value may overflow and thus final_larger
6053 will be bogus. A potentially infinite loop will be classified
6054 as immediate, e.g. for (i = 0x7ffffff0; i <= 0x7fffffff; i++) */
6055 if (off_by_one)
6056 final_value = plus_constant (final_value, off_by_one);
6058 /* Save the calculated values describing this loop's bounds, in case
6059 precondition_loop_p will need them later. These values can not be
6060 recalculated inside precondition_loop_p because strength reduction
6061 optimizations may obscure the loop's structure.
6063 These values are only required by precondition_loop_p and insert_bct
6064 whenever the number of iterations cannot be computed at compile time.
6065 Only the difference between final_value and initial_value is
6066 important. Note that final_value is only approximate. */
6067 loop_info->initial_value = initial_value;
6068 loop_info->comparison_value = comparison_value;
6069 loop_info->final_value = plus_constant (comparison_value, off_by_one);
6070 loop_info->increment = increment;
6071 loop_info->iteration_var = iteration_var;
6072 loop_info->comparison_code = comparison_code;
6073 loop_info->iv = bl;
6075 /* Try to determine the iteration count for loops such
6076 as (for i = init; i < init + const; i++). When running the
6077 loop optimization twice, the first pass often converts simple
6078 loops into this form. */
6080 if (REG_P (initial_value))
6082 rtx reg1;
6083 rtx reg2;
6084 rtx const2;
6086 reg1 = initial_value;
6087 if (GET_CODE (final_value) == PLUS)
6088 reg2 = XEXP (final_value, 0), const2 = XEXP (final_value, 1);
6089 else
6090 reg2 = final_value, const2 = const0_rtx;
6092 /* Check for initial_value = reg1, final_value = reg2 + const2,
6093 where reg1 != reg2. */
6094 if (REG_P (reg2) && reg2 != reg1)
6096 rtx temp;
6098 /* Find what reg1 is equivalent to. Hopefully it will
6099 either be reg2 or reg2 plus a constant. */
6100 temp = loop_find_equiv_value (loop, reg1);
6102 if (find_common_reg_term (temp, reg2))
6103 initial_value = temp;
6104 else if (loop_invariant_p (loop, reg2))
6106 /* Find what reg2 is equivalent to. Hopefully it will
6107 either be reg1 or reg1 plus a constant. Let's ignore
6108 the latter case for now since it is not so common. */
6109 temp = loop_find_equiv_value (loop, reg2);
6111 if (temp == loop_info->iteration_var)
6112 temp = initial_value;
6113 if (temp == reg1)
6114 final_value = (const2 == const0_rtx)
6115 ? reg1 : gen_rtx_PLUS (GET_MODE (reg1), reg1, const2);
6120 loop_info->initial_equiv_value = initial_value;
6121 loop_info->final_equiv_value = final_value;
6123 /* For EQ comparison loops, we don't have a valid final value.
6124 Check this now so that we won't leave an invalid value if we
6125 return early for any other reason. */
6126 if (comparison_code == EQ)
6127 loop_info->final_equiv_value = loop_info->final_value = 0;
6129 if (increment == 0)
6131 if (loop_dump_stream)
6132 fprintf (loop_dump_stream,
6133 "Loop iterations: Increment value can't be calculated.\n");
6134 return 0;
6137 if (GET_CODE (increment) != CONST_INT)
6139 /* If we have a REG, check to see if REG holds a constant value. */
6140 /* ??? Other RTL, such as (neg (reg)) is possible here, but it isn't
6141 clear if it is worthwhile to try to handle such RTL. */
6142 if (REG_P (increment) || GET_CODE (increment) == SUBREG)
6143 increment = loop_find_equiv_value (loop, increment);
6145 if (GET_CODE (increment) != CONST_INT)
6147 if (loop_dump_stream)
6149 fprintf (loop_dump_stream,
6150 "Loop iterations: Increment value not constant ");
6151 print_simple_rtl (loop_dump_stream, increment);
6152 fprintf (loop_dump_stream, ".\n");
6154 return 0;
6156 loop_info->increment = increment;
6159 if (GET_CODE (initial_value) != CONST_INT)
6161 if (loop_dump_stream)
6163 fprintf (loop_dump_stream,
6164 "Loop iterations: Initial value not constant ");
6165 print_simple_rtl (loop_dump_stream, initial_value);
6166 fprintf (loop_dump_stream, ".\n");
6168 return 0;
6170 else if (GET_CODE (final_value) != CONST_INT)
6172 if (loop_dump_stream)
6174 fprintf (loop_dump_stream,
6175 "Loop iterations: Final value not constant ");
6176 print_simple_rtl (loop_dump_stream, final_value);
6177 fprintf (loop_dump_stream, ".\n");
6179 return 0;
6181 else if (comparison_code == EQ)
6183 rtx inc_once;
6185 if (loop_dump_stream)
6186 fprintf (loop_dump_stream, "Loop iterations: EQ comparison loop.\n");
6188 inc_once = gen_int_mode (INTVAL (initial_value) + INTVAL (increment),
6189 GET_MODE (iteration_var));
6191 if (inc_once == final_value)
6193 /* The iterator value once through the loop is equal to the
6194 comparison value. Either we have an infinite loop, or
6195 we'll loop twice. */
6196 if (increment == const0_rtx)
6197 return 0;
6198 loop_info->n_iterations = 2;
6200 else
6201 loop_info->n_iterations = 1;
6203 if (GET_CODE (loop_info->initial_value) == CONST_INT)
6204 loop_info->final_value
6205 = gen_int_mode ((INTVAL (loop_info->initial_value)
6206 + loop_info->n_iterations * INTVAL (increment)),
6207 GET_MODE (iteration_var));
6208 else
6209 loop_info->final_value
6210 = plus_constant (loop_info->initial_value,
6211 loop_info->n_iterations * INTVAL (increment));
6212 loop_info->final_equiv_value
6213 = gen_int_mode ((INTVAL (initial_value)
6214 + loop_info->n_iterations * INTVAL (increment)),
6215 GET_MODE (iteration_var));
6216 return loop_info->n_iterations;
6219 /* Final_larger is 1 if final larger, 0 if they are equal, otherwise -1. */
6220 if (unsigned_p)
6221 final_larger
6222 = ((unsigned HOST_WIDE_INT) INTVAL (final_value)
6223 > (unsigned HOST_WIDE_INT) INTVAL (initial_value))
6224 - ((unsigned HOST_WIDE_INT) INTVAL (final_value)
6225 < (unsigned HOST_WIDE_INT) INTVAL (initial_value));
6226 else
6227 final_larger = (INTVAL (final_value) > INTVAL (initial_value))
6228 - (INTVAL (final_value) < INTVAL (initial_value));
6230 if (INTVAL (increment) > 0)
6231 increment_dir = 1;
6232 else if (INTVAL (increment) == 0)
6233 increment_dir = 0;
6234 else
6235 increment_dir = -1;
6237 /* There are 27 different cases: compare_dir = -1, 0, 1;
6238 final_larger = -1, 0, 1; increment_dir = -1, 0, 1.
6239 There are 4 normal cases, 4 reverse cases (where the iteration variable
6240 will overflow before the loop exits), 4 infinite loop cases, and 15
6241 immediate exit (0 or 1 iteration depending on loop type) cases.
6242 Only try to optimize the normal cases. */
6244 /* (compare_dir/final_larger/increment_dir)
6245 Normal cases: (0/-1/-1), (0/1/1), (-1/-1/-1), (1/1/1)
6246 Reverse cases: (0/-1/1), (0/1/-1), (-1/-1/1), (1/1/-1)
6247 Infinite loops: (0/-1/0), (0/1/0), (-1/-1/0), (1/1/0)
6248 Immediate exit: (0/0/X), (-1/0/X), (-1/1/X), (1/0/X), (1/-1/X) */
6250 /* ?? If the meaning of reverse loops (where the iteration variable
6251 will overflow before the loop exits) is undefined, then we could
6252 eliminate all of these special checks, and just always assume
6253 the loops are normal/immediate/infinite. Note that this means
6254 the sign of increment_dir does not have to be known. Also,
6255 since it does not really hurt if immediate exit loops or infinite loops
6256 are optimized, then that case could be ignored also, and hence all
6257 loops can be optimized.
6259 According to ANSI Spec, the reverse loop case result is undefined,
6260 because the action on overflow is undefined.
6262 See also the special test for NE loops below. */
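/* Illustrative classification (editor's note): a loop such as
     for (i = 0; i < 10; i++)
   has comparison code LT, so compare_dir = 1; the final value 10 is
   larger than the initial value 0, so final_larger = 1; and the
   increment is positive, so increment_dir = 1.  (1/1/1) is one of
   the normal cases accepted below.  */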
6264 if (final_larger == increment_dir && final_larger != 0
6265 && (final_larger == compare_dir || compare_dir == 0))
6266 /* Normal case. */
6268 else
6270 if (loop_dump_stream)
6271 fprintf (loop_dump_stream, "Loop iterations: Not normal loop.\n");
6272 return 0;
6275 /* Calculate the number of iterations, final_value is only an approximation,
6276 so correct for that. Note that abs_diff and n_iterations are
6277 unsigned, because they can be as large as 2^n - 1. */
6279 inc = INTVAL (increment);
6280 gcc_assert (inc);
6281 if (inc > 0)
6283 abs_diff = INTVAL (final_value) - INTVAL (initial_value);
6284 abs_inc = inc;
6286 else
6288 abs_diff = INTVAL (initial_value) - INTVAL (final_value);
6289 abs_inc = -inc;
6292 /* Given that iteration_var is going to iterate over its own mode,
6293 not HOST_WIDE_INT, disregard higher bits that might have come
6294 into the picture due to sign extension of initial and final
6295 values. */
6296 abs_diff &= ((unsigned HOST_WIDE_INT) 1
6297 << (GET_MODE_BITSIZE (GET_MODE (iteration_var)) - 1)
6298 << 1) - 1;
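/* Worked example (editor's note): for a QImode iteration variable
   GET_MODE_BITSIZE is 8, so the mask above is
   ((unsigned HOST_WIDE_INT) 1 << 7 << 1) - 1 == 0xff and abs_diff
   keeps only its low eight bits, discarding bits that only arose
   from sign extension of the initial and final values.  */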
6300 /* For NE tests, make sure that the iteration variable won't miss
6301 the final value. If abs_diff mod abs_incr is not zero, then the
6302 iteration variable will overflow before the loop exits, and we
6303 can not calculate the number of iterations. */
6304 if (compare_dir == 0 && (abs_diff % abs_inc) != 0)
6305 return 0;
6307 /* Note that the number of iterations could be calculated using
6308 (abs_diff + abs_inc - 1) / abs_inc, provided care was taken to
6309 handle potential overflow of the summation. */
6310 loop_info->n_iterations = abs_diff / abs_inc + ((abs_diff % abs_inc) != 0);
6311 return loop_info->n_iterations;
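/* Worked example (editor's note): for
     for (i = 0; i < 10; i += 3)
   we get initial_value = 0, final_value = 10 and increment = 3, so
   abs_diff = 10, abs_inc = 3 and n_iterations = 10/3 + (10 % 3 != 0)
   = 4, matching i = 0, 3, 6, 9.  With the test i != 10 instead,
   compare_dir would be 0 and the abs_diff % abs_inc check above
   would reject the loop, since i steps from 9 to 12 and misses the
   final value.  */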
6314 /* Perform strength reduction and induction variable elimination.
6316 Pseudo registers created during this function will be beyond the
6317 last valid index in several tables including
6318 REGS->ARRAY[I].N_TIMES_SET and REGNO_LAST_UID. This does not cause a
6319 problem here, because the added registers cannot be givs outside of
6320 their loop, and hence will never be reconsidered. But scan_loop
6321 must check regnos to make sure they are in bounds. */
6323 static void
6324 strength_reduce (struct loop *loop, int flags)
6326 struct loop_info *loop_info = LOOP_INFO (loop);
6327 struct loop_regs *regs = LOOP_REGS (loop);
6328 struct loop_ivs *ivs = LOOP_IVS (loop);
6329 rtx p;
6330 /* Temporary list pointer for traversing ivs->list. */
6331 struct iv_class *bl;
6332 /* Ratio of extra register life span we can justify
6333 for saving an instruction. More if loop doesn't call subroutines
6334 since in that case saving an insn makes more difference
6335 and more registers are available. */
6336 /* ??? could set this to last value of threshold in move_movables */
6337 int threshold = (loop_info->has_call ? 1 : 2) * (3 + n_non_fixed_regs);
6338 /* Map of pseudo-register replacements. */
6339 rtx *reg_map = NULL;
6340 int reg_map_size;
6341 rtx test_reg = gen_rtx_REG (word_mode, LAST_VIRTUAL_REGISTER + 1);
6342 int insn_count = count_insns_in_loop (loop);
6344 addr_placeholder = gen_reg_rtx (Pmode);
6346 ivs->n_regs = max_reg_before_loop;
6347 ivs->regs = xcalloc (ivs->n_regs, sizeof (struct iv));
6349 /* Find all BIVs in loop. */
6350 loop_bivs_find (loop);
6352 /* Exit if there are no bivs. */
6353 if (! ivs->list)
6355 loop_ivs_free (loop);
6356 return;
6359 /* Determine how BIVS are initialized by looking through pre-header
6360 extended basic block. */
6361 loop_bivs_init_find (loop);
6363 /* Look at each biv and see if we can say anything better about its
6364 initial value from any initializing insns set up above. */
6365 loop_bivs_check (loop);
6367 /* Search the loop for general induction variables. */
6368 loop_givs_find (loop);
6370 /* Try to calculate and save the number of loop iterations. This is
6371 set to zero if the actual number can not be calculated. This must
6372 be called after all giv's have been identified, since otherwise it may
6373 fail if the iteration variable is a giv. */
6374 loop_iterations (loop);
6376 #ifdef HAVE_prefetch
6377 if (flags & LOOP_PREFETCH)
6378 emit_prefetch_instructions (loop);
6379 #endif
6381 /* Now for each giv for which we still don't know whether or not it is
6382 replaceable, check to see if it is replaceable because its final value
6383 can be calculated. This must be done after loop_iterations is called,
6384 so that final_giv_value will work correctly. */
6385 loop_givs_check (loop);
6387 /* Try to prove that the loop counter variable (if any) is always
6388 nonnegative; if so, record that fact with a REG_NONNEG note
6389 so that "decrement and branch until zero" insn can be used. */
6390 check_dbra_loop (loop, insn_count);
6392 /* Create reg_map to hold substitutions for replaceable giv regs.
6393 Some givs might have been made from biv increments, so look at
6394 ivs->reg_iv_type for a suitable size. */
6395 reg_map_size = ivs->n_regs;
6396 reg_map = xcalloc (reg_map_size, sizeof (rtx));
6398 /* Examine each iv class for feasibility of strength reduction/induction
6399 variable elimination. */
6401 for (bl = ivs->list; bl; bl = bl->next)
6403 struct induction *v;
6404 int benefit;
6406 /* Test whether it will be possible to eliminate this biv
6407 provided all givs are reduced. */
6408 bl->eliminable = loop_biv_eliminable_p (loop, bl, threshold, insn_count);
6410 /* This will be true at the end, if all givs which depend on this
6411 biv have been strength reduced.
6412 We can't (currently) eliminate the biv unless this is so. */
6413 bl->all_reduced = 1;
6415 /* Check each extension dependent giv in this class to see if its
6416 root biv is safe from wrapping in the interior mode. */
6417 check_ext_dependent_givs (loop, bl);
6419 /* Combine all giv's for this iv_class. */
6420 combine_givs (regs, bl);
6422 for (v = bl->giv; v; v = v->next_iv)
6424 struct induction *tv;
6426 if (v->ignore || v->same)
6427 continue;
6429 benefit = loop_giv_reduce_benefit (loop, bl, v, test_reg);
6431 /* If an insn is not to be strength reduced, then set its ignore
6432 flag, and clear bl->all_reduced. */
6434 /* A giv that depends on a reversed biv must be reduced if it is
6435 used after the loop exit, otherwise, it would have the wrong
6436 value after the loop exit. To make it simple, just reduce all
6437 of such giv's whether or not we know they are used after the loop
6438 exit. */
6440 if (v->lifetime * threshold * benefit < insn_count
6441 && ! bl->reversed)
6443 if (loop_dump_stream)
6444 fprintf (loop_dump_stream,
6445 "giv of insn %d not worth while, %d vs %d.\n",
6446 INSN_UID (v->insn),
6447 v->lifetime * threshold * benefit, insn_count);
6448 v->ignore = 1;
6449 bl->all_reduced = 0;
6451 else
6453 /* Check that we can increment the reduced giv without a
6454 multiply insn. If not, reject it. */
6456 for (tv = bl->biv; tv; tv = tv->next_iv)
6457 if (tv->mult_val == const1_rtx
6458 && ! product_cheap_p (tv->add_val, v->mult_val))
6460 if (loop_dump_stream)
6461 fprintf (loop_dump_stream,
6462 "giv of insn %d: would need a multiply.\n",
6463 INSN_UID (v->insn));
6464 v->ignore = 1;
6465 bl->all_reduced = 0;
6466 break;
6471 /* Check for givs whose first use is their definition and whose
6472 last use is the definition of another giv. If so, it is likely
6473 dead and should not be used to derive another giv nor to
6474 eliminate a biv. */
6475 loop_givs_dead_check (loop, bl);
6477 /* Reduce each giv that we decided to reduce. */
6478 loop_givs_reduce (loop, bl);
6480 /* Rescan all givs. If a giv is the same as a giv not reduced, mark it
6481 as not reduced.
6483 For each giv register that can be reduced now: if replaceable,
6484 substitute reduced reg wherever the old giv occurs;
6485 else add new move insn "giv_reg = reduced_reg". */
6486 loop_givs_rescan (loop, bl, reg_map);
6488 /* All the givs based on the biv bl have been reduced if they
6489 merit it. */
6491 /* For each giv not marked as maybe dead that has been combined with a
6492 second giv, clear any "maybe dead" mark on that second giv.
6493 v->new_reg will either be or refer to the register of the giv it
6494 combined with.
6496 Doing this clearing avoids problems in biv elimination where
6497 a giv's new_reg is a complex value that can't be put in the
6498 insn but the giv combined with (with a reg as new_reg) is
6499 marked maybe_dead. Since the register will be used in either
6500 case, we'd prefer it be used from the simpler giv. */
6502 for (v = bl->giv; v; v = v->next_iv)
6503 if (! v->maybe_dead && v->same)
6504 v->same->maybe_dead = 0;
6506 /* Try to eliminate the biv, if it is a candidate.
6507 This won't work if ! bl->all_reduced,
6508 since the givs we planned to use might not have been reduced.
6510 We have to be careful that we didn't initially think we could
6511 eliminate this biv because of a giv that we now think may be
6512 dead and shouldn't be used as a biv replacement.
6514 Also, there is the possibility that we may have a giv that looks
6515 like it can be used to eliminate a biv, but the resulting insn
6516 isn't valid. This can happen, for example, on the 88k, where a
6517 JUMP_INSN can compare a register only with zero. Attempts to
6518 replace it with a compare with a constant will fail.
6520 Note that in cases where this call fails, we may have replaced some
6521 of the occurrences of the biv with a giv, but no harm was done in
6522 doing so in the rare cases where it can occur. */
6524 if (bl->all_reduced == 1 && bl->eliminable
6525 && maybe_eliminate_biv (loop, bl, 1, threshold, insn_count))
6527 /* ?? If we created a new test to bypass the loop entirely,
6528 or otherwise drop straight in, based on this test, then
6529 we might want to rewrite it also. This way some later
6530 pass has more hope of removing the initialization of this
6531 biv entirely. */
6533 /* If final_value != 0, then the biv may be used after loop end
6534 and we must emit an insn to set it just in case.
6536 Reversed bivs already have an insn after the loop setting their
6537 value, so we don't need another one. We can't calculate the
6538 proper final value for such a biv here anyways. */
6539 if (bl->final_value && ! bl->reversed)
6540 loop_insn_sink_or_swim (loop,
6541 gen_load_of_final_value (bl->biv->dest_reg,
6542 bl->final_value));
6544 if (loop_dump_stream)
6545 fprintf (loop_dump_stream, "Reg %d: biv eliminated\n",
6546 bl->regno);
6548 /* See above note wrt final_value. But since we couldn't eliminate
6549 the biv, we must set the value after the loop instead of before. */
6550 else if (bl->final_value && ! bl->reversed)
6551 loop_insn_sink (loop, gen_load_of_final_value (bl->biv->dest_reg,
6552 bl->final_value));
6555 /* Go through all the instructions in the loop, making all the
6556 register substitutions scheduled in REG_MAP. */
6558 for (p = loop->start; p != loop->end; p = NEXT_INSN (p))
6559 if (INSN_P (p))
6561 replace_regs (PATTERN (p), reg_map, reg_map_size, 0);
6562 replace_regs (REG_NOTES (p), reg_map, reg_map_size, 0);
6563 INSN_CODE (p) = -1;
6566 if (loop_dump_stream)
6567 fprintf (loop_dump_stream, "\n");
6569 loop_ivs_free (loop);
6570 if (reg_map)
6571 free (reg_map);
6574 /* Record all basic induction variables calculated in the insn.  */
6575 static rtx
6576 check_insn_for_bivs (struct loop *loop, rtx p, int not_every_iteration,
6577 int maybe_multiple)
6579 struct loop_ivs *ivs = LOOP_IVS (loop);
6580 rtx set;
6581 rtx dest_reg;
6582 rtx inc_val;
6583 rtx mult_val;
6584 rtx *location;
6586 if (NONJUMP_INSN_P (p)
6587 && (set = single_set (p))
6588 && REG_P (SET_DEST (set)))
6590 dest_reg = SET_DEST (set);
6591 if (REGNO (dest_reg) < max_reg_before_loop
6592 && REGNO (dest_reg) >= FIRST_PSEUDO_REGISTER
6593 && REG_IV_TYPE (ivs, REGNO (dest_reg)) != NOT_BASIC_INDUCT)
6595 if (basic_induction_var (loop, SET_SRC (set),
6596 GET_MODE (SET_SRC (set)),
6597 dest_reg, p, &inc_val, &mult_val,
6598 &location))
6600 /* It is a possible basic induction variable.
6601 Create and initialize an induction structure for it. */
6603 struct induction *v = xmalloc (sizeof (struct induction));
6605 record_biv (loop, v, p, dest_reg, inc_val, mult_val, location,
6606 not_every_iteration, maybe_multiple);
6607 REG_IV_TYPE (ivs, REGNO (dest_reg)) = BASIC_INDUCT;
6609 else if (REGNO (dest_reg) < ivs->n_regs)
6610 REG_IV_TYPE (ivs, REGNO (dest_reg)) = NOT_BASIC_INDUCT;
6613 return p;
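/* Illustrative example (editor's note; register numbers made up):
   a source statement such as
     i = i + 4;
   appears as the single set
     (set (reg 65) (plus (reg 65) (const_int 4)))
   and is recorded as a biv with inc_val = (const_int 4) and
   mult_val = const1_rtx.  */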
6616 /* Record all givs calculated in the insn.
6617 A register is a giv if: it is only set once, it is a function of a
6618 biv and a constant (or invariant), and it is not a biv. */
6619 static rtx
6620 check_insn_for_givs (struct loop *loop, rtx p, int not_every_iteration,
6621 int maybe_multiple)
6623 struct loop_regs *regs = LOOP_REGS (loop);
6625 rtx set;
6626 /* Look for a general induction variable in a register. */
6627 if (NONJUMP_INSN_P (p)
6628 && (set = single_set (p))
6629 && REG_P (SET_DEST (set))
6630 && ! regs->array[REGNO (SET_DEST (set))].may_not_optimize)
6632 rtx src_reg;
6633 rtx dest_reg;
6634 rtx add_val;
6635 rtx mult_val;
6636 rtx ext_val;
6637 int benefit;
6638 rtx regnote = 0;
6639 rtx last_consec_insn;
6641 dest_reg = SET_DEST (set);
6642 if (REGNO (dest_reg) < FIRST_PSEUDO_REGISTER)
6643 return p;
6645 if (/* SET_SRC is a giv. */
6646 (general_induction_var (loop, SET_SRC (set), &src_reg, &add_val,
6647 &mult_val, &ext_val, 0, &benefit, VOIDmode)
6648 /* Equivalent expression is a giv. */
6649 || ((regnote = find_reg_note (p, REG_EQUAL, NULL_RTX))
6650 && general_induction_var (loop, XEXP (regnote, 0), &src_reg,
6651 &add_val, &mult_val, &ext_val, 0,
6652 &benefit, VOIDmode)))
6653 /* Don't try to handle any regs made by loop optimization.
6654 We have nothing on them in regno_first_uid, etc. */
6655 && REGNO (dest_reg) < max_reg_before_loop
6656 /* Don't recognize a BASIC_INDUCT_VAR here. */
6657 && dest_reg != src_reg
6658 /* This must be the only place where the register is set. */
6659 && (regs->array[REGNO (dest_reg)].n_times_set == 1
6660 /* or all sets must be consecutive and make a giv. */
6661 || (benefit = consec_sets_giv (loop, benefit, p,
6662 src_reg, dest_reg,
6663 &add_val, &mult_val, &ext_val,
6664 &last_consec_insn))))
6666 struct induction *v = xmalloc (sizeof (struct induction));
6668 /* If this is a library call, increase benefit. */
6669 if (find_reg_note (p, REG_RETVAL, NULL_RTX))
6670 benefit += libcall_benefit (p);
6672 /* Skip the consecutive insns, if there are any. */
6673 if (regs->array[REGNO (dest_reg)].n_times_set != 1)
6674 p = last_consec_insn;
6676 record_giv (loop, v, p, src_reg, dest_reg, mult_val, add_val,
6677 ext_val, benefit, DEST_REG, not_every_iteration,
6678 maybe_multiple, (rtx*) 0);
6683 /* Look for givs which are memory addresses. */
6684 if (NONJUMP_INSN_P (p))
6685 find_mem_givs (loop, PATTERN (p), p, not_every_iteration,
6686 maybe_multiple);
6688 /* Update the status of whether giv can derive other givs. This can
6689 change when we pass a label or an insn that updates a biv. */
6690 if (INSN_P (p) || LABEL_P (p))
6691 update_giv_derive (loop, p);
6692 return p;
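/* Illustrative example (editor's note; register numbers made up):
   with the biv i in (reg 65), a statement such as
     p = i * 4 + 100;
   becomes
     (set (reg 66) (plus (mult (reg 65) (const_int 4))
                         (const_int 100)))
   and is recorded as a DEST_REG giv with src_reg = (reg 65),
   mult_val = (const_int 4) and add_val = (const_int 100).  */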
6695 /* Return 1 if X is a valid source for an initial value (or as value being
6696 compared against in an initial test).
6698 X must be either a register or constant and must not be clobbered between
6699 the current insn and the start of the loop.
6701 INSN is the insn containing X. */
6703 static int
6704 valid_initial_value_p (rtx x, rtx insn, int call_seen, rtx loop_start)
6706 if (CONSTANT_P (x))
6707 return 1;
6709 /* Only consider pseudos we know about, initialized in insns whose luids
6710 we know. */
6711 if (!REG_P (x)
6712 || REGNO (x) >= max_reg_before_loop)
6713 return 0;
6715 /* Don't use call-clobbered registers across a call which clobbers it. On
6716 some machines, don't use any hard registers at all. */
6717 if (REGNO (x) < FIRST_PSEUDO_REGISTER
6718 && (SMALL_REGISTER_CLASSES
6719 || (call_used_regs[REGNO (x)] && call_seen)))
6720 return 0;
6722 /* Don't use registers that have been clobbered before the start of the
6723 loop. */
6724 if (reg_set_between_p (x, insn, loop_start))
6725 return 0;
6727 return 1;
6730 /* Scan X for memory refs and check each memory address
6731 as a possible giv. INSN is the insn whose pattern X comes from.
6732 NOT_EVERY_ITERATION is 1 if the insn might not be executed during
6733 every loop iteration. MAYBE_MULTIPLE is 1 if the insn might be executed
6734 more than once in each loop iteration. */
6736 static void
6737 find_mem_givs (const struct loop *loop, rtx x, rtx insn,
6738 int not_every_iteration, int maybe_multiple)
6740 int i, j;
6741 enum rtx_code code;
6742 const char *fmt;
6744 if (x == 0)
6745 return;
6747 code = GET_CODE (x);
6748 switch (code)
6750 case REG:
6751 case CONST_INT:
6752 case CONST:
6753 case CONST_DOUBLE:
6754 case SYMBOL_REF:
6755 case LABEL_REF:
6756 case PC:
6757 case CC0:
6758 case ADDR_VEC:
6759 case ADDR_DIFF_VEC:
6760 case USE:
6761 case CLOBBER:
6762 return;
6764 case MEM:
6766 rtx src_reg;
6767 rtx add_val;
6768 rtx mult_val;
6769 rtx ext_val;
6770 int benefit;
6772 /* This code used to disable creating GIVs with mult_val == 1 and
6773 add_val == 0. However, this leads to lost optimizations when
6774 it comes time to combine a set of related DEST_ADDR GIVs, since
6775 this one would not be seen. */
6777 if (general_induction_var (loop, XEXP (x, 0), &src_reg, &add_val,
6778 &mult_val, &ext_val, 1, &benefit,
6779 GET_MODE (x)))
6781 /* Found one; record it. */
6782 struct induction *v = xmalloc (sizeof (struct induction));
6784 record_giv (loop, v, insn, src_reg, addr_placeholder, mult_val,
6785 add_val, ext_val, benefit, DEST_ADDR,
6786 not_every_iteration, maybe_multiple, &XEXP (x, 0));
6788 v->mem = x;
6791 return;
6793 default:
6794 break;
6797 /* Recursively scan the subexpressions for other mem refs. */
6799 fmt = GET_RTX_FORMAT (code);
6800 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
6801 if (fmt[i] == 'e')
6802 find_mem_givs (loop, XEXP (x, i), insn, not_every_iteration,
6803 maybe_multiple);
6804 else if (fmt[i] == 'E')
6805 for (j = 0; j < XVECLEN (x, i); j++)
6806 find_mem_givs (loop, XVECEXP (x, i, j), insn, not_every_iteration,
6807 maybe_multiple);
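/* Illustrative example (editor's note; register numbers made up):
   a reference a[i] in the loop body might produce
     (mem:SI (plus (mult (reg 65) (const_int 4)) (reg 64)))
   whose address general_induction_var recognizes, so a DEST_ADDR
   giv is recorded with dest_reg = addr_placeholder and v->location
   pointing at the address, &XEXP (x, 0).  */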
6810 /* Fill in the data about one biv update.
6811 V is the `struct induction' in which we record the biv. (It is
6812 allocated by the caller, with xmalloc.)
6813 INSN is the insn that sets it.
6814 DEST_REG is the biv's reg.
6816 MULT_VAL is const1_rtx if the biv is being incremented here, in which case
6817 INC_VAL is the increment. Otherwise, MULT_VAL is const0_rtx and the biv is
6818 being set to INC_VAL.
6820 NOT_EVERY_ITERATION is nonzero if this biv update is not known to be
6821 executed every iteration; MAYBE_MULTIPLE is nonzero if this biv update
6822 can be executed more than once per iteration. If MAYBE_MULTIPLE
6823 and NOT_EVERY_ITERATION are both zero, we know that the biv update is
6824 executed exactly once per iteration. */
6826 static void
6827 record_biv (struct loop *loop, struct induction *v, rtx insn, rtx dest_reg,
6828 rtx inc_val, rtx mult_val, rtx *location,
6829 int not_every_iteration, int maybe_multiple)
6831 struct loop_ivs *ivs = LOOP_IVS (loop);
6832 struct iv_class *bl;
6834 v->insn = insn;
6835 v->src_reg = dest_reg;
6836 v->dest_reg = dest_reg;
6837 v->mult_val = mult_val;
6838 v->add_val = inc_val;
6839 v->ext_dependent = NULL_RTX;
6840 v->location = location;
6841 v->mode = GET_MODE (dest_reg);
6842 v->always_computable = ! not_every_iteration;
6843 v->always_executed = ! not_every_iteration;
6844 v->maybe_multiple = maybe_multiple;
6845 v->same = 0;
6847 /* Add this to the reg's iv_class, creating a class
6848 if this is the first incrementation of the reg. */
6850 bl = REG_IV_CLASS (ivs, REGNO (dest_reg));
6851 if (bl == 0)
6853 /* Create and initialize new iv_class. */
6855 bl = xmalloc (sizeof (struct iv_class));
6857 bl->regno = REGNO (dest_reg);
6858 bl->biv = 0;
6859 bl->giv = 0;
6860 bl->biv_count = 0;
6861 bl->giv_count = 0;
6863 /* Set initial value to the reg itself. */
6864 bl->initial_value = dest_reg;
6865 bl->final_value = 0;
6866 /* We haven't seen the initializing insn yet. */
6867 bl->init_insn = 0;
6868 bl->init_set = 0;
6869 bl->initial_test = 0;
6870 bl->incremented = 0;
6871 bl->eliminable = 0;
6872 bl->nonneg = 0;
6873 bl->reversed = 0;
6874 bl->total_benefit = 0;
6876 /* Add this class to ivs->list. */
6877 bl->next = ivs->list;
6878 ivs->list = bl;
6880 /* Put it in the array of biv register classes. */
6881 REG_IV_CLASS (ivs, REGNO (dest_reg)) = bl;
6883 else
6885 /* Check if location is the same as a previous one. */
6886 struct induction *induction;
6887 for (induction = bl->biv; induction; induction = induction->next_iv)
6888 if (location == induction->location)
6890 v->same = induction;
6891 break;
6895 /* Update IV_CLASS entry for this biv. */
6896 v->next_iv = bl->biv;
6897 bl->biv = v;
6898 bl->biv_count++;
6899 if (mult_val == const1_rtx)
6900 bl->incremented = 1;
6902 if (loop_dump_stream)
6903 loop_biv_dump (v, loop_dump_stream, 0);
6906 /* Fill in the data about one giv.
6907 V is the `struct induction' in which we record the giv. (It is
6908 allocated by the caller, with xmalloc.)
6909 INSN is the insn that sets it.
6910 BENEFIT estimates the savings from deleting this insn.
6911 TYPE is DEST_REG or DEST_ADDR; it says whether the giv is computed
6912 into a register or is used as a memory address.
6914 SRC_REG is the biv reg which the giv is computed from.
6915 DEST_REG is the giv's reg (if the giv is stored in a reg).
6916 MULT_VAL and ADD_VAL are the coefficients used to compute the giv.
6917 LOCATION points to the place where this giv's value appears in INSN. */
6919 static void
6920 record_giv (const struct loop *loop, struct induction *v, rtx insn,
6921 rtx src_reg, rtx dest_reg, rtx mult_val, rtx add_val,
6922 rtx ext_val, int benefit, enum g_types type,
6923 int not_every_iteration, int maybe_multiple, rtx *location)
6925 struct loop_ivs *ivs = LOOP_IVS (loop);
6926 struct induction *b;
6927 struct iv_class *bl;
6928 rtx set = single_set (insn);
6929 rtx temp;
6931 /* Attempt to prove constantness of the values. Don't let simplify_rtx
6932 undo the MULT canonicalization that we performed earlier. */
6933 temp = simplify_rtx (add_val);
6934 if (temp
6935 && ! (GET_CODE (add_val) == MULT
6936 && GET_CODE (temp) == ASHIFT))
6937 add_val = temp;
6939 v->insn = insn;
6940 v->src_reg = src_reg;
6941 v->giv_type = type;
6942 v->dest_reg = dest_reg;
6943 v->mult_val = mult_val;
6944 v->add_val = add_val;
6945 v->ext_dependent = ext_val;
6946 v->benefit = benefit;
6947 v->location = location;
6948 v->cant_derive = 0;
6949 v->combined_with = 0;
6950 v->maybe_multiple = maybe_multiple;
6951 v->maybe_dead = 0;
6952 v->derive_adjustment = 0;
6953 v->same = 0;
6954 v->ignore = 0;
6955 v->new_reg = 0;
6956 v->final_value = 0;
6957 v->same_insn = 0;
6958 v->auto_inc_opt = 0;
6959 v->shared = 0;
6961 /* The v->always_computable field is used in update_giv_derive, to
6962 determine whether a giv can be used to derive another giv. For a
6963 DEST_REG giv, INSN computes a new value for the giv, so its value
6964 isn't computable if INSN isn't executed every iteration.
6965 However, for a DEST_ADDR giv, INSN merely uses the value of the giv;
6966 it does not compute a new value. Hence the value is always computable
6967 regardless of whether INSN is executed each iteration. */
6969 if (type == DEST_ADDR)
6970 v->always_computable = 1;
6971 else
6972 v->always_computable = ! not_every_iteration;
6974 v->always_executed = ! not_every_iteration;
6976 if (type == DEST_ADDR)
6978 v->mode = GET_MODE (*location);
6979 v->lifetime = 1;
6981 else /* type == DEST_REG */
6983 v->mode = GET_MODE (SET_DEST (set));
6985 v->lifetime = LOOP_REG_LIFETIME (loop, REGNO (dest_reg));
6987 /* If the lifetime is zero, it means that this register is
6988 really a dead store. So mark this as a giv that can be
6989 ignored. This will not prevent the biv from being eliminated. */
6990 if (v->lifetime == 0)
6991 v->ignore = 1;
6993 REG_IV_TYPE (ivs, REGNO (dest_reg)) = GENERAL_INDUCT;
6994 REG_IV_INFO (ivs, REGNO (dest_reg)) = v;
6997 /* Add the giv to the class of givs computed from one biv. */
6999 bl = REG_IV_CLASS (ivs, REGNO (src_reg));
7000 gcc_assert (bl);
7001 v->next_iv = bl->giv;
7002 bl->giv = v;
7004 /* Don't count DEST_ADDR. This is supposed to count the number of
7005 insns that calculate givs. */
7006 if (type == DEST_REG)
7007 bl->giv_count++;
7008 bl->total_benefit += benefit;
7010 if (type == DEST_ADDR)
7012 v->replaceable = 1;
7013 v->not_replaceable = 0;
7015 else
7017 /* The giv can be replaced outright by the reduced register only if all
7018 of the following conditions are true:
7019 - the insn that sets the giv is always executed on any iteration
7020 on which the giv is used at all
7021 (there are two ways to deduce this:
7022 either the insn is executed on every iteration,
7023 or all uses follow that insn in the same basic block),
7024 - the giv is not used outside the loop
7025 - no assignments to the biv occur during the giv's lifetime. */
7027 if (REGNO_FIRST_UID (REGNO (dest_reg)) == INSN_UID (insn)
7028 /* Previous line always fails if INSN was moved by loop opt. */
7029 && REGNO_LAST_LUID (REGNO (dest_reg))
7030 < INSN_LUID (loop->end)
7031 && (! not_every_iteration
7032 || last_use_this_basic_block (dest_reg, insn)))
7034 /* Now check that there are no assignments to the biv within the
7035 giv's lifetime. This requires two separate checks. */
7037 /* Check each biv update, and fail if any are between the first
7038 and last use of the giv.
7040 If this loop contains an inner loop that was unrolled, then
7041 the insn modifying the biv may have been emitted by the loop
7042 unrolling code, and hence does not have a valid luid. Just
7043 mark the biv as not replaceable in this case. It is not very
7044 useful as a biv, because it is used in two different loops.
7045 It is very unlikely that we would be able to optimize the giv
7046 using this biv anyway. */
7048 v->replaceable = 1;
7049 v->not_replaceable = 0;
7050 for (b = bl->biv; b; b = b->next_iv)
7052 if (INSN_UID (b->insn) >= max_uid_for_loop
7053 || ((INSN_LUID (b->insn)
7054 >= REGNO_FIRST_LUID (REGNO (dest_reg)))
7055 && (INSN_LUID (b->insn)
7056 <= REGNO_LAST_LUID (REGNO (dest_reg)))))
7058 v->replaceable = 0;
7059 v->not_replaceable = 1;
7060 break;
7064 /* If there are any backwards branches that go from after the
7065 biv update to before it, then this giv is not replaceable. */
7066 if (v->replaceable)
7067 for (b = bl->biv; b; b = b->next_iv)
7068 if (back_branch_in_range_p (loop, b->insn))
7070 v->replaceable = 0;
7071 v->not_replaceable = 1;
7072 break;
7075 else
7077 /* May still be replaceable, we don't have enough info here to
7078 decide. */
7079 v->replaceable = 0;
7080 v->not_replaceable = 0;
7084 /* Record whether the add_val contains a const_int, for later use by
7085 combine_givs. */
7087 rtx tem = add_val;
7089 v->no_const_addval = 1;
7090 if (tem == const0_rtx)
7092 else if (CONSTANT_P (add_val))
7093 v->no_const_addval = 0;
7094 if (GET_CODE (tem) == PLUS)
7096 while (1)
7098 if (GET_CODE (XEXP (tem, 0)) == PLUS)
7099 tem = XEXP (tem, 0);
7100 else if (GET_CODE (XEXP (tem, 1)) == PLUS)
7101 tem = XEXP (tem, 1);
7102 else
7103 break;
7105 if (CONSTANT_P (XEXP (tem, 1)))
7106 v->no_const_addval = 0;
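/* Hypothetical example (editor's note): an add_val of
   (plus (reg 70) (const_int 4)) ends the walk above with a
   constant in XEXP (tem, 1), so no_const_addval is cleared; a
   bare (reg 70) leaves it set.  */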
7110 if (loop_dump_stream)
7111 loop_giv_dump (v, loop_dump_stream, 0);
7114 /* Try to calculate the final value of the giv, the value it will have at
7115 the end of the loop. If we can do it, return that value. */
7117 static rtx
7118 final_giv_value (const struct loop *loop, struct induction *v)
7120 struct loop_ivs *ivs = LOOP_IVS (loop);
7121 struct iv_class *bl;
7122 rtx insn;
7123 rtx increment, tem;
7124 rtx seq;
7125 rtx loop_end = loop->end;
7126 unsigned HOST_WIDE_INT n_iterations = LOOP_INFO (loop)->n_iterations;
7128 bl = REG_IV_CLASS (ivs, REGNO (v->src_reg));
7130 /* The final value for givs which depend on reversed bivs must be calculated
7131 differently than for ordinary givs. In this case, there is already an
7132 insn after the loop which sets this giv's final value (if necessary),
7133 and there are no other loop exits, so we can return any value. */
7134 if (bl->reversed)
7136 if (loop_dump_stream)
7137 fprintf (loop_dump_stream,
7138 "Final giv value for %d, depends on reversed biv\n",
7139 REGNO (v->dest_reg));
7140 return const0_rtx;
7143 /* Try to calculate the final value as a function of the biv it depends
7144 upon. The only exit from the loop must be the fall through at the bottom
7145 and the insn that sets the giv must be executed on every iteration
7146 (otherwise the giv may not have its final value when the loop exits). */
7148 /* ??? Can calculate the final giv value by subtracting off the
7149 extra biv increments times the giv's mult_val. The loop must have
7150 only one exit for this to work, but the number of loop iterations
7151 does not need to be known. */
7153 if (n_iterations != 0
7154 && ! loop->exit_count
7155 && v->always_executed)
7157 /* ?? It is tempting to use the biv's value here since these insns will
7158 be put after the loop, and hence the biv will have its final value
7159 then. However, this fails if the biv is subsequently eliminated.
7160 Perhaps determine whether biv's are eliminable before trying to
7161 determine whether giv's are replaceable so that we can use the
7162 biv value here if it is not eliminable. */
7164 /* We are emitting code after the end of the loop, so we must make
7165 sure that bl->initial_value is still valid then. It will still
7166 be valid if it is invariant. */
7168 increment = biv_total_increment (bl);
7170 if (increment && loop_invariant_p (loop, increment)
7171 && loop_invariant_p (loop, bl->initial_value))
7173 /* Can calculate the loop exit value of its biv as
7174 (n_iterations * increment) + initial_value */
7176 /* The loop exit value of the giv is then
7177 (final_biv_value - extra increments) * mult_val + add_val.
7178 The extra increments are any increments to the biv which
7179 occur in the loop after the giv's value is calculated.
7180 We must search from the insn that sets the giv to the end
7181 of the loop to calculate this value. */
7183 /* Put the final biv value in tem. */
7184 tem = gen_reg_rtx (v->mode);
7185 record_base_value (REGNO (tem), bl->biv->add_val, 0);
7186 loop_iv_add_mult_sink (loop, extend_value_for_giv (v, increment),
7187 GEN_INT (n_iterations),
7188 extend_value_for_giv (v, bl->initial_value),
7189 tem);
7191 /* Subtract off extra increments as we find them. */
7192 for (insn = NEXT_INSN (v->insn); insn != loop_end;
7193 insn = NEXT_INSN (insn))
7195 struct induction *biv;
7197 for (biv = bl->biv; biv; biv = biv->next_iv)
7198 if (biv->insn == insn)
7200 start_sequence ();
7201 tem = expand_simple_binop (GET_MODE (tem), MINUS, tem,
7202 biv->add_val, NULL_RTX, 0,
7203 OPTAB_LIB_WIDEN);
7204 seq = get_insns ();
7205 end_sequence ();
7206 loop_insn_sink (loop, seq);
7210 /* Now calculate the giv's final value. */
7211 loop_iv_add_mult_sink (loop, tem, v->mult_val, v->add_val, tem);
7213 if (loop_dump_stream)
7214 fprintf (loop_dump_stream,
7215 "Final giv value for %d, calc from biv's value.\n",
7216 REGNO (v->dest_reg));
7218 return tem;
7222 /* Replaceable giv's should never reach here. */
7223 gcc_assert (!v->replaceable);
7225 /* Check to see if the biv is dead at all loop exits. */
7226 if (reg_dead_after_loop (loop, v->dest_reg))
7228 if (loop_dump_stream)
7229 fprintf (loop_dump_stream,
7230 "Final giv value for %d, giv dead after loop exit.\n",
7231 REGNO (v->dest_reg));
7233 return const0_rtx;
7236 return 0;
7239 /* All this does is determine whether a giv can be made replaceable because
7240 its final value can be calculated. This code can not be part of record_giv
7241 above, because final_giv_value requires that the number of loop iterations
7242 be known, and that can not be accurately calculated until after all givs
7243 have been identified. */
7245 static void
7246 check_final_value (const struct loop *loop, struct induction *v)
7248 rtx final_value = 0;
7250 /* DEST_ADDR givs will never reach here, because they are always marked
7251 replaceable above in record_giv. */
7253 /* The giv can be replaced outright by the reduced register only if all
7254 of the following conditions are true:
7255 - the insn that sets the giv is always executed on any iteration
7256 on which the giv is used at all
7257 (there are two ways to deduce this:
7258 either the insn is executed on every iteration,
7259 or all uses follow that insn in the same basic block),
7260 - its final value can be calculated (this condition is different
7261 than the one above in record_giv)
- it's not used before it's set
7263 - no assignments to the biv occur during the giv's lifetime. */
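/* A hypothetical failure case: if the loop body computes g = 4*i,
   then increments the biv i, and only afterwards uses g, the biv
   assignment lies inside g's lifetime; substituting the reduced
   register for g at that use would observe the post-increment value
   of i, so the scan below must mark such a giv not_replaceable. */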
7265 #if 0
7266 /* This is only called now when replaceable is known to be false. */
7267 /* Clear replaceable, so that it won't confuse final_giv_value. */
7268 v->replaceable = 0;
7269 #endif
7271 if ((final_value = final_giv_value (loop, v))
7272 && (v->always_executed
7273 || last_use_this_basic_block (v->dest_reg, v->insn)))
7275 int biv_increment_seen = 0, before_giv_insn = 0;
7276 rtx p = v->insn;
7277 rtx last_giv_use;
7279 v->replaceable = 1;
7280 v->not_replaceable = 0;
7282 /* When trying to determine whether or not a biv increment occurs
7283 during the lifetime of the giv, we can ignore uses of the variable
7284 outside the loop because final_value is true. Hence we can not
7285 use regno_last_uid and regno_first_uid as above in record_giv. */
7287 /* Search the loop to determine whether any assignments to the
7288 biv occur during the giv's lifetime. Start with the insn
7289 that sets the giv, and search around the loop until we come
7290 back to that insn again.
7292 Also fail if there is a jump within the giv's lifetime that jumps
7293 to somewhere outside the lifetime but still within the loop. This
7294 catches spaghetti code where the execution order is not linear, and
7295 hence the above test fails. Here we assume that the giv lifetime
7296 does not extend from one iteration of the loop to the next, so as
7297 to make the test easier. Since the lifetime isn't known yet,
7298 this requires two loops. See also record_giv above. */
7300 last_giv_use = v->insn;
7302 while (1)
7304 p = NEXT_INSN (p);
7305 if (p == loop->end)
7307 before_giv_insn = 1;
7308 p = NEXT_INSN (loop->start);
7310 if (p == v->insn)
7311 break;
7313 if (INSN_P (p))
7315 /* It is possible for the BIV increment to use the GIV if we
7316 have a cycle. Thus we must be sure to check each insn for
7317 both BIV and GIV uses, and we must check for BIV uses
7318 first. */
7320 if (! biv_increment_seen
7321 && reg_set_p (v->src_reg, PATTERN (p)))
7322 biv_increment_seen = 1;
7324 if (reg_mentioned_p (v->dest_reg, PATTERN (p)))
7326 if (biv_increment_seen || before_giv_insn)
7328 v->replaceable = 0;
7329 v->not_replaceable = 1;
7330 break;
7332 last_giv_use = p;
7337 /* Now that the lifetime of the giv is known, check for branches
7338 from within the lifetime to outside the lifetime if it is still
7339 replaceable. */
7341 if (v->replaceable)
7343 p = v->insn;
7344 while (1)
7346 p = NEXT_INSN (p);
7347 if (p == loop->end)
7348 p = NEXT_INSN (loop->start);
7349 if (p == last_giv_use)
7350 break;
7352 if (JUMP_P (p) && JUMP_LABEL (p)
7353 && LABEL_NAME (JUMP_LABEL (p))
7354 && ((loop_insn_first_p (JUMP_LABEL (p), v->insn)
7355 && loop_insn_first_p (loop->start, JUMP_LABEL (p)))
7356 || (loop_insn_first_p (last_giv_use, JUMP_LABEL (p))
7357 && loop_insn_first_p (JUMP_LABEL (p), loop->end))))
7359 v->replaceable = 0;
7360 v->not_replaceable = 1;
7362 if (loop_dump_stream)
7363 fprintf (loop_dump_stream,
7364 "Found branch outside giv lifetime.\n");
7366 break;
7371 /* If it is replaceable, then save the final value. */
7372 if (v->replaceable)
7373 v->final_value = final_value;
7376 if (loop_dump_stream && v->replaceable)
7377 fprintf (loop_dump_stream, "Insn %d: giv reg %d final_value replaceable\n",
7378 INSN_UID (v->insn), REGNO (v->dest_reg));
7381 /* Update the status of whether a giv can derive other givs.
7383 We need to do something special if there is or may be an update to the biv
7384 between the time the giv is defined and the time it is used to derive
7385 another giv.
7387 In addition, a giv that is only conditionally set is not allowed to
7388 derive another giv once a label has been passed.
7390 The cases we look at are when a label or an update to a biv is passed. */
7392 static void
7393 update_giv_derive (const struct loop *loop, rtx p)
7395 struct loop_ivs *ivs = LOOP_IVS (loop);
7396 struct iv_class *bl;
7397 struct induction *biv, *giv;
7398 rtx tem;
7399 int dummy;
7401 /* Search all IV classes, then all bivs, and finally all givs.
7403 There are three cases we are concerned with. First we have the situation
7404 of a giv that is only updated conditionally. In that case, it may not
7405 derive any givs after a label is passed.
7407 The second case is when a biv update occurs, or may occur, after the
7408 definition of a giv. For certain biv updates (see below) that are
7409 known to occur between the giv definition and use, we can adjust the
7410 giv definition. For others, or when the biv update is conditional,
7411 we must prevent the giv from deriving any other givs. There are two
7412 sub-cases within this case.
7414 If this is a label, we are concerned with any biv update that is done
7415 conditionally, since it may be done after the giv is defined followed by
7416 a branch here (actually, we need to pass both a jump and a label, but
7417 this extra tracking doesn't seem worth it).
7419 If this is a jump, we are concerned about any biv update that may be
7420 executed multiple times. We are actually only concerned about
7421 backward jumps, but it is probably not worth performing the test
7422 on the jump again here.
7424 If this is a biv update, we must adjust the giv status to show that a
7425 subsequent biv update was performed. If this adjustment cannot be done,
7426 the giv cannot derive further givs. */
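/* Illustrative example: for a biv b and a giv g = b * 3, if the
   increment "b = b + 2" falls between g's definition and a giv
   derived from g, the derived value is off by 2 * 3 = 6. The
   biv-update case below forms exactly that product with
   simplify_giv_expr and records it in derive_adjustment so the
   compensation can be applied later. */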
7428 for (bl = ivs->list; bl; bl = bl->next)
7429 for (biv = bl->biv; biv; biv = biv->next_iv)
7430 if (LABEL_P (p) || JUMP_P (p)
7431 || biv->insn == p)
7433 /* Skip if location is the same as a previous one. */
7434 if (biv->same)
7435 continue;
7437 for (giv = bl->giv; giv; giv = giv->next_iv)
7439 /* If cant_derive is already true, there is no point in
7440 checking all of these conditions again. */
7441 if (giv->cant_derive)
7442 continue;
7444 /* If this giv is conditionally set and we have passed a label,
7445 it cannot derive anything. */
7446 if (LABEL_P (p) && ! giv->always_computable)
7447 giv->cant_derive = 1;
7449 /* Skip givs that have mult_val == 0, since
7450 they are really invariants. Also skip those that are
7451 replaceable, since we know their lifetime doesn't contain
7452 any biv update. */
7453 else if (giv->mult_val == const0_rtx || giv->replaceable)
7454 continue;
7456 /* The only way we can allow this giv to derive another
7457 is if this is a biv increment and we can form the product
7458 of biv->add_val and giv->mult_val. In this case, we will
7459 be able to compute a compensation. */
7460 else if (biv->insn == p)
7462 rtx ext_val_dummy;
7464 tem = 0;
7465 if (biv->mult_val == const1_rtx)
7466 tem = simplify_giv_expr (loop,
7467 gen_rtx_MULT (giv->mode,
7468 biv->add_val,
7469 giv->mult_val),
7470 &ext_val_dummy, &dummy);
7472 if (tem && giv->derive_adjustment)
7473 tem = simplify_giv_expr
7474 (loop,
7475 gen_rtx_PLUS (giv->mode, tem, giv->derive_adjustment),
7476 &ext_val_dummy, &dummy);
7478 if (tem)
7479 giv->derive_adjustment = tem;
7480 else
7481 giv->cant_derive = 1;
7483 else if ((LABEL_P (p) && ! biv->always_computable)
7484 || (JUMP_P (p) && biv->maybe_multiple))
7485 giv->cant_derive = 1;
7490 /* Check whether an insn is an increment legitimate for a basic induction var.
7491 X is the source of insn P, or a part of it.
7492 MODE is the mode in which X should be interpreted.
7494 DEST_REG is the putative biv, also the destination of the insn.
7495 We accept patterns of these forms:
7496 REG = REG + INVARIANT (includes REG = REG - CONSTANT)
7497 REG = INVARIANT + REG
7499 If X is suitable, we return 1, set *MULT_VAL to CONST1_RTX,
7500 store the additive term into *INC_VAL, and store the place where
7501 we found the additive term into *LOCATION.
7503 If X is an assignment of an invariant into DEST_REG, we set
7504 *MULT_VAL to CONST0_RTX, and store the invariant into *INC_VAL.
7506 We also want to detect a BIV when it corresponds to a variable
7507 whose mode was promoted. In that case, an increment
7508 of the variable may be a PLUS that adds a SUBREG of that variable to
7509 an invariant and then sign- or zero-extends the result of the PLUS
7510 into the variable.
Most GIVs in such cases will be in the promoted mode, since that is
probably the natural computation mode (and almost certainly the mode
7514 used for addresses) on the machine. So we view the pseudo-reg containing
7515 the variable as the BIV, as if it were simply incremented.
7517 Note that treating the entire pseudo as a BIV will result in making
7518 simple increments to any GIVs based on it. However, if the variable
7519 overflows in its declared mode but not its promoted mode, the result will
7520 be incorrect. This is acceptable if the variable is signed, since
7521 overflows in such cases are undefined, but not if it is unsigned, since
7522 those overflows are defined. So we only check for SIGN_EXTEND and
7523 not ZERO_EXTEND.
7525 If we cannot find a biv, we return 0. */
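/* Illustrative RTL (hypothetical register numbers): the PLUS case
   below accepts a biv increment such as
       (set (reg 100) (plus (reg 100) (const_int 4)))
   giving *MULT_VAL = const1_rtx and *INC_VAL = (const_int 4), while
   an invariant assignment such as
       (set (reg 100) (const_int 0))
   is accepted by the constant cases with *MULT_VAL = const0_rtx. */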
7527 static int
7528 basic_induction_var (const struct loop *loop, rtx x, enum machine_mode mode,
7529 rtx dest_reg, rtx p, rtx *inc_val, rtx *mult_val,
7530 rtx **location)
7532 enum rtx_code code;
7533 rtx *argp, arg;
7534 rtx insn, set = 0, last, inc;
7536 code = GET_CODE (x);
7537 *location = NULL;
7538 switch (code)
7540 case PLUS:
7541 if (rtx_equal_p (XEXP (x, 0), dest_reg)
7542 || (GET_CODE (XEXP (x, 0)) == SUBREG
7543 && SUBREG_PROMOTED_VAR_P (XEXP (x, 0))
7544 && SUBREG_REG (XEXP (x, 0)) == dest_reg))
7546 argp = &XEXP (x, 1);
7548 else if (rtx_equal_p (XEXP (x, 1), dest_reg)
7549 || (GET_CODE (XEXP (x, 1)) == SUBREG
7550 && SUBREG_PROMOTED_VAR_P (XEXP (x, 1))
7551 && SUBREG_REG (XEXP (x, 1)) == dest_reg))
7553 argp = &XEXP (x, 0);
7555 else
7556 return 0;
7558 arg = *argp;
7559 if (loop_invariant_p (loop, arg) != 1)
7560 return 0;
7562 /* convert_modes can emit new instructions, e.g. when arg is a loop
7563 invariant MEM and dest_reg has a different mode.
7564 These instructions would be emitted after the end of the function
7565 and then *inc_val would be an uninitialized pseudo.
7566 Detect this and bail in this case.
7567 Other alternatives to solve this can be introducing a convert_modes
7568 variant which is allowed to fail but not allowed to emit new
7569 instructions, emit these instructions before loop start and let
7570 it be garbage collected if *inc_val is never used or saving the
7571 *inc_val initialization sequence generated here and when *inc_val
7572 is going to be actually used, emit it at some suitable place. */
7573 last = get_last_insn ();
7574 inc = convert_modes (GET_MODE (dest_reg), GET_MODE (x), arg, 0);
7575 if (get_last_insn () != last)
7577 delete_insns_since (last);
7578 return 0;
7581 *inc_val = inc;
7582 *mult_val = const1_rtx;
7583 *location = argp;
7584 return 1;
7586 case SUBREG:
/* If what's inside the SUBREG is a BIV, then so is the SUBREG. This will
7588 handle addition of promoted variables.
7589 ??? The comment at the start of this function is wrong: promoted
7590 variable increments don't look like it says they do. */
7591 return basic_induction_var (loop, SUBREG_REG (x),
7592 GET_MODE (SUBREG_REG (x)),
7593 dest_reg, p, inc_val, mult_val, location);
7595 case REG:
7596 /* If this register is assigned in a previous insn, look at its
7597 source, but don't go outside the loop or past a label. */
7599 /* If this sets a register to itself, we would repeat any previous
7600 biv increment if we applied this strategy blindly. */
7601 if (rtx_equal_p (dest_reg, x))
7602 return 0;
7604 insn = p;
7605 while (1)
7607 rtx dest;
do
insn = PREV_INSN (insn);
while (insn && NOTE_P (insn)
&& NOTE_LINE_NUMBER (insn) != NOTE_INSN_LOOP_BEG);
7615 if (!insn)
7616 break;
7617 set = single_set (insn);
7618 if (set == 0)
7619 break;
7620 dest = SET_DEST (set);
7621 if (dest == x
7622 || (GET_CODE (dest) == SUBREG
7623 && (GET_MODE_SIZE (GET_MODE (dest)) <= UNITS_PER_WORD)
7624 && (GET_MODE_CLASS (GET_MODE (dest)) == MODE_INT)
7625 && SUBREG_REG (dest) == x))
7626 return basic_induction_var (loop, SET_SRC (set),
7627 (GET_MODE (SET_SRC (set)) == VOIDmode
7628 ? GET_MODE (x)
7629 : GET_MODE (SET_SRC (set))),
7630 dest_reg, insn,
7631 inc_val, mult_val, location);
7633 while (GET_CODE (dest) == SUBREG
7634 || GET_CODE (dest) == ZERO_EXTRACT
7635 || GET_CODE (dest) == STRICT_LOW_PART)
7636 dest = XEXP (dest, 0);
7637 if (dest == x)
7638 break;
7640 /* Fall through. */
/* Can accept constant setting of biv only when inside innermost loop.
7643 Otherwise, a biv of an inner loop may be incorrectly recognized
7644 as a biv of the outer loop,
7645 causing code to be moved INTO the inner loop. */
7646 case MEM:
7647 if (loop_invariant_p (loop, x) != 1)
7648 return 0;
7649 case CONST_INT:
7650 case SYMBOL_REF:
7651 case CONST:
7652 /* convert_modes aborts if we try to convert to or from CCmode, so just
7653 exclude that case. It is very unlikely that a condition code value
would be a useful iterator anyway. convert_modes aborts if we try to
convert a float mode to non-float or vice versa too. */
7656 if (loop->level == 1
7657 && GET_MODE_CLASS (mode) == GET_MODE_CLASS (GET_MODE (dest_reg))
7658 && GET_MODE_CLASS (mode) != MODE_CC)
7660 /* Possible bug here? Perhaps we don't know the mode of X. */
7661 last = get_last_insn ();
7662 inc = convert_modes (GET_MODE (dest_reg), mode, x, 0);
7663 if (get_last_insn () != last)
7665 delete_insns_since (last);
7666 return 0;
7669 *inc_val = inc;
7670 *mult_val = const0_rtx;
7671 return 1;
7673 else
7674 return 0;
7676 case SIGN_EXTEND:
7677 /* Ignore this BIV if signed arithmetic overflow is defined. */
7678 if (flag_wrapv)
7679 return 0;
7680 return basic_induction_var (loop, XEXP (x, 0), GET_MODE (XEXP (x, 0)),
7681 dest_reg, p, inc_val, mult_val, location);
7683 case ASHIFTRT:
7684 /* Similar, since this can be a sign extension. */
7685 for (insn = PREV_INSN (p);
7686 (insn && NOTE_P (insn)
7687 && NOTE_LINE_NUMBER (insn) != NOTE_INSN_LOOP_BEG);
insn = PREV_INSN (insn))
;
7691 if (insn)
7692 set = single_set (insn);
7694 if (! rtx_equal_p (dest_reg, XEXP (x, 0))
7695 && set && SET_DEST (set) == XEXP (x, 0)
7696 && GET_CODE (XEXP (x, 1)) == CONST_INT
7697 && INTVAL (XEXP (x, 1)) >= 0
7698 && GET_CODE (SET_SRC (set)) == ASHIFT
7699 && XEXP (x, 1) == XEXP (SET_SRC (set), 1))
7700 return basic_induction_var (loop, XEXP (SET_SRC (set), 0),
7701 GET_MODE (XEXP (x, 0)),
7702 dest_reg, insn, inc_val, mult_val,
7703 location);
7704 return 0;
7706 default:
7707 return 0;
7711 /* A general induction variable (giv) is any quantity that is a linear
7712 function of a basic induction variable,
7713 i.e. giv = biv * mult_val + add_val.
7714 The coefficients can be any loop invariant quantity.
7715 A giv need not be computed directly from the biv;
7716 it can be computed by way of other givs. */
7718 /* Determine whether X computes a giv.
7719 If it does, return a nonzero value
7720 which is the benefit from eliminating the computation of X;
7721 set *SRC_REG to the register of the biv that it is computed from;
7722 set *ADD_VAL and *MULT_VAL to the coefficients,
7723 such that the value of X is biv * mult + add; */
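/* For example (hypothetical rtx): if X is
       (plus (mult (reg B) (const_int 4)) (const_int 12))
   for a biv B, then *SRC_REG is set to (reg B), *MULT_VAL to
   (const_int 4) and *ADD_VAL to (const_int 12), and the benefit of
   eliminating X is returned through *PBENEFIT. */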
7725 static int
7726 general_induction_var (const struct loop *loop, rtx x, rtx *src_reg,
7727 rtx *add_val, rtx *mult_val, rtx *ext_val,
7728 int is_addr, int *pbenefit,
7729 enum machine_mode addr_mode)
7731 struct loop_ivs *ivs = LOOP_IVS (loop);
7732 rtx orig_x = x;
7734 /* If this is an invariant, forget it, it isn't a giv. */
7735 if (loop_invariant_p (loop, x) == 1)
7736 return 0;
7738 *pbenefit = 0;
7739 *ext_val = NULL_RTX;
7740 x = simplify_giv_expr (loop, x, ext_val, pbenefit);
7741 if (x == 0)
7742 return 0;
7744 switch (GET_CODE (x))
7746 case USE:
7747 case CONST_INT:
7748 /* Since this is now an invariant and wasn't before, it must be a giv
7749 with MULT_VAL == 0. It doesn't matter which BIV we associate this
7750 with. */
7751 *src_reg = ivs->list->biv->dest_reg;
7752 *mult_val = const0_rtx;
7753 *add_val = x;
7754 break;
7756 case REG:
7757 /* This is equivalent to a BIV. */
7758 *src_reg = x;
7759 *mult_val = const1_rtx;
7760 *add_val = const0_rtx;
7761 break;
7763 case PLUS:
7764 /* Either (plus (biv) (invar)) or
7765 (plus (mult (biv) (invar_1)) (invar_2)). */
7766 if (GET_CODE (XEXP (x, 0)) == MULT)
7768 *src_reg = XEXP (XEXP (x, 0), 0);
7769 *mult_val = XEXP (XEXP (x, 0), 1);
7771 else
7773 *src_reg = XEXP (x, 0);
7774 *mult_val = const1_rtx;
7776 *add_val = XEXP (x, 1);
7777 break;
7779 case MULT:
7780 /* ADD_VAL is zero. */
7781 *src_reg = XEXP (x, 0);
7782 *mult_val = XEXP (x, 1);
7783 *add_val = const0_rtx;
7784 break;
7786 default:
7787 gcc_unreachable ();
/* Remove any enclosing USE from ADD_VAL and MULT_VAL (there will be one
unless they are CONST_INT). */
7792 if (GET_CODE (*add_val) == USE)
7793 *add_val = XEXP (*add_val, 0);
7794 if (GET_CODE (*mult_val) == USE)
7795 *mult_val = XEXP (*mult_val, 0);
7797 if (is_addr)
7798 *pbenefit += address_cost (orig_x, addr_mode) - reg_address_cost;
7799 else
7800 *pbenefit += rtx_cost (orig_x, SET);
7802 /* Always return true if this is a giv so it will be detected as such,
7803 even if the benefit is zero or negative. This allows elimination
7804 of bivs that might otherwise not be eliminated. */
7805 return 1;
7808 /* Given an expression, X, try to form it as a linear function of a biv.
7809 We will canonicalize it to be of the form
7810 (plus (mult (BIV) (invar_1))
7811 (invar_2))
7812 with possible degeneracies.
7814 The invariant expressions must each be of a form that can be used as a
machine operand. We surround them with a USE rtx (a hack, but localized
7816 and certainly unambiguous!) if not a CONST_INT for simplicity in this
7817 routine; it is the caller's responsibility to strip them.
7819 If no such canonicalization is possible (i.e., two biv's are used or an
7820 expression that is neither invariant nor a biv or giv), this routine
7821 returns 0.
7823 For a nonzero return, the result will have a code of CONST_INT, USE,
7824 REG (for a BIV), PLUS, or MULT. No other codes will occur.
7826 *BENEFIT will be incremented by the benefit of any sub-giv encountered. */
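/* A short worked example (hypothetical rtx): for a biv B, the input
       (plus (reg B) (mult (reg B) (const_int 3)))
   first has its REG operand rewritten as (mult (reg B) (const_int 1));
   the MULT + MULT case then distributes over the common biv, and the
   result is canonicalized to (mult (reg B) (const_int 4)). */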
7828 static rtx sge_plus (enum machine_mode, rtx, rtx);
7829 static rtx sge_plus_constant (rtx, rtx);
7831 static rtx
7832 simplify_giv_expr (const struct loop *loop, rtx x, rtx *ext_val, int *benefit)
7834 struct loop_ivs *ivs = LOOP_IVS (loop);
7835 struct loop_regs *regs = LOOP_REGS (loop);
7836 enum machine_mode mode = GET_MODE (x);
7837 rtx arg0, arg1;
7838 rtx tem;
7840 /* If this is not an integer mode, or if we cannot do arithmetic in this
7841 mode, this can't be a giv. */
7842 if (mode != VOIDmode
7843 && (GET_MODE_CLASS (mode) != MODE_INT
7844 || GET_MODE_BITSIZE (mode) > HOST_BITS_PER_WIDE_INT))
7845 return NULL_RTX;
7847 switch (GET_CODE (x))
7849 case PLUS:
7850 arg0 = simplify_giv_expr (loop, XEXP (x, 0), ext_val, benefit);
7851 arg1 = simplify_giv_expr (loop, XEXP (x, 1), ext_val, benefit);
7852 if (arg0 == 0 || arg1 == 0)
7853 return NULL_RTX;
7855 /* Put constant last, CONST_INT last if both constant. */
7856 if ((GET_CODE (arg0) == USE
7857 || GET_CODE (arg0) == CONST_INT)
7858 && ! ((GET_CODE (arg0) == USE
7859 && GET_CODE (arg1) == USE)
7860 || GET_CODE (arg1) == CONST_INT))
7861 tem = arg0, arg0 = arg1, arg1 = tem;
7863 /* Handle addition of zero, then addition of an invariant. */
7864 if (arg1 == const0_rtx)
7865 return arg0;
7866 else if (GET_CODE (arg1) == CONST_INT || GET_CODE (arg1) == USE)
7867 switch (GET_CODE (arg0))
7869 case CONST_INT:
7870 case USE:
7871 /* Adding two invariants must result in an invariant, so enclose
7872 addition operation inside a USE and return it. */
7873 if (GET_CODE (arg0) == USE)
7874 arg0 = XEXP (arg0, 0);
7875 if (GET_CODE (arg1) == USE)
7876 arg1 = XEXP (arg1, 0);
7878 if (GET_CODE (arg0) == CONST_INT)
7879 tem = arg0, arg0 = arg1, arg1 = tem;
7880 if (GET_CODE (arg1) == CONST_INT)
7881 tem = sge_plus_constant (arg0, arg1);
7882 else
7883 tem = sge_plus (mode, arg0, arg1);
7885 if (GET_CODE (tem) != CONST_INT)
7886 tem = gen_rtx_USE (mode, tem);
7887 return tem;
7889 case REG:
7890 case MULT:
7891 /* biv + invar or mult + invar. Return sum. */
7892 return gen_rtx_PLUS (mode, arg0, arg1);
7894 case PLUS:
7895 /* (a + invar_1) + invar_2. Associate. */
7896 return
7897 simplify_giv_expr (loop,
7898 gen_rtx_PLUS (mode,
7899 XEXP (arg0, 0),
7900 gen_rtx_PLUS (mode,
7901 XEXP (arg0, 1),
7902 arg1)),
7903 ext_val, benefit);
7905 default:
7906 gcc_unreachable ();
7909 /* Each argument must be either REG, PLUS, or MULT. Convert REG to
7910 MULT to reduce cases. */
7911 if (REG_P (arg0))
7912 arg0 = gen_rtx_MULT (mode, arg0, const1_rtx);
7913 if (REG_P (arg1))
7914 arg1 = gen_rtx_MULT (mode, arg1, const1_rtx);
7916 /* Now have PLUS + PLUS, PLUS + MULT, MULT + PLUS, or MULT + MULT.
7917 Put a MULT first, leaving PLUS + PLUS, MULT + PLUS, or MULT + MULT.
7918 Recurse to associate the second PLUS. */
7919 if (GET_CODE (arg1) == MULT)
7920 tem = arg0, arg0 = arg1, arg1 = tem;
7922 if (GET_CODE (arg1) == PLUS)
7923 return
7924 simplify_giv_expr (loop,
7925 gen_rtx_PLUS (mode,
7926 gen_rtx_PLUS (mode, arg0,
7927 XEXP (arg1, 0)),
7928 XEXP (arg1, 1)),
7929 ext_val, benefit);
7931 /* Now must have MULT + MULT. Distribute if same biv, else not giv. */
7932 if (GET_CODE (arg0) != MULT || GET_CODE (arg1) != MULT)
7933 return NULL_RTX;
if (!rtx_equal_p (XEXP (arg0, 0), XEXP (arg1, 0)))
7936 return NULL_RTX;
7938 return simplify_giv_expr (loop,
7939 gen_rtx_MULT (mode,
7940 XEXP (arg0, 0),
7941 gen_rtx_PLUS (mode,
7942 XEXP (arg0, 1),
7943 XEXP (arg1, 1))),
7944 ext_val, benefit);
7946 case MINUS:
7947 /* Handle "a - b" as "a + b * (-1)". */
7948 return simplify_giv_expr (loop,
7949 gen_rtx_PLUS (mode,
7950 XEXP (x, 0),
7951 gen_rtx_MULT (mode,
7952 XEXP (x, 1),
7953 constm1_rtx)),
7954 ext_val, benefit);
7956 case MULT:
7957 arg0 = simplify_giv_expr (loop, XEXP (x, 0), ext_val, benefit);
7958 arg1 = simplify_giv_expr (loop, XEXP (x, 1), ext_val, benefit);
7959 if (arg0 == 0 || arg1 == 0)
7960 return NULL_RTX;
7962 /* Put constant last, CONST_INT last if both constant. */
7963 if ((GET_CODE (arg0) == USE || GET_CODE (arg0) == CONST_INT)
7964 && GET_CODE (arg1) != CONST_INT)
7965 tem = arg0, arg0 = arg1, arg1 = tem;
7967 /* If second argument is not now constant, not giv. */
7968 if (GET_CODE (arg1) != USE && GET_CODE (arg1) != CONST_INT)
7969 return NULL_RTX;
7971 /* Handle multiply by 0 or 1. */
7972 if (arg1 == const0_rtx)
7973 return const0_rtx;
7975 else if (arg1 == const1_rtx)
7976 return arg0;
7978 switch (GET_CODE (arg0))
7980 case REG:
7981 /* biv * invar. Done. */
7982 return gen_rtx_MULT (mode, arg0, arg1);
7984 case CONST_INT:
7985 /* Product of two constants. */
7986 return GEN_INT (INTVAL (arg0) * INTVAL (arg1));
7988 case USE:
7989 /* invar * invar is a giv, but attempt to simplify it somehow. */
7990 if (GET_CODE (arg1) != CONST_INT)
7991 return NULL_RTX;
7993 arg0 = XEXP (arg0, 0);
7994 if (GET_CODE (arg0) == MULT)
7996 /* (invar_0 * invar_1) * invar_2. Associate. */
7997 return simplify_giv_expr (loop,
7998 gen_rtx_MULT (mode,
7999 XEXP (arg0, 0),
8000 gen_rtx_MULT (mode,
XEXP (arg0, 1),
arg1)),
8004 ext_val, benefit);
8006 /* Propagate the MULT expressions to the innermost nodes. */
8007 else if (GET_CODE (arg0) == PLUS)
8009 /* (invar_0 + invar_1) * invar_2. Distribute. */
8010 return simplify_giv_expr (loop,
8011 gen_rtx_PLUS (mode,
8012 gen_rtx_MULT (mode,
XEXP (arg0, 0),
arg1),
gen_rtx_MULT (mode,
XEXP (arg0, 1),
arg1)),
8020 ext_val, benefit);
8022 return gen_rtx_USE (mode, gen_rtx_MULT (mode, arg0, arg1));
8024 case MULT:
8025 /* (a * invar_1) * invar_2. Associate. */
8026 return simplify_giv_expr (loop,
8027 gen_rtx_MULT (mode,
8028 XEXP (arg0, 0),
8029 gen_rtx_MULT (mode,
8030 XEXP (arg0, 1),
8031 arg1)),
8032 ext_val, benefit);
8034 case PLUS:
8035 /* (a + invar_1) * invar_2. Distribute. */
8036 return simplify_giv_expr (loop,
8037 gen_rtx_PLUS (mode,
8038 gen_rtx_MULT (mode,
8039 XEXP (arg0, 0),
8040 arg1),
8041 gen_rtx_MULT (mode,
8042 XEXP (arg0, 1),
8043 arg1)),
8044 ext_val, benefit);
8046 default:
8047 gcc_unreachable ();
8050 case ASHIFT:
8051 /* Shift by constant is multiply by power of two. */
8052 if (GET_CODE (XEXP (x, 1)) != CONST_INT)
8053 return 0;
8055 return
8056 simplify_giv_expr (loop,
8057 gen_rtx_MULT (mode,
8058 XEXP (x, 0),
8059 GEN_INT ((HOST_WIDE_INT) 1
8060 << INTVAL (XEXP (x, 1)))),
8061 ext_val, benefit);
8063 case NEG:
8064 /* "-a" is "a * (-1)" */
8065 return simplify_giv_expr (loop,
8066 gen_rtx_MULT (mode, XEXP (x, 0), constm1_rtx),
8067 ext_val, benefit);
8069 case NOT:
8070 /* "~a" is "-a - 1". Silly, but easy. */
8071 return simplify_giv_expr (loop,
8072 gen_rtx_MINUS (mode,
8073 gen_rtx_NEG (mode, XEXP (x, 0)),
8074 const1_rtx),
8075 ext_val, benefit);
8077 case USE:
8078 /* Already in proper form for invariant. */
8079 return x;
8081 case SIGN_EXTEND:
8082 case ZERO_EXTEND:
8083 case TRUNCATE:
8084 /* Conditionally recognize extensions of simple IVs. After we've
8085 computed loop traversal counts and verified the range of the
8086 source IV, we'll reevaluate this as a GIV. */
8087 if (*ext_val == NULL_RTX)
8089 arg0 = simplify_giv_expr (loop, XEXP (x, 0), ext_val, benefit);
8090 if (arg0 && *ext_val == NULL_RTX && REG_P (arg0))
8092 *ext_val = gen_rtx_fmt_e (GET_CODE (x), mode, arg0);
8093 return arg0;
8096 goto do_default;
8098 case REG:
8099 /* If this is a new register, we can't deal with it. */
8100 if (REGNO (x) >= max_reg_before_loop)
8101 return 0;
8103 /* Check for biv or giv. */
8104 switch (REG_IV_TYPE (ivs, REGNO (x)))
8106 case BASIC_INDUCT:
8107 return x;
8108 case GENERAL_INDUCT:
8110 struct induction *v = REG_IV_INFO (ivs, REGNO (x));
8112 /* Form expression from giv and add benefit. Ensure this giv
8113 can derive another and subtract any needed adjustment if so. */
8115 /* Increasing the benefit here is risky. The only case in which it
8116 is arguably correct is if this is the only use of V. In other
8117 cases, this will artificially inflate the benefit of the current
8118 giv, and lead to suboptimal code. Thus, it is disabled, since
8119 potentially not reducing an only marginally beneficial giv is
8120 less harmful than reducing many givs that are not really
8121 beneficial. */
8123 rtx single_use = regs->array[REGNO (x)].single_usage;
8124 if (single_use && single_use != const0_rtx)
8125 *benefit += v->benefit;
8128 if (v->cant_derive)
8129 return 0;
8131 tem = gen_rtx_PLUS (mode, gen_rtx_MULT (mode,
8132 v->src_reg, v->mult_val),
8133 v->add_val);
8135 if (v->derive_adjustment)
8136 tem = gen_rtx_MINUS (mode, tem, v->derive_adjustment);
8137 arg0 = simplify_giv_expr (loop, tem, ext_val, benefit);
8138 if (*ext_val)
8140 if (!v->ext_dependent)
8141 return arg0;
8143 else
8145 *ext_val = v->ext_dependent;
8146 return arg0;
8148 return 0;
8151 default:
8152 do_default:
8153 /* If it isn't an induction variable, and it is invariant, we
8154 may be able to simplify things further by looking through
8155 the bits we just moved outside the loop. */
8156 if (loop_invariant_p (loop, x) == 1)
8158 struct movable *m;
8159 struct loop_movables *movables = LOOP_MOVABLES (loop);
8161 for (m = movables->head; m; m = m->next)
8162 if (rtx_equal_p (x, m->set_dest))
8164 /* Ok, we found a match. Substitute and simplify. */
8166 /* If we match another movable, we must use that, as
8167 this one is going away. */
8168 if (m->match)
8169 return simplify_giv_expr (loop, m->match->set_dest,
8170 ext_val, benefit);
8172 /* If consec is nonzero, this is a member of a group of
8173 instructions that were moved together. We handle this
8174 case only to the point of seeking to the last insn and
8175 looking for a REG_EQUAL. Fail if we don't find one. */
8176 if (m->consec != 0)
8178 int i = m->consec;
8179 tem = m->insn;
do
tem = NEXT_INSN (tem);
while (--i > 0);
8186 tem = find_reg_note (tem, REG_EQUAL, NULL_RTX);
8187 if (tem)
8188 tem = XEXP (tem, 0);
8190 else
8192 tem = single_set (m->insn);
8193 if (tem)
8194 tem = SET_SRC (tem);
8197 if (tem)
8199 /* What we are most interested in is pointer
8200 arithmetic on invariants -- only take
8201 patterns we may be able to do something with. */
8202 if (GET_CODE (tem) == PLUS
8203 || GET_CODE (tem) == MULT
8204 || GET_CODE (tem) == ASHIFT
8205 || GET_CODE (tem) == CONST_INT
8206 || GET_CODE (tem) == SYMBOL_REF)
8208 tem = simplify_giv_expr (loop, tem, ext_val,
8209 benefit);
8210 if (tem)
8211 return tem;
8213 else if (GET_CODE (tem) == CONST
8214 && GET_CODE (XEXP (tem, 0)) == PLUS
8215 && GET_CODE (XEXP (XEXP (tem, 0), 0)) == SYMBOL_REF
8216 && GET_CODE (XEXP (XEXP (tem, 0), 1)) == CONST_INT)
8218 tem = simplify_giv_expr (loop, XEXP (tem, 0),
8219 ext_val, benefit);
8220 if (tem)
8221 return tem;
8224 break;
8227 break;
8230 /* Fall through to general case. */
8231 default:
8232 /* If invariant, return as USE (unless CONST_INT).
8233 Otherwise, not giv. */
8234 if (GET_CODE (x) == USE)
8235 x = XEXP (x, 0);
8237 if (loop_invariant_p (loop, x) == 1)
8239 if (GET_CODE (x) == CONST_INT)
8240 return x;
8241 if (GET_CODE (x) == CONST
8242 && GET_CODE (XEXP (x, 0)) == PLUS
8243 && GET_CODE (XEXP (XEXP (x, 0), 0)) == SYMBOL_REF
8244 && GET_CODE (XEXP (XEXP (x, 0), 1)) == CONST_INT)
8245 x = XEXP (x, 0);
8246 return gen_rtx_USE (mode, x);
8248 else
8249 return 0;
8253 /* This routine folds invariants such that there is only ever one
8254 CONST_INT in the summation. It is only used by simplify_giv_expr. */
8256 static rtx
8257 sge_plus_constant (rtx x, rtx c)
8259 if (GET_CODE (x) == CONST_INT)
8260 return GEN_INT (INTVAL (x) + INTVAL (c));
8261 else if (GET_CODE (x) != PLUS)
8262 return gen_rtx_PLUS (GET_MODE (x), x, c);
8263 else if (GET_CODE (XEXP (x, 1)) == CONST_INT)
8265 return gen_rtx_PLUS (GET_MODE (x), XEXP (x, 0),
8266 GEN_INT (INTVAL (XEXP (x, 1)) + INTVAL (c)));
8268 else if (GET_CODE (XEXP (x, 0)) == PLUS
8269 || GET_CODE (XEXP (x, 1)) != PLUS)
8271 return gen_rtx_PLUS (GET_MODE (x),
8272 sge_plus_constant (XEXP (x, 0), c), XEXP (x, 1));
8274 else
8276 return gen_rtx_PLUS (GET_MODE (x),
8277 sge_plus_constant (XEXP (x, 1), c), XEXP (x, 0));
8281 static rtx
8282 sge_plus (enum machine_mode mode, rtx x, rtx y)
8284 while (GET_CODE (y) == PLUS)
8286 rtx a = XEXP (y, 0);
8287 if (GET_CODE (a) == CONST_INT)
8288 x = sge_plus_constant (x, a);
8289 else
8290 x = gen_rtx_PLUS (mode, x, a);
8291 y = XEXP (y, 1);
8293 if (GET_CODE (y) == CONST_INT)
8294 x = sge_plus_constant (x, y);
8295 else
8296 x = gen_rtx_PLUS (mode, x, y);
8297 return x;
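/* Folding example (hypothetical rtx): for
       x = (symbol_ref S)
       y = (plus (const_int 2) (plus (reg R) (const_int 3)))
   sge_plus peels y's terms one at a time and folds the constants
   through sge_plus_constant, returning
       (plus (plus (symbol_ref S) (const_int 5)) (reg R))
   so that only one CONST_INT survives in the summation. */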
8300 /* Help detect a giv that is calculated by several consecutive insns;
8301 for example,
8302 giv = biv * M
8303 giv = giv + A
8304 The caller has already identified the first insn P as having a giv as dest;
8305 we check that all other insns that set the same register follow
8306 immediately after P, that they alter nothing else,
8307 and that the result of the last is still a giv.
8309 The value is 0 if the reg set in P is not really a giv.
8310 Otherwise, the value is the amount gained by eliminating
8311 all the consecutive insns that compute the value.
8313 FIRST_BENEFIT is the amount gained by eliminating the first insn, P.
8314 SRC_REG is the reg of the biv; DEST_REG is the reg of the giv.
8316 The coefficients of the ultimate giv value are stored in
8317 *MULT_VAL and *ADD_VAL. */
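/* Example of the pattern handled here (hypothetical registers, with
   biv r2 and loop-invariant r7):
       r5 = r2 * 4        <- insn P, already identified as a giv
       r5 = r5 + r7
   Together the two insns make r5 a giv with mult_val 4 and add_val
   r7, and *LAST_CONSEC_INSN is set to the second insn. */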
8319 static int
8320 consec_sets_giv (const struct loop *loop, int first_benefit, rtx p,
8321 rtx src_reg, rtx dest_reg, rtx *add_val, rtx *mult_val,
8322 rtx *ext_val, rtx *last_consec_insn)
8324 struct loop_ivs *ivs = LOOP_IVS (loop);
8325 struct loop_regs *regs = LOOP_REGS (loop);
8326 int count;
8327 enum rtx_code code;
8328 int benefit;
8329 rtx temp;
8330 rtx set;
8332 /* Indicate that this is a giv so that we can update the value produced in
8333 each insn of the multi-insn sequence.
8335 This induction structure will be used only by the call to
8336 general_induction_var below, so we can allocate it on our stack.
8337 If this is a giv, our caller will replace the induct var entry with
8338 a new induction structure. */
8339 struct induction *v;
8341 if (REG_IV_TYPE (ivs, REGNO (dest_reg)) != UNKNOWN_INDUCT)
8342 return 0;
8344 v = alloca (sizeof (struct induction));
8345 v->src_reg = src_reg;
8346 v->mult_val = *mult_val;
8347 v->add_val = *add_val;
8348 v->benefit = first_benefit;
8349 v->cant_derive = 0;
8350 v->derive_adjustment = 0;
8351 v->ext_dependent = NULL_RTX;
8353 REG_IV_TYPE (ivs, REGNO (dest_reg)) = GENERAL_INDUCT;
8354 REG_IV_INFO (ivs, REGNO (dest_reg)) = v;
8356 count = regs->array[REGNO (dest_reg)].n_times_set - 1;
8358 while (count > 0)
8360 p = NEXT_INSN (p);
8361 code = GET_CODE (p);
8363 /* If libcall, skip to end of call sequence. */
8364 if (code == INSN && (temp = find_reg_note (p, REG_LIBCALL, NULL_RTX)))
8365 p = XEXP (temp, 0);
8367 if (code == INSN
8368 && (set = single_set (p))
8369 && REG_P (SET_DEST (set))
8370 && SET_DEST (set) == dest_reg
8371 && (general_induction_var (loop, SET_SRC (set), &src_reg,
8372 add_val, mult_val, ext_val, 0,
8373 &benefit, VOIDmode)
8374 /* Giv created by equivalent expression. */
8375 || ((temp = find_reg_note (p, REG_EQUAL, NULL_RTX))
8376 && general_induction_var (loop, XEXP (temp, 0), &src_reg,
8377 add_val, mult_val, ext_val, 0,
8378 &benefit, VOIDmode)))
8379 && src_reg == v->src_reg)
8381 if (find_reg_note (p, REG_RETVAL, NULL_RTX))
8382 benefit += libcall_benefit (p);
8384 count--;
8385 v->mult_val = *mult_val;
8386 v->add_val = *add_val;
8387 v->benefit += benefit;
8389 else if (code != NOTE)
8391 /* Allow insns that set something other than this giv to a
8392 constant. Such insns are needed on machines which cannot
8393 include long constants and should not disqualify a giv. */
8394 if (code == INSN
8395 && (set = single_set (p))
8396 && SET_DEST (set) != dest_reg
8397 && CONSTANT_P (SET_SRC (set)))
8398 continue;
8400 REG_IV_TYPE (ivs, REGNO (dest_reg)) = UNKNOWN_INDUCT;
8401 return 0;
8405 REG_IV_TYPE (ivs, REGNO (dest_reg)) = UNKNOWN_INDUCT;
8406 *last_consec_insn = p;
8407 return v->benefit;
8410 /* Return an rtx, if any, that expresses giv G2 as a function of the register
8411 represented by G1. If no such expression can be found, or it is clear that
8412 it cannot possibly be a valid address, 0 is returned.
8414 To perform the computation, we note that
8415 G1 = x * v + a and
8416 G2 = y * v + b
8417 where `v' is the biv.
So G2 = (y/x) * G1 + (b - a*y/x).
8421 Note that MULT = y/x.
8423 Update: A and B are now allowed to be additive expressions such that
8424 B contains all variables in A. That is, computing B-A will not require
8425 subtracting variables. */
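/* Worked example (illustrative numbers): with G1 = 2*v + 1 and
   G2 = 6*v + 9, we get MULT = y/x = 3 and G2 = 3*G1 + (9 - 1*3),
   so the routine returns an rtx computing 3*G1 + 6. */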
8427 static rtx
8428 express_from_1 (rtx a, rtx b, rtx mult)
8430 /* If MULT is zero, then A*MULT is zero, and our expression is B. */
8432 if (mult == const0_rtx)
8433 return b;
8435 /* If MULT is not 1, we cannot handle A with non-constants, since we
8436 would then be required to subtract multiples of the registers in A.
8437 This is theoretically possible, and may even apply to some Fortran
8438 constructs, but it is a lot of work and we do not attempt it here. */
8440 if (mult != const1_rtx && GET_CODE (a) != CONST_INT)
8441 return NULL_RTX;
8443 /* In general these structures are sorted top to bottom (down the PLUS
8444 chain), but not left to right across the PLUS. If B is a higher
8445 order giv than A, we can strip one level and recurse. If A is higher
8446 order, we'll eventually bail out, but won't know that until the end.
8447 If they are the same, we'll strip one level around this loop. */
8449 while (GET_CODE (a) == PLUS && GET_CODE (b) == PLUS)
8451 rtx ra, rb, oa, ob, tmp;
8453 ra = XEXP (a, 0), oa = XEXP (a, 1);
8454 if (GET_CODE (ra) == PLUS)
8455 tmp = ra, ra = oa, oa = tmp;
8457 rb = XEXP (b, 0), ob = XEXP (b, 1);
8458 if (GET_CODE (rb) == PLUS)
8459 tmp = rb, rb = ob, ob = tmp;
8461 if (rtx_equal_p (ra, rb))
8462 /* We matched: remove one reg completely. */
8463 a = oa, b = ob;
8464 else if (GET_CODE (ob) != PLUS && rtx_equal_p (ra, ob))
8465 /* An alternate match. */
8466 a = oa, b = rb;
8467 else if (GET_CODE (oa) != PLUS && rtx_equal_p (oa, rb))
8468 /* An alternate match. */
8469 a = ra, b = ob;
8470 else
8472 /* Indicates an extra register in B. Strip one level from B and
8473 recurse, hoping B was the higher order expression. */
8474 ob = express_from_1 (a, ob, mult);
8475 if (ob == NULL_RTX)
8476 return NULL_RTX;
8477 return gen_rtx_PLUS (GET_MODE (b), rb, ob);
8481 /* Here we are at the last level of A, go through the cases hoping to
8482 get rid of everything but a constant. */
8484 if (GET_CODE (a) == PLUS)
8486 rtx ra, oa;
8488 ra = XEXP (a, 0), oa = XEXP (a, 1);
8489 if (rtx_equal_p (oa, b))
8490 oa = ra;
8491 else if (!rtx_equal_p (ra, b))
8492 return NULL_RTX;
8494 if (GET_CODE (oa) != CONST_INT)
8495 return NULL_RTX;
8497 return GEN_INT (-INTVAL (oa) * INTVAL (mult));
8499 else if (GET_CODE (a) == CONST_INT)
8501 return plus_constant (b, -INTVAL (a) * INTVAL (mult));
8503 else if (CONSTANT_P (a))
8505 enum machine_mode mode_a = GET_MODE (a);
8506 enum machine_mode mode_b = GET_MODE (b);
8507 enum machine_mode mode = mode_b == VOIDmode ? mode_a : mode_b;
8508 return simplify_gen_binary (MINUS, mode, b, a);
8510 else if (GET_CODE (b) == PLUS)
8512 if (rtx_equal_p (a, XEXP (b, 0)))
8513 return XEXP (b, 1);
8514 else if (rtx_equal_p (a, XEXP (b, 1)))
8515 return XEXP (b, 0);
8516 else
8517 return NULL_RTX;
8519 else if (rtx_equal_p (a, b))
8520 return const0_rtx;
8522 return NULL_RTX;
8525 static rtx
8526 express_from (struct induction *g1, struct induction *g2)
8528 rtx mult, add;
/* The value that G1 will be multiplied by must be a constant integer. Also,
the only chance we have of getting a valid address is if y/x (see above
for notation) is also an integer. */
8533 if (GET_CODE (g1->mult_val) == CONST_INT
8534 && GET_CODE (g2->mult_val) == CONST_INT)
8536 if (g1->mult_val == const0_rtx
8537 || (g1->mult_val == constm1_rtx
8538 && INTVAL (g2->mult_val)
8539 == (HOST_WIDE_INT) 1 << (HOST_BITS_PER_WIDE_INT - 1))
8540 || INTVAL (g2->mult_val) % INTVAL (g1->mult_val) != 0)
8541 return NULL_RTX;
8542 mult = GEN_INT (INTVAL (g2->mult_val) / INTVAL (g1->mult_val));
8544 else if (rtx_equal_p (g1->mult_val, g2->mult_val))
8545 mult = const1_rtx;
8546 else
/* ??? Find out if one is a multiple of the other? */
8549 return NULL_RTX;
8552 add = express_from_1 (g1->add_val, g2->add_val, mult);
8553 if (add == NULL_RTX)
8555 /* Failed. If we've got a multiplication factor between G1 and G2,
8556 scale G1's addend and try again. */
8557 if (INTVAL (mult) > 1)
8559 rtx g1_add_val = g1->add_val;
8560 if (GET_CODE (g1_add_val) == MULT
8561 && GET_CODE (XEXP (g1_add_val, 1)) == CONST_INT)
8563 HOST_WIDE_INT m;
8564 m = INTVAL (mult) * INTVAL (XEXP (g1_add_val, 1));
8565 g1_add_val = gen_rtx_MULT (GET_MODE (g1_add_val),
8566 XEXP (g1_add_val, 0), GEN_INT (m));
8568 else
8570 g1_add_val = gen_rtx_MULT (GET_MODE (g1_add_val), g1_add_val,
8571 mult);
8574 add = express_from_1 (g1_add_val, g2->add_val, const1_rtx);
8577 if (add == NULL_RTX)
8578 return NULL_RTX;
8580 /* Form simplified final result. */
8581 if (mult == const0_rtx)
8582 return add;
8583 else if (mult == const1_rtx)
8584 mult = g1->dest_reg;
8585 else
8586 mult = gen_rtx_MULT (g2->mode, g1->dest_reg, mult);
8588 if (add == const0_rtx)
8589 return mult;
8590 else
8592 if (GET_CODE (add) == PLUS
8593 && CONSTANT_P (XEXP (add, 1)))
8595 rtx tem = XEXP (add, 1);
8596 mult = gen_rtx_PLUS (g2->mode, mult, XEXP (add, 0));
8597 add = tem;
8600 return gen_rtx_PLUS (g2->mode, mult, add);
8604 /* Return an rtx, if any, that expresses giv G2 as a function of the register
8605 represented by G1. This indicates that G2 should be combined with G1 and
8606 that G2 can use (either directly or via an address expression) a register
8607 used to represent G1. */
8609 static rtx
8610 combine_givs_p (struct induction *g1, struct induction *g2)
8612 rtx comb, ret;
/* With the introduction of ext dependent givs, we must be careful about modes.
8615 G2 must not use a wider mode than G1. */
8616 if (GET_MODE_SIZE (g1->mode) < GET_MODE_SIZE (g2->mode))
8617 return NULL_RTX;
8619 ret = comb = express_from (g1, g2);
8620 if (comb == NULL_RTX)
8621 return NULL_RTX;
8622 if (g1->mode != g2->mode)
8623 ret = gen_lowpart (g2->mode, comb);
8625 /* If these givs are identical, they can be combined. We use the results
8626 of express_from because the addends are not in a canonical form, so
8627 rtx_equal_p is a weaker test. */
8628 /* But don't combine a DEST_REG giv with a DEST_ADDR giv; we want the
8629 combination to be the other way round. */
8630 if (comb == g1->dest_reg
8631 && (g1->giv_type == DEST_REG || g2->giv_type == DEST_ADDR))
8633 return ret;
8636 /* If G2 can be expressed as a function of G1 and that function is valid
8637 as an address and no more expensive than using a register for G2,
8638 the expression of G2 in terms of G1 can be used. */
8639 if (ret != NULL_RTX
8640 && g2->giv_type == DEST_ADDR
8641 && memory_address_p (GET_MODE (g2->mem), ret))
8642 return ret;
8644 return NULL_RTX;
8647 /* See if BL is monotonic and has a constant per-iteration increment.
8648 Return the increment if so, otherwise return 0. */
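/* For instance (illustrative): a biv with two +4 increments per
   iteration has a constant total increment of 8 and every step moves
   the same way, so 8 is returned; a biv with increments +4 and -4 is
   rejected (return value 0), because an intermediate value moves
   against the overall direction and the range proofs below could not
   rely on monotonicity. */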
8650 static HOST_WIDE_INT
8651 get_monotonic_increment (struct iv_class *bl)
8653 struct induction *v;
8654 rtx incr;
8656 /* Get the total increment and check that it is constant. */
8657 incr = biv_total_increment (bl);
8658 if (incr == 0 || GET_CODE (incr) != CONST_INT)
8659 return 0;
8661 for (v = bl->biv; v != 0; v = v->next_iv)
8663 if (GET_CODE (v->add_val) != CONST_INT)
8664 return 0;
8666 if (INTVAL (v->add_val) < 0 && INTVAL (incr) >= 0)
8667 return 0;
8669 if (INTVAL (v->add_val) > 0 && INTVAL (incr) <= 0)
8670 return 0;
8672 return INTVAL (incr);
8676 /* Subroutine of biv_fits_mode_p. Return true if biv BL, when biased by
8677 BIAS, will never exceed the unsigned range of MODE. LOOP is the loop
8678 to which the biv belongs and INCR is its per-iteration increment. */
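/* Numeric example (illustrative): in QImode, MAXIMUM is 255; with
   INITIAL = 10, INCR = 3 and 50 iterations, DELTA = 3 and
   SPAN = 256 - 10 = 246. Since 246 / 50 = 4 >= 3, the biased biv
   stays in range (its final value is 10 + 50*3 = 160). A standalone
   sketch of the same test follows; the names and the fixed-width
   types are hypothetical, and it assumes a nonzero iteration count,
   as the function below does. It is kept under #if 0 so that it is
   never compiled. */
#if 0
#include <stdbool.h>

static bool
sketch_biased_fits (unsigned long long initial, long long incr,
                    unsigned long long maximum,
                    unsigned long long n_iterations)
{
  unsigned long long delta, span;

  /* The biased initial value must itself be in range.  */
  if (initial > maximum)
    return false;

  if (incr < 0)
    {
      /* A decreasing biv can consume at most INITIAL before wrapping.  */
      delta = -incr;
      span = initial;
    }
  else
    {
      delta = incr;
      /* Mirror the wrap-around special case handled in the function
         below, where MAXIMUM + 1 == INITIAL and the whole range is
         available.  */
      span = (maximum + 1 == initial
              ? n_iterations * delta
              : maximum + 1 - initial);
    }

  /* Check n_iterations * delta <= span without risking overflow.  */
  return span / n_iterations >= delta;
}
#endif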
8680 static bool
8681 biased_biv_fits_mode_p (const struct loop *loop, struct iv_class *bl,
8682 HOST_WIDE_INT incr, enum machine_mode mode,
8683 unsigned HOST_WIDE_INT bias)
8685 unsigned HOST_WIDE_INT initial, maximum, span, delta;
8687 /* We need to be able to manipulate MODE-size constants. */
8688 if (HOST_BITS_PER_WIDE_INT < GET_MODE_BITSIZE (mode))
8689 return false;
8691 /* The number of loop iterations must be constant. */
8692 if (LOOP_INFO (loop)->n_iterations == 0)
8693 return false;
8695 /* So must the biv's initial value. */
8696 if (bl->initial_value == 0 || GET_CODE (bl->initial_value) != CONST_INT)
8697 return false;
8699 initial = bias + INTVAL (bl->initial_value);
8700 maximum = GET_MODE_MASK (mode);
8702 /* Make sure that the initial value is within range. */
8703 if (initial > maximum)
8704 return false;
8706 /* Set up DELTA and SPAN such that the number of iterations * DELTA
8707 (calculated to arbitrary precision) must be <= SPAN. */
8708 if (incr < 0)
8710 delta = -incr;
8711 span = initial;
8713 else
8715 delta = incr;
8716 /* Handle the special case in which MAXIMUM is the largest
8717 unsigned HOST_WIDE_INT and INITIAL is 0. */
8718 if (maximum + 1 == initial)
8719 span = LOOP_INFO (loop)->n_iterations * delta;
8720 else
8721 span = maximum + 1 - initial;
8723 return (span / LOOP_INFO (loop)->n_iterations >= delta);
8727 /* Return true if biv BL will never exceed the bounds of MODE. LOOP is
8728 the loop to which BL belongs and INCR is its per-iteration increment.
8729 UNSIGNEDP is true if the biv should be treated as unsigned. */
8731 static bool
8732 biv_fits_mode_p (const struct loop *loop, struct iv_class *bl,
8733 HOST_WIDE_INT incr, enum machine_mode mode, bool unsignedp)
8735 struct loop_info *loop_info;
8736 unsigned HOST_WIDE_INT bias;
8738 /* A biv's value will always be limited to its natural mode.
8739 Larger modes will observe the same wrap-around. */
8740 if (GET_MODE_SIZE (mode) > GET_MODE_SIZE (GET_MODE (bl->biv->src_reg)))
8741 mode = GET_MODE (bl->biv->src_reg);
8743 loop_info = LOOP_INFO (loop);
8745 bias = (unsignedp ? 0 : (GET_MODE_MASK (mode) >> 1) + 1);
8746 if (biased_biv_fits_mode_p (loop, bl, incr, mode, bias))
8747 return true;
8749 if (mode == GET_MODE (bl->biv->src_reg)
8750 && bl->biv->src_reg == loop_info->iteration_var
8751 && loop_info->comparison_value
8752 && loop_invariant_p (loop, loop_info->comparison_value))
8754 /* If the increment is +1, and the exit test is a <, the BIV
8755 cannot overflow. (For <=, we have the problematic case that
8756 the comparison value might be the maximum value of the range.) */
8757 if (incr == 1)
8759 if (loop_info->comparison_code == LT)
8760 return true;
8761 if (loop_info->comparison_code == LTU && unsignedp)
8762 return true;
8765 /* Likewise for increment -1 and exit test >. */
8766 if (incr == -1)
8768 if (loop_info->comparison_code == GT)
8769 return true;
8770 if (loop_info->comparison_code == GTU && unsignedp)
8771 return true;
8774 return false;
8778 /* Given that X is an extension or truncation of BL, return true
8779 if it is unaffected by overflow. LOOP is the loop to which
8780 BL belongs and INCR is its per-iteration increment. */
8782 static bool
8783 extension_within_bounds_p (const struct loop *loop, struct iv_class *bl,
8784 HOST_WIDE_INT incr, rtx x)
8786 enum machine_mode mode;
8787 bool signedp, unsignedp;
8789 switch (GET_CODE (x))
8791 case SIGN_EXTEND:
8792 case ZERO_EXTEND:
8793 mode = GET_MODE (XEXP (x, 0));
8794 signedp = (GET_CODE (x) == SIGN_EXTEND);
8795 unsignedp = (GET_CODE (x) == ZERO_EXTEND);
8796 break;
8798 case TRUNCATE:
8799 /* We don't know whether this value is being used as signed
8800 or unsigned, so check the conditions for both. */
8801 mode = GET_MODE (x);
8802 signedp = unsignedp = true;
8803 break;
8805 default:
8806 gcc_unreachable ();
8809 return ((!signedp || biv_fits_mode_p (loop, bl, incr, mode, false))
8810 && (!unsignedp || biv_fits_mode_p (loop, bl, incr, mode, true)));
8814 /* Check each extension dependent giv in this class to see if its
8815 root biv is safe from wrapping in the interior mode, which would
8816 make the giv illegal. */
8818 static void
8819 check_ext_dependent_givs (const struct loop *loop, struct iv_class *bl)
8821 struct induction *v;
8822 HOST_WIDE_INT incr;
8824 incr = get_monotonic_increment (bl);
8826 /* Invalidate givs that fail the tests. */
8827 for (v = bl->giv; v; v = v->next_iv)
8828 if (v->ext_dependent)
8830 if (incr != 0
8831 && extension_within_bounds_p (loop, bl, incr, v->ext_dependent))
8833 if (loop_dump_stream)
8834 fprintf (loop_dump_stream,
8835 "Verified ext dependent giv at %d of reg %d\n",
8836 INSN_UID (v->insn), bl->regno);
8838 else
8840 if (loop_dump_stream)
8841 fprintf (loop_dump_stream,
8842 "Failed ext dependent giv at %d\n",
8843 INSN_UID (v->insn));
8845 v->ignore = 1;
8846 bl->all_reduced = 0;
8851 /* Generate a version of VALUE in a mode appropriate for initializing V. */
8853 static rtx
8854 extend_value_for_giv (struct induction *v, rtx value)
8856 rtx ext_dep = v->ext_dependent;
8858 if (! ext_dep)
8859 return value;
8861 /* Recall that check_ext_dependent_givs verified that the known bounds
8862 of a biv did not overflow or wrap with respect to the extension for
8863 the giv. Therefore, constants need no additional adjustment. */
8864 if (CONSTANT_P (value) && GET_MODE (value) == VOIDmode)
8865 return value;
8867 /* Otherwise, we must adjust the value to compensate for the
8868 differing modes of the biv and the giv. */
8869 return gen_rtx_fmt_e (GET_CODE (ext_dep), GET_MODE (ext_dep), value);
8872 struct combine_givs_stats
8874 int giv_number;
8875 int total_benefit;
8878 static int
8879 cmp_combine_givs_stats (const void *xp, const void *yp)
8881 const struct combine_givs_stats * const x =
8882 (const struct combine_givs_stats *) xp;
8883 const struct combine_givs_stats * const y =
8884 (const struct combine_givs_stats *) yp;
8885 int d;
8886 d = y->total_benefit - x->total_benefit;
8887 /* Stabilize the sort. */
8888 if (!d)
8889 d = x->giv_number - y->giv_number;
8890 return d;
8893 /* Check all pairs of givs for iv_class BL and see if any can be combined with
8894 any other. If so, point SAME to the giv combined with and set NEW_REG to
8895 be an expression (in terms of the other giv's DEST_REG) equivalent to the
8896 giv. Also, update BENEFIT and related fields for cost/benefit analysis. */
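/* The selection loop below is a greedy quadratic pairing: build the
   pairwise can_combine matrix, rank candidates by total benefit,
   commit the best one, discount its mates, and restart. A compact
   standalone sketch of that shape follows; the types, the scoring and
   the pairing predicate are all hypothetical stand-ins (can_pair
   plays the role of combine_givs_p), and the block is under #if 0 so
   it is never compiled. */
#if 0
struct cand
{
  int benefit;   /* Analogue of a giv's benefit field.  */
  int combined;  /* Nonzero once this candidate has been dealt with.  */
};

typedef int (*pair_fn) (const struct cand *, const struct cand *);

static void
sketch_combine (struct cand *c, int n, pair_fn can_pair)
{
  int i, j;

  for (;;)
    {
      int best = -1, best_score = 0;

      /* Score every live candidate by its own benefit plus the
         benefit of everything it could absorb.  */
      for (i = 0; i < n; i++)
        {
          int score;

          if (c[i].combined)
            continue;
          score = c[i].benefit;
          for (j = 0; j < n; j++)
            if (j != i && !c[j].combined && can_pair (&c[i], &c[j]))
              score += c[j].benefit;
          if (best < 0 || score > best_score)
            best = i, best_score = score;
        }
      if (best < 0)
        break;

      /* Commit the winner: absorb every available mate, then rescore
         from scratch, as the restart label does in the real code.  */
      for (j = 0; j < n; j++)
        if (j != best && !c[j].combined && can_pair (&c[best], &c[j]))
          {
            c[j].combined = 1;
            c[best].benefit += c[j].benefit;
          }
      c[best].combined = 1;
    }
}
#endif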
8898 static void
8899 combine_givs (struct loop_regs *regs, struct iv_class *bl)
8901 /* Additional benefit to add for being combined multiple times. */
8902 const int extra_benefit = 3;
8904 struct induction *g1, *g2, **giv_array;
8905 int i, j, k, giv_count;
8906 struct combine_givs_stats *stats;
8907 rtx *can_combine;
8909 /* Count givs, because bl->giv_count is incorrect here. */
8910 giv_count = 0;
8911 for (g1 = bl->giv; g1; g1 = g1->next_iv)
8912 if (!g1->ignore)
8913 giv_count++;
8915 giv_array = alloca (giv_count * sizeof (struct induction *));
8916 i = 0;
8917 for (g1 = bl->giv; g1; g1 = g1->next_iv)
8918 if (!g1->ignore)
8919 giv_array[i++] = g1;
8921 stats = xcalloc (giv_count, sizeof (*stats));
8922 can_combine = xcalloc (giv_count, giv_count * sizeof (rtx));
8924 for (i = 0; i < giv_count; i++)
8926 int this_benefit;
8927 rtx single_use;
8929 g1 = giv_array[i];
8930 stats[i].giv_number = i;
8932 /* If a DEST_REG GIV is used only once, do not allow it to combine
8933 with anything, for in doing so we will gain nothing that cannot
8934 be had by simply letting the GIV with which we would have combined
8935 to be reduced on its own. The lossage shows up in particular with
8936 DEST_ADDR targets on hosts with reg+reg addressing, though it can
8937 be seen elsewhere as well. */
8938 if (g1->giv_type == DEST_REG
8939 && (single_use = regs->array[REGNO (g1->dest_reg)].single_usage)
8940 && single_use != const0_rtx)
8941 continue;
8943 this_benefit = g1->benefit;
8944 /* Add an additional weight for zero addends. */
8945 if (g1->no_const_addval)
8946 this_benefit += 1;
8948 for (j = 0; j < giv_count; j++)
8950 rtx this_combine;
8952 g2 = giv_array[j];
8953 if (g1 != g2
8954 && (this_combine = combine_givs_p (g1, g2)) != NULL_RTX)
8956 can_combine[i * giv_count + j] = this_combine;
8957 this_benefit += g2->benefit + extra_benefit;
8960 stats[i].total_benefit = this_benefit;
8963 /* Iterate, combining until we can't. */
8964 restart:
8965 qsort (stats, giv_count, sizeof (*stats), cmp_combine_givs_stats);
8967 if (loop_dump_stream)
8969 fprintf (loop_dump_stream, "Sorted combine statistics:\n");
8970 for (k = 0; k < giv_count; k++)
8972 g1 = giv_array[stats[k].giv_number];
8973 if (!g1->combined_with && !g1->same)
8974 fprintf (loop_dump_stream, " {%d, %d}",
8975 INSN_UID (giv_array[stats[k].giv_number]->insn),
8976 stats[k].total_benefit);
8978 putc ('\n', loop_dump_stream);
8981 for (k = 0; k < giv_count; k++)
8983 int g1_add_benefit = 0;
8985 i = stats[k].giv_number;
8986 g1 = giv_array[i];
8988 /* If it has already been combined, skip. */
8989 if (g1->combined_with || g1->same)
8990 continue;
8992 for (j = 0; j < giv_count; j++)
8994 g2 = giv_array[j];
8995 if (g1 != g2 && can_combine[i * giv_count + j]
8996 /* If it has already been combined, skip. */
8997 && ! g2->same && ! g2->combined_with)
8999 int l;
9001 g2->new_reg = can_combine[i * giv_count + j];
9002 g2->same = g1;
9003 /* For destination, we now may replace by mem expression instead
9004 of register. This changes the costs considerably, so add the
9005 compensation. */
9006 if (g2->giv_type == DEST_ADDR)
9007 g2->benefit = (g2->benefit + reg_address_cost
9008 - address_cost (g2->new_reg,
9009 GET_MODE (g2->mem)));
9010 g1->combined_with++;
9011 g1->lifetime += g2->lifetime;
9013 g1_add_benefit += g2->benefit;
9015 /* ??? The new final_[bg]iv_value code does a much better job
9016 of finding replaceable giv's, and hence this code may no
9017 longer be necessary. */
9018 if (! g2->replaceable && REG_USERVAR_P (g2->dest_reg))
9019 g1_add_benefit -= copy_cost;
9021 /* To help optimize the next set of combinations, remove
9022 this giv from the benefits of other potential mates. */
9023 for (l = 0; l < giv_count; ++l)
9025 int m = stats[l].giv_number;
9026 if (can_combine[m * giv_count + j])
9027 stats[l].total_benefit -= g2->benefit + extra_benefit;
9030 if (loop_dump_stream)
9031 fprintf (loop_dump_stream,
9032 "giv at %d combined with giv at %d; new benefit %d + %d, lifetime %d\n",
9033 INSN_UID (g2->insn), INSN_UID (g1->insn),
9034 g1->benefit, g1_add_benefit, g1->lifetime);
9038 /* To help optimize the next set of combinations, remove
9039 this giv from the benefits of other potential mates. */
9040 if (g1->combined_with)
9042 for (j = 0; j < giv_count; ++j)
9044 int m = stats[j].giv_number;
9045 if (can_combine[m * giv_count + i])
9046 stats[j].total_benefit -= g1->benefit + extra_benefit;
9049 g1->benefit += g1_add_benefit;
9051 /* We've finished with this giv, and everything it touched.
9052 Restart the combination so that proper weights for the
9053 rest of the givs are properly taken into account. */
9054 /* ??? Ideally we would compact the arrays at this point, so
9055 as to not cover old ground. But sanely compacting
9056 can_combine is tricky. */
9057 goto restart;
9061 /* Clean up. */
9062 free (stats);
9063 free (can_combine);
9066 /* Generate sequence for REG = B * M + A. B is the initial value of
9067 the basic induction variable, M a multiplicative constant, A an
9068 additive constant and REG the destination register. */
9070 static rtx
9071 gen_add_mult (rtx b, rtx m, rtx a, rtx reg)
9073 rtx seq;
9074 rtx result;
9076 start_sequence ();
9077 /* Use unsigned arithmetic. */
9078 result = expand_mult_add (b, reg, m, a, GET_MODE (reg), 1);
9079 if (reg != result)
9080 emit_move_insn (reg, result);
9081 seq = get_insns ();
9082 end_sequence ();
9084 return seq;
9088 /* Update registers created in insn sequence SEQ. */
9090 static void
9091 loop_regs_update (const struct loop *loop ATTRIBUTE_UNUSED, rtx seq)
9093 rtx insn;
9095 /* Update register info for alias analysis. */
9097 insn = seq;
9098 while (insn != NULL_RTX)
9100 rtx set = single_set (insn);
9102 if (set && REG_P (SET_DEST (set)))
9103 record_base_value (REGNO (SET_DEST (set)), SET_SRC (set), 0);
9105 insn = NEXT_INSN (insn);
9110 /* Emit code before BEFORE_BB/BEFORE_INSN to set REG = B * M + A. B
9111 is the initial value of the basic induction variable, M a
9112 multiplicative constant, A an additive constant and REG the
9113 destination register. */
9115 static void
9116 loop_iv_add_mult_emit_before (const struct loop *loop, rtx b, rtx m, rtx a,
9117 rtx reg, basic_block before_bb, rtx before_insn)
9119 rtx seq;
9121 if (! before_insn)
9123 loop_iv_add_mult_hoist (loop, b, m, a, reg);
9124 return;
9127 /* Use copy_rtx to prevent unexpected sharing of these rtx. */
9128 seq = gen_add_mult (copy_rtx (b), copy_rtx (m), copy_rtx (a), reg);
9130 /* Increase the lifetime of any invariants moved further in code. */
9131 update_reg_last_use (a, before_insn);
9132 update_reg_last_use (b, before_insn);
9133 update_reg_last_use (m, before_insn);
9135 /* It is possible that the expansion created lots of new registers.
9136 Iterate over the sequence we just created and record them all. We
9137 must do this before inserting the sequence. */
9138 loop_regs_update (loop, seq);
9140 loop_insn_emit_before (loop, before_bb, before_insn, seq);
9144 /* Emit insns at the loop's sink (reached when the loop exits) to set
9145 REG = B * M + A. B is the initial value of the basic induction
9146 variable, M a multiplicative constant, A an additive constant and
9147 REG the destination register. */
9149 static void
9150 loop_iv_add_mult_sink (const struct loop *loop, rtx b, rtx m, rtx a, rtx reg)
9152 rtx seq;
9154 /* Use copy_rtx to prevent unexpected sharing of these rtx. */
9155 seq = gen_add_mult (copy_rtx (b), copy_rtx (m), copy_rtx (a), reg);
9157 /* Increase the lifetime of any invariants moved further in code.
9158 ??? Is this really necessary? */
9159 update_reg_last_use (a, loop->sink);
9160 update_reg_last_use (b, loop->sink);
9161 update_reg_last_use (m, loop->sink);
9163 /* It is possible that the expansion created lots of new registers.
9164 Iterate over the sequence we just created and record them all. We
9165 must do this before inserting the sequence. */
9166 loop_regs_update (loop, seq);
9168 loop_insn_sink (loop, seq);
9172 /* Emit insns in the loop pre-header to set REG = B * M + A. B is the
9173 initial value of the basic induction variable, M a multiplicative
9174 constant, A an additive constant and REG the destination register. */
9176 static void
9177 loop_iv_add_mult_hoist (const struct loop *loop, rtx b, rtx m, rtx a, rtx reg)
9179 rtx seq;
9181 /* Use copy_rtx to prevent unexpected sharing of these rtx. */
9182 seq = gen_add_mult (copy_rtx (b), copy_rtx (m), copy_rtx (a), reg);
9184 /* It is possible that the expansion created lots of new registers.
9185 Iterate over the sequence we just created and record them all. We
9186 must do this before inserting the sequence. */
9187 loop_regs_update (loop, seq);
9189 loop_insn_hoist (loop, seq);
9194 /* Similar to gen_add_mult, but compute cost rather than generating
9195 sequence. */
9197 static int
9198 iv_add_mult_cost (rtx b, rtx m, rtx a, rtx reg)
9200 int cost = 0;
9201 rtx last, result;
9203 start_sequence ();
9204 result = expand_mult_add (b, reg, m, a, GET_MODE (reg), 1);
9205 if (reg != result)
9206 emit_move_insn (reg, result);
9207 last = get_last_insn ();
9208 while (last)
9210 rtx t = single_set (last);
9211 if (t)
9212 cost += rtx_cost (SET_SRC (t), SET);
9213 last = PREV_INSN (last);
9215 end_sequence ();
9216 return cost;
9219 /* Test whether A * B can be computed without
9220 an actual multiply insn. Value is 1 if so.
9222 ??? This function stinks because it generates a ton of wasted RTL
9223 ??? and as a result fragments GC memory to no end. There are other
9224 ??? places in the compiler which are invoked a lot and do the same
9225 ??? thing, generate wasted RTL just to see if something is possible. */
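/* As an illustration (not tied to any particular target): a multiply
   by the constant 5 usually expands to a short shift/add sequence,

	t = a << 2;
	t = t + a;

   which contains no MULT and stays within the three-insn limit checked
   below, so (a, 5) would be considered cheap.  A multiply by a large
   "awkward" constant typically still needs a real multiply insn or a
   long sequence, and we return 0 for it.  */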
9227 static int
9228 product_cheap_p (rtx a, rtx b)
9230 rtx tmp;
9231 int win, n_insns;
9233 /* If only one is constant, make it B. */
9234 if (GET_CODE (a) == CONST_INT)
9235 tmp = a, a = b, b = tmp;
9237 /* If the first is constant, both are constant, so we don't need a multiply. */
9238 if (GET_CODE (a) == CONST_INT)
9239 return 1;
9241 /* If the second is not constant, neither is, so we would need a multiply. */
9242 if (GET_CODE (b) != CONST_INT)
9243 return 0;
9245 /* One operand is constant, so might not need multiply insn. Generate the
9246 code for the multiply and see if a call or multiply, or long sequence
9247 of insns is generated. */
9249 start_sequence ();
9250 expand_mult (GET_MODE (a), a, b, NULL_RTX, 1);
9251 tmp = get_insns ();
9252 end_sequence ();
9254 win = 1;
9255 if (tmp == NULL_RTX)
9257 else if (INSN_P (tmp))
9259 n_insns = 0;
9260 while (tmp != NULL_RTX)
9262 rtx next = NEXT_INSN (tmp);
9264 if (++n_insns > 3
9265 || !NONJUMP_INSN_P (tmp)
9266 || (GET_CODE (PATTERN (tmp)) == SET
9267 && GET_CODE (SET_SRC (PATTERN (tmp))) == MULT)
9268 || (GET_CODE (PATTERN (tmp)) == PARALLEL
9269 && GET_CODE (XVECEXP (PATTERN (tmp), 0, 0)) == SET
9270 && GET_CODE (SET_SRC (XVECEXP (PATTERN (tmp), 0, 0))) == MULT))
9272 win = 0;
9273 break;
9276 tmp = next;
9279 else if (GET_CODE (tmp) == SET
9280 && GET_CODE (SET_SRC (tmp)) == MULT)
9281 win = 0;
9282 else if (GET_CODE (tmp) == PARALLEL
9283 && GET_CODE (XVECEXP (tmp, 0, 0)) == SET
9284 && GET_CODE (SET_SRC (XVECEXP (tmp, 0, 0))) == MULT)
9285 win = 0;
9287 return win;
9290 /* Check to see if loop can be terminated by a "decrement and branch until
9291 zero" instruction. If so, add a REG_NONNEG note to the branch insn if so.
9292 Also try reversing an increment loop to a decrement loop
9293 to see if the optimization can be performed.
9294 Value is nonzero if optimization was performed. */
9296 /* This is useful even if the architecture doesn't have such an insn,
9297 because it might change a loop which increments from 0 to n to a loop
9298 which decrements from n to 0. A loop that decrements to zero is usually
9299 faster than one that increments from zero. */
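/* As a source-level sketch of the transformation (illustrative, not
   RTL): when the induction variable is used only to count iterations,

	for (i = 0; i < n; i++)
	  body ();

   in effect becomes

	for (i = n; --i >= 0; )
	  body ();

   so the exit test compares against zero and can be implemented by a
   single decrement-and-branch instruction where one exists.  */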
9301 /* ??? This could be rewritten to use some of the loop unrolling procedures,
9302 such as approx_final_value, biv_total_increment, loop_iterations, and
9303 final_[bg]iv_value. */
9305 static int
9306 check_dbra_loop (struct loop *loop, int insn_count)
9308 struct loop_info *loop_info = LOOP_INFO (loop);
9309 struct loop_regs *regs = LOOP_REGS (loop);
9310 struct loop_ivs *ivs = LOOP_IVS (loop);
9311 struct iv_class *bl;
9312 rtx reg;
9313 enum machine_mode mode;
9314 rtx jump_label;
9315 rtx final_value;
9316 rtx start_value;
9317 rtx new_add_val;
9318 rtx comparison;
9319 rtx before_comparison;
9320 rtx p;
9321 rtx jump;
9322 rtx first_compare;
9323 int compare_and_branch;
9324 rtx loop_start = loop->start;
9325 rtx loop_end = loop->end;
9327 /* If last insn is a conditional branch, and the insn before tests a
9328 register value, try to optimize it. Otherwise, we can't do anything. */
9330 jump = PREV_INSN (loop_end);
9331 comparison = get_condition_for_loop (loop, jump);
9332 if (comparison == 0)
9333 return 0;
9334 if (!onlyjump_p (jump))
9335 return 0;
9337 /* Try to compute whether the compare/branch at the loop end is one or
9338 two instructions. */
9339 get_condition (jump, &first_compare, false, true);
9340 if (first_compare == jump)
9341 compare_and_branch = 1;
9342 else if (first_compare == prev_nonnote_insn (jump))
9343 compare_and_branch = 2;
9344 else
9345 return 0;
9348 /* If more than one condition is present to control the loop, then
9349 do not proceed, as this function does not know how to rewrite
9350 loop tests with more than one condition.
9352 Look backwards from the first insn in the last comparison
9353 sequence and see if we've got another comparison sequence. */
9355 rtx jump1;
9356 if ((jump1 = prev_nonnote_insn (first_compare))
9357 && JUMP_P (jump1))
9358 return 0;
9361 /* Check all of the bivs to see if the compare uses one of them.
9362 Skip biv's set more than once because we can't guarantee that
9363 it will be zero on the last iteration. Also skip if the biv is
9364 used between its update and the test insn. */
9366 for (bl = ivs->list; bl; bl = bl->next)
9368 if (bl->biv_count == 1
9369 && ! bl->biv->maybe_multiple
9370 && bl->biv->dest_reg == XEXP (comparison, 0)
9371 && ! reg_used_between_p (regno_reg_rtx[bl->regno], bl->biv->insn,
9372 first_compare))
9373 break;
9376 /* Try swapping the comparison to identify a suitable biv. */
9377 if (!bl)
9378 for (bl = ivs->list; bl; bl = bl->next)
9379 if (bl->biv_count == 1
9380 && ! bl->biv->maybe_multiple
9381 && bl->biv->dest_reg == XEXP (comparison, 1)
9382 && ! reg_used_between_p (regno_reg_rtx[bl->regno], bl->biv->insn,
9383 first_compare))
9385 comparison = gen_rtx_fmt_ee (swap_condition (GET_CODE (comparison)),
9386 VOIDmode,
9387 XEXP (comparison, 1),
9388 XEXP (comparison, 0));
9389 break;
9392 if (! bl)
9393 return 0;
9395 /* Look for the case where the basic induction variable is always
9396 nonnegative, and equals zero on the last iteration.
9397 In this case, add a reg_note REG_NONNEG, which allows the
9398 m68k DBRA instruction to be used. */
9400 if (((GET_CODE (comparison) == GT && XEXP (comparison, 1) == constm1_rtx)
9401 || (GET_CODE (comparison) == NE && XEXP (comparison, 1) == const0_rtx))
9402 && GET_CODE (bl->biv->add_val) == CONST_INT
9403 && INTVAL (bl->biv->add_val) < 0)
9405 /* Initial value must be greater than 0,
9406 init_val % -dec_value == 0 to ensure that it equals zero on
9407 the last iteration. */
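/* Worked example (hypothetical numbers): with initial value 12 and
   add_val -4, the biv takes the values 12, 8, 4, 0, so it stays
   nonnegative and is exactly zero when the exit test finally fails;
   12 % 4 == 0 is what guarantees that zero is hit rather than
   stepped over.  */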
9409 if (GET_CODE (bl->initial_value) == CONST_INT
9410 && INTVAL (bl->initial_value) > 0
9411 && (INTVAL (bl->initial_value)
9412 % (-INTVAL (bl->biv->add_val))) == 0)
9414 /* Register always nonnegative, add REG_NOTE to branch. */
9415 if (! find_reg_note (jump, REG_NONNEG, NULL_RTX))
9416 REG_NOTES (jump)
9417 = gen_rtx_EXPR_LIST (REG_NONNEG, bl->biv->dest_reg,
9418 REG_NOTES (jump));
9419 bl->nonneg = 1;
9421 return 1;
9424 /* If the decrement is 1 and the value was tested as >= 0 before
9425 the loop, then we can safely optimize. */
9426 for (p = loop_start; p; p = PREV_INSN (p))
9428 if (LABEL_P (p))
9429 break;
9430 if (!JUMP_P (p))
9431 continue;
9433 before_comparison = get_condition_for_loop (loop, p);
9434 if (before_comparison
9435 && XEXP (before_comparison, 0) == bl->biv->dest_reg
9436 && (GET_CODE (before_comparison) == LT
9437 || GET_CODE (before_comparison) == LTU)
9438 && XEXP (before_comparison, 1) == const0_rtx
9439 && ! reg_set_between_p (bl->biv->dest_reg, p, loop_start)
9440 && INTVAL (bl->biv->add_val) == -1)
9442 if (! find_reg_note (jump, REG_NONNEG, NULL_RTX))
9443 REG_NOTES (jump)
9444 = gen_rtx_EXPR_LIST (REG_NONNEG, bl->biv->dest_reg,
9445 REG_NOTES (jump));
9446 bl->nonneg = 1;
9448 return 1;
9452 else if (GET_CODE (bl->biv->add_val) == CONST_INT
9453 && INTVAL (bl->biv->add_val) > 0)
9455 /* Try to change the increment to a decrement, so we can apply the above optimization. */
9456 /* Can do this if:
9457 all registers modified are induction variables or invariant,
9458 all memory references have non-overlapping addresses
9459 (obviously true if only one write),
9460 and we allow 2 insns for the compare/jump at the end of the loop. */
9461 /* Also, we must avoid any instructions which use both the reversed
9462 biv and another biv. Such instructions will fail if the loop is
9463 reversed. We meet this condition by requiring that either
9464 no_use_except_counting is true, or else that there is only
9465 one biv. */
9466 int num_nonfixed_reads = 0;
9467 /* 1 if the iteration var is used only to count iterations. */
9468 int no_use_except_counting = 0;
9469 /* 1 if the loop has no memory store, or it has a single memory store
9470 which is reversible. */
9471 int reversible_mem_store = 1;
9473 if (bl->giv_count == 0
9474 && !loop->exit_count
9475 && !loop_info->has_multiple_exit_targets)
9477 rtx bivreg = regno_reg_rtx[bl->regno];
9478 struct iv_class *blt;
9480 /* If there are no givs for this biv, and the only exit is the
9481 fall through at the end of the loop, then
9482 see if perhaps there are no uses except to count. */
9483 no_use_except_counting = 1;
9484 for (p = loop_start; p != loop_end; p = NEXT_INSN (p))
9485 if (INSN_P (p))
9487 rtx set = single_set (p);
9489 if (set && REG_P (SET_DEST (set))
9490 && REGNO (SET_DEST (set)) == bl->regno)
9491 /* An insn that sets the biv is okay. */
9493 else if (!reg_mentioned_p (bivreg, PATTERN (p)))
9494 /* An insn that doesn't mention the biv is okay. */
9496 else if (p == prev_nonnote_insn (prev_nonnote_insn (loop_end))
9497 || p == prev_nonnote_insn (loop_end))
9499 /* If either of these insns uses the biv and sets a pseudo
9500 that has more than one usage, then the biv has uses
9501 other than counting since it's used to derive a value
9502 that is used more than one time. */
9503 note_stores (PATTERN (p), note_set_pseudo_multiple_uses,
9504 regs);
9505 if (regs->multiple_uses)
9507 no_use_except_counting = 0;
9508 break;
9511 else
9513 no_use_except_counting = 0;
9514 break;
9518 /* A biv has uses besides counting if it is used to set
9519 another biv. */
9520 for (blt = ivs->list; blt; blt = blt->next)
9521 if (blt->init_set
9522 && reg_mentioned_p (bivreg, SET_SRC (blt->init_set)))
9524 no_use_except_counting = 0;
9525 break;
9529 if (no_use_except_counting)
9530 /* No need to worry about MEMs. */
9532 else if (loop_info->num_mem_sets <= 1)
9534 for (p = loop_start; p != loop_end; p = NEXT_INSN (p))
9535 if (INSN_P (p))
9536 num_nonfixed_reads += count_nonfixed_reads (loop, PATTERN (p));
9538 /* If the loop has a single store, and the destination address is
9539 invariant, then we can't reverse the loop, because this address
9540 might then have the wrong value at loop exit.
9541 This would work if the source were also invariant; however, in that
9542 case, the insn should have been moved out of the loop. */
9544 if (loop_info->num_mem_sets == 1)
9546 struct induction *v;
9548 /* If we could prove that each of the memory locations
9549 written to was different, then we could reverse the
9550 store -- but we don't presently have any way of
9551 knowing that. */
9552 reversible_mem_store = 0;
9554 /* If the store depends on a register that is set after the
9555 store, it depends on the initial value, and is thus not
9556 reversible. */
9557 for (v = bl->giv; reversible_mem_store && v; v = v->next_iv)
9559 if (v->giv_type == DEST_REG
9560 && reg_mentioned_p (v->dest_reg,
9561 PATTERN (loop_info->first_loop_store_insn))
9562 && loop_insn_first_p (loop_info->first_loop_store_insn,
9563 v->insn))
9564 reversible_mem_store = 0;
9568 else
9569 return 0;
9571 /* This code only acts for innermost loops. Also it simplifies
9572 the memory address check by only reversing loops with
9573 zero or one memory access.
9574 Two memory accesses could involve parts of the same array,
9575 and that can't be reversed.
9576 If the biv is used only for counting, then we don't need to worry
9577 about all these things. */
9579 if ((num_nonfixed_reads <= 1
9580 && ! loop_info->has_nonconst_call
9581 && ! loop_info->has_prefetch
9582 && ! loop_info->has_volatile
9583 && reversible_mem_store
9584 && (bl->giv_count + bl->biv_count + loop_info->num_mem_sets
9585 + num_unmoved_movables (loop) + compare_and_branch == insn_count)
9586 && (bl == ivs->list && bl->next == 0))
9587 || (no_use_except_counting && ! loop_info->has_prefetch))
9589 rtx tem;
9591 /* Loop can be reversed. */
9592 if (loop_dump_stream)
9593 fprintf (loop_dump_stream, "Can reverse loop\n");
9595 /* Now check other conditions:
9597 The increment must be a constant, as must the initial value,
9598 and the comparison code must be LT.
9600 This test can probably be improved since +/- 1 in the constant
9601 can be obtained by changing LT to LE and vice versa; this is
9602 confusing. */
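/* E.g. (illustrative): with an increment of 1, "i <= 9" bounds the
   same iteration count as "i < 10", which is why LE is acceptable
   here when the biv is only a counter; the add_adjust fixup below
   accounts for the off-by-one.  */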
9604 if (comparison
9605 /* for constants, LE gets turned into LT */
9606 && (GET_CODE (comparison) == LT
9607 || (GET_CODE (comparison) == LE
9608 && no_use_except_counting)
9609 || GET_CODE (comparison) == LTU))
9611 HOST_WIDE_INT add_val, add_adjust, comparison_val = 0;
9612 rtx initial_value, comparison_value;
9613 int nonneg = 0;
9614 enum rtx_code cmp_code;
9615 int comparison_const_width;
9616 unsigned HOST_WIDE_INT comparison_sign_mask;
9617 bool keep_first_compare;
9619 add_val = INTVAL (bl->biv->add_val);
9620 comparison_value = XEXP (comparison, 1);
9621 if (GET_MODE (comparison_value) == VOIDmode)
9622 comparison_const_width
9623 = GET_MODE_BITSIZE (GET_MODE (XEXP (comparison, 0)));
9624 else
9625 comparison_const_width
9626 = GET_MODE_BITSIZE (GET_MODE (comparison_value));
9627 if (comparison_const_width > HOST_BITS_PER_WIDE_INT)
9628 comparison_const_width = HOST_BITS_PER_WIDE_INT;
9629 comparison_sign_mask
9630 = (unsigned HOST_WIDE_INT) 1 << (comparison_const_width - 1);
9632 /* If the comparison value is not a loop invariant, then we
9633 can not reverse this loop.
9635 ??? If the insns which initialize the comparison value as
9636 a whole compute an invariant result, then we could move
9637 them out of the loop and proceed with loop reversal. */
9638 if (! loop_invariant_p (loop, comparison_value))
9639 return 0;
9641 if (GET_CODE (comparison_value) == CONST_INT)
9642 comparison_val = INTVAL (comparison_value);
9643 initial_value = bl->initial_value;
9645 /* Normalize the initial value if it is an integer and
9646 has no other use except as a counter. This will allow
9647 a few more loops to be reversed. */
9648 if (no_use_except_counting
9649 && GET_CODE (comparison_value) == CONST_INT
9650 && GET_CODE (initial_value) == CONST_INT)
9652 comparison_val = comparison_val - INTVAL (bl->initial_value);
9653 /* The code below requires comparison_val to be a multiple
9654 of add_val in order to do the loop reversal, so
9655 round up comparison_val to a multiple of add_val.
9656 Since comparison_value is constant, we know that the
9657 current comparison code is LT. */
9658 comparison_val = comparison_val + add_val - 1;
9659 comparison_val
9660 -= (unsigned HOST_WIDE_INT) comparison_val % add_val;
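/* Worked example (hypothetical numbers): initial value 3, comparison
   value 10, add_val 2.  comparison_val becomes 10 - 3 = 7 and is then
   rounded up to a multiple of add_val: 7 + 2 - 1 = 8, 8 - 8 % 2 = 8.
   The loop is treated as running from 0 to 8 by 2, preserving the
   original iteration count of 4 (i = 3, 5, 7, 9).  */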
9661 /* We postpone overflow checks for COMPARISON_VAL here;
9662 even if there is an overflow, we might still be able to
9663 reverse the loop, if converting the loop exit test to
9664 NE is possible. */
9665 initial_value = const0_rtx;
9668 /* First check if we can do a vanilla loop reversal. */
9669 if (initial_value == const0_rtx
9670 && GET_CODE (comparison_value) == CONST_INT
9671 /* Now do postponed overflow checks on COMPARISON_VAL. */
9672 && ! (((comparison_val - add_val) ^ INTVAL (comparison_value))
9673 & comparison_sign_mask))
9675 /* Register will always be nonnegative, with value
9676 0 on last iteration */
9677 add_adjust = add_val;
9678 nonneg = 1;
9679 cmp_code = GE;
9681 else
9682 return 0;
9684 if (GET_CODE (comparison) == LE)
9685 add_adjust -= add_val;
9687 /* If the initial value is not zero, or if the comparison
9688 value is not an exact multiple of the increment, then we
9689 can not reverse this loop. */
9690 if (initial_value == const0_rtx
9691 && GET_CODE (comparison_value) == CONST_INT)
9693 if (((unsigned HOST_WIDE_INT) comparison_val % add_val) != 0)
9694 return 0;
9696 else
9698 if (! no_use_except_counting || add_val != 1)
9699 return 0;
9702 final_value = comparison_value;
9704 /* Reset these in case we normalized the initial value
9705 and comparison value above. */
9706 if (GET_CODE (comparison_value) == CONST_INT
9707 && GET_CODE (initial_value) == CONST_INT)
9709 comparison_value = GEN_INT (comparison_val);
9710 final_value
9711 = GEN_INT (comparison_val + INTVAL (bl->initial_value));
9713 bl->initial_value = initial_value;
9715 /* Save some info needed to produce the new insns. */
9716 reg = bl->biv->dest_reg;
9717 mode = GET_MODE (reg);
9718 jump_label = condjump_label (PREV_INSN (loop_end));
9719 new_add_val = GEN_INT (-INTVAL (bl->biv->add_val));
9721 /* Set start_value; if this is not a CONST_INT, we need
9722 to generate a SUB.
9723 Initialize biv to start_value before loop start.
9724 The old initializing insn will be deleted as a
9725 dead store by flow.c. */
9726 if (initial_value == const0_rtx
9727 && GET_CODE (comparison_value) == CONST_INT)
9729 start_value
9730 = gen_int_mode (comparison_val - add_adjust, mode);
9731 loop_insn_hoist (loop, gen_move_insn (reg, start_value));
9733 else if (GET_CODE (initial_value) == CONST_INT)
9735 rtx offset = GEN_INT (-INTVAL (initial_value) - add_adjust);
9736 rtx add_insn = gen_add3_insn (reg, comparison_value, offset);
9738 if (add_insn == 0)
9739 return 0;
9741 start_value
9742 = gen_rtx_PLUS (mode, comparison_value, offset);
9743 loop_insn_hoist (loop, add_insn);
9744 if (GET_CODE (comparison) == LE)
9745 final_value = gen_rtx_PLUS (mode, comparison_value,
9746 GEN_INT (add_val));
9748 else if (! add_adjust)
9750 rtx sub_insn = gen_sub3_insn (reg, comparison_value,
9751 initial_value);
9753 if (sub_insn == 0)
9754 return 0;
9755 start_value
9756 = gen_rtx_MINUS (mode, comparison_value, initial_value);
9757 loop_insn_hoist (loop, sub_insn);
9759 else
9760 /* We could handle the other cases too, but it'll be
9761 better to have a testcase first. */
9762 return 0;
9764 /* We may not have a single insn which can increment a reg, so
9765 create a sequence to hold all the insns from expand_inc. */
9766 start_sequence ();
9767 expand_inc (reg, new_add_val);
9768 tem = get_insns ();
9769 end_sequence ();
9771 p = loop_insn_emit_before (loop, 0, bl->biv->insn, tem);
9772 delete_insn (bl->biv->insn);
9774 /* Update biv info to reflect its new status. */
9775 bl->biv->insn = p;
9776 bl->initial_value = start_value;
9777 bl->biv->add_val = new_add_val;
9779 /* Update loop info. */
9780 loop_info->initial_value = reg;
9781 loop_info->initial_equiv_value = reg;
9782 loop_info->final_value = const0_rtx;
9783 loop_info->final_equiv_value = const0_rtx;
9784 loop_info->comparison_value = const0_rtx;
9785 loop_info->comparison_code = cmp_code;
9786 loop_info->increment = new_add_val;
9788 /* Inc LABEL_NUSES so that delete_insn will
9789 not delete the label. */
9790 LABEL_NUSES (XEXP (jump_label, 0))++;
9792 /* If we have a separate comparison insn that does more
9793 than just set cc0, the result of the comparison might
9794 be used outside the loop. */
9795 keep_first_compare = (compare_and_branch == 2
9796 #ifdef HAVE_CC0
9797 && sets_cc0_p (first_compare) <= 0
9798 #endif
9801 /* Emit an insn after the end of the loop to set the biv's
9802 proper exit value if it is used anywhere outside the loop. */
9803 if (keep_first_compare
9804 || (REGNO_LAST_UID (bl->regno) != INSN_UID (first_compare))
9805 || ! bl->init_insn
9806 || REGNO_FIRST_UID (bl->regno) != INSN_UID (bl->init_insn))
9807 loop_insn_sink (loop, gen_load_of_final_value (reg, final_value));
9809 if (keep_first_compare)
9810 loop_insn_sink (loop, PATTERN (first_compare));
9812 /* Delete compare/branch at end of loop. */
9813 delete_related_insns (PREV_INSN (loop_end));
9814 if (compare_and_branch == 2)
9815 delete_related_insns (first_compare);
9817 /* Add new compare/branch insn at end of loop. */
9818 start_sequence ();
9819 emit_cmp_and_jump_insns (reg, const0_rtx, cmp_code, NULL_RTX,
9820 mode, 0,
9821 XEXP (jump_label, 0));
9822 tem = get_insns ();
9823 end_sequence ();
9824 emit_jump_insn_before (tem, loop_end);
9826 for (tem = PREV_INSN (loop_end);
9827 tem && !JUMP_P (tem);
9828 tem = PREV_INSN (tem))
9831 if (tem)
9832 JUMP_LABEL (tem) = XEXP (jump_label, 0);
9834 if (nonneg)
9836 if (tem)
9838 /* Increment of LABEL_NUSES done above. */
9839 /* Register is now always nonnegative,
9840 so add REG_NONNEG note to the branch. */
9841 REG_NOTES (tem) = gen_rtx_EXPR_LIST (REG_NONNEG, reg,
9842 REG_NOTES (tem));
9844 bl->nonneg = 1;
9847 /* No insn may reference both the reversed and another biv or it
9848 will fail (see comment near the top of the loop reversal
9849 code).
9850 Earlier on, we have verified that the biv has no use except
9851 counting, or it is the only biv in this function.
9852 However, the code that computes no_use_except_counting does
9853 not verify reg notes. It's possible to have an insn that
9854 references another biv, and has a REG_EQUAL note with an
9855 expression based on the reversed biv. To avoid this case,
9856 remove all REG_EQUAL notes based on the reversed biv
9857 here. */
9858 for (p = loop_start; p != loop_end; p = NEXT_INSN (p))
9859 if (INSN_P (p))
9861 rtx *pnote;
9862 rtx set = single_set (p);
9863 /* If this is a set of a GIV based on the reversed biv, any
9864 REG_EQUAL notes should still be correct. */
9865 if (! set
9866 || !REG_P (SET_DEST (set))
9867 || (size_t) REGNO (SET_DEST (set)) >= ivs->n_regs
9868 || REG_IV_TYPE (ivs, REGNO (SET_DEST (set))) != GENERAL_INDUCT
9869 || REG_IV_INFO (ivs, REGNO (SET_DEST (set)))->src_reg != bl->biv->src_reg)
9870 for (pnote = &REG_NOTES (p); *pnote;)
9872 if (REG_NOTE_KIND (*pnote) == REG_EQUAL
9873 && reg_mentioned_p (regno_reg_rtx[bl->regno],
9874 XEXP (*pnote, 0)))
9875 *pnote = XEXP (*pnote, 1);
9876 else
9877 pnote = &XEXP (*pnote, 1);
9881 /* Mark that this biv has been reversed. Each giv which depends
9882 on this biv, and which is also live past the end of the loop
9883 will have to be fixed up. */
9885 bl->reversed = 1;
9887 if (loop_dump_stream)
9889 fprintf (loop_dump_stream, "Reversed loop");
9890 if (bl->nonneg)
9891 fprintf (loop_dump_stream, " and added reg_nonneg\n");
9892 else
9893 fprintf (loop_dump_stream, "\n");
9896 return 1;
9901 return 0;
9904 /* Verify whether the biv BL appears to be eliminable,
9905 based on the insns in the loop that refer to it.
9907 If ELIMINATE_P is nonzero, actually do the elimination.
9909 THRESHOLD and INSN_COUNT are from loop_optimize and are used to
9910 determine whether invariant insns should be placed inside or at the
9911 start of the loop. */
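/* Sketch of an eliminable biv (hypothetical loop): if the only uses
   of biv I inside the loop are its own increment and the exit test,
   and a giv P = BASE + 4*I has been strength-reduced, a test such as
   I < N can be rewritten as P < BASE + 4*N; the insns setting I then
   become dead and the biv disappears.  */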
9913 static int
9914 maybe_eliminate_biv (const struct loop *loop, struct iv_class *bl,
9915 int eliminate_p, int threshold, int insn_count)
9917 struct loop_ivs *ivs = LOOP_IVS (loop);
9918 rtx reg = bl->biv->dest_reg;
9919 rtx p;
9921 /* Scan all insns in the loop, stopping if we find one that uses the
9922 biv in a way that we cannot eliminate. */
9924 for (p = loop->start; p != loop->end; p = NEXT_INSN (p))
9926 enum rtx_code code = GET_CODE (p);
9927 basic_block where_bb = 0;
9928 rtx where_insn = threshold >= insn_count ? 0 : p;
9929 rtx note;
9931 /* If this is a libcall that sets a giv, skip ahead to its end. */
9932 if (INSN_P (p))
9934 note = find_reg_note (p, REG_LIBCALL, NULL_RTX);
9936 if (note)
9938 rtx last = XEXP (note, 0);
9939 rtx set = single_set (last);
9941 if (set && REG_P (SET_DEST (set)))
9943 unsigned int regno = REGNO (SET_DEST (set));
9945 if (regno < ivs->n_regs
9946 && REG_IV_TYPE (ivs, regno) == GENERAL_INDUCT
9947 && REG_IV_INFO (ivs, regno)->src_reg == bl->biv->src_reg)
9948 p = last;
9953 /* Closely examine the insn if the biv is mentioned. */
9954 if ((code == INSN || code == JUMP_INSN || code == CALL_INSN)
9955 && reg_mentioned_p (reg, PATTERN (p))
9956 && ! maybe_eliminate_biv_1 (loop, PATTERN (p), p, bl,
9957 eliminate_p, where_bb, where_insn))
9959 if (loop_dump_stream)
9960 fprintf (loop_dump_stream,
9961 "Cannot eliminate biv %d: biv used in insn %d.\n",
9962 bl->regno, INSN_UID (p));
9963 break;
9966 /* If we are eliminating, kill REG_EQUAL notes mentioning the biv. */
9967 if (eliminate_p
9968 && (note = find_reg_note (p, REG_EQUAL, NULL_RTX)) != NULL_RTX
9969 && reg_mentioned_p (reg, XEXP (note, 0)))
9970 remove_note (p, note);
9973 if (p == loop->end)
9975 if (loop_dump_stream)
9976 fprintf (loop_dump_stream, "biv %d %s eliminated.\n",
9977 bl->regno, eliminate_p ? "was" : "can be");
9978 return 1;
9981 return 0;
9984 /* INSN and REFERENCE are instructions in the same insn chain.
9985 Return nonzero if INSN is first. */
9987 static int
9988 loop_insn_first_p (rtx insn, rtx reference)
9990 rtx p, q;
9992 for (p = insn, q = reference;;)
9994 /* Start with test for not first so that INSN == REFERENCE yields not
9995 first. */
9996 if (q == insn || ! p)
9997 return 0;
9998 if (p == reference || ! q)
9999 return 1;
10001 /* Either of P or Q might be a NOTE. Notes have the same LUID as the
10002 previous insn, hence the <= comparison below does not work if
10003 P is a note. */
10004 if (INSN_UID (p) < max_uid_for_loop
10005 && INSN_UID (q) < max_uid_for_loop
10006 && !NOTE_P (p))
10007 return INSN_LUID (p) <= INSN_LUID (q);
10009 if (INSN_UID (p) >= max_uid_for_loop
10010 || NOTE_P (p))
10011 p = NEXT_INSN (p);
10012 if (INSN_UID (q) >= max_uid_for_loop)
10013 q = NEXT_INSN (q);
10017 /* We are trying to eliminate BIV in INSN using GIV. Return nonzero if
10018 the offset that we have to take into account due to auto-increment /
10019 giv derivation is zero. */
10020 static int
10021 biv_elimination_giv_has_0_offset (struct induction *biv,
10022 struct induction *giv, rtx insn)
10024 /* If the giv V had the auto-inc address optimization applied
10025 to it, and INSN occurs between the giv insn and the biv
10026 insn, then we'd have to adjust the value used here.
10027 This is rare, so we don't bother to make this possible. */
10028 if (giv->auto_inc_opt
10029 && ((loop_insn_first_p (giv->insn, insn)
10030 && loop_insn_first_p (insn, biv->insn))
10031 || (loop_insn_first_p (biv->insn, insn)
10032 && loop_insn_first_p (insn, giv->insn))))
10033 return 0;
10035 return 1;
10038 /* If BL appears in X (part of the pattern of INSN), see if we can
10039 eliminate its use. If so, return 1. If not, return 0.
10041 If the biv does not appear in X, return 1.
10043 If ELIMINATE_P is nonzero, actually do the elimination.
10044 WHERE_INSN/WHERE_BB indicate where extra insns should be added.
10045 Depending on how many items have been moved out of the loop, it
10046 will either be before INSN (when WHERE_INSN is nonzero) or at the
10047 start of the loop (when WHERE_INSN is zero). */
10049 static int
10050 maybe_eliminate_biv_1 (const struct loop *loop, rtx x, rtx insn,
10051 struct iv_class *bl, int eliminate_p,
10052 basic_block where_bb, rtx where_insn)
10054 enum rtx_code code = GET_CODE (x);
10055 rtx reg = bl->biv->dest_reg;
10056 enum machine_mode mode = GET_MODE (reg);
10057 struct induction *v;
10058 rtx arg, tem;
10059 #ifdef HAVE_cc0
10060 rtx new;
10061 #endif
10062 int arg_operand;
10063 const char *fmt;
10064 int i, j;
10066 switch (code)
10068 case REG:
10069 /* If we haven't already been able to do something with this BIV,
10070 we can't eliminate it. */
10071 if (x == reg)
10072 return 0;
10073 return 1;
10075 case SET:
10076 /* If this sets the BIV, it is not a problem. */
10077 if (SET_DEST (x) == reg)
10078 return 1;
10080 /* If this is an insn that defines a giv, it is also ok because
10081 it will go away when the giv is reduced. */
10082 for (v = bl->giv; v; v = v->next_iv)
10083 if (v->giv_type == DEST_REG && SET_DEST (x) == v->dest_reg)
10084 return 1;
10086 #ifdef HAVE_cc0
10087 if (SET_DEST (x) == cc0_rtx && SET_SRC (x) == reg)
10089 /* Can replace with any giv that was reduced and
10090 that has (MULT_VAL != 0) and (ADD_VAL == 0).
10091 Require a constant for MULT_VAL, so we know it's nonzero.
10092 ??? We disable this optimization to avoid potential
10093 overflows. */
10095 for (v = bl->giv; v; v = v->next_iv)
10096 if (GET_CODE (v->mult_val) == CONST_INT && v->mult_val != const0_rtx
10097 && v->add_val == const0_rtx
10098 && ! v->ignore && ! v->maybe_dead && v->always_computable
10099 && v->mode == mode
10100 && 0)
10102 if (! biv_elimination_giv_has_0_offset (bl->biv, v, insn))
10103 continue;
10105 if (! eliminate_p)
10106 return 1;
10108 /* If the giv has the opposite direction of change,
10109 then reverse the comparison. */
10110 if (INTVAL (v->mult_val) < 0)
10111 new = gen_rtx_COMPARE (GET_MODE (v->new_reg),
10112 const0_rtx, v->new_reg);
10113 else
10114 new = v->new_reg;
10116 /* We can probably test that giv's reduced reg. */
10117 if (validate_change (insn, &SET_SRC (x), new, 0))
10118 return 1;
10121 /* Look for a giv with (MULT_VAL != 0) and (ADD_VAL != 0);
10122 replace test insn with a compare insn (cmp REDUCED_GIV ADD_VAL).
10123 Require a constant for MULT_VAL, so we know it's nonzero.
10124 ??? Do this only if ADD_VAL is a pointer to avoid a potential
10125 overflow problem. */
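/* Rewrite sketch (assuming a reduced giv G = M*biv + ADD_VAL with
   constant M > 0): a cc0 test of the biv against zero,

	(set (cc0) (reg biv))

   becomes a comparison of the reduced register against the additive
   term,

	(set (cc0) (compare (reg G) ADD_VAL))

   since G - ADD_VAL = M*biv has the same sign as the biv; when M is
   negative the operands are swapped instead.  */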
10127 for (v = bl->giv; v; v = v->next_iv)
10128 if (GET_CODE (v->mult_val) == CONST_INT
10129 && v->mult_val != const0_rtx
10130 && ! v->ignore && ! v->maybe_dead && v->always_computable
10131 && v->mode == mode
10132 && (GET_CODE (v->add_val) == SYMBOL_REF
10133 || GET_CODE (v->add_val) == LABEL_REF
10134 || GET_CODE (v->add_val) == CONST
10135 || (REG_P (v->add_val)
10136 && REG_POINTER (v->add_val))))
10138 if (! biv_elimination_giv_has_0_offset (bl->biv, v, insn))
10139 continue;
10141 if (! eliminate_p)
10142 return 1;
10144 /* If the giv has the opposite direction of change,
10145 then reverse the comparison. */
10146 if (INTVAL (v->mult_val) < 0)
10147 new = gen_rtx_COMPARE (VOIDmode, copy_rtx (v->add_val),
10148 v->new_reg);
10149 else
10150 new = gen_rtx_COMPARE (VOIDmode, v->new_reg,
10151 copy_rtx (v->add_val));
10153 /* Replace biv with the giv's reduced register. */
10154 update_reg_last_use (v->add_val, insn);
10155 if (validate_change (insn, &SET_SRC (PATTERN (insn)), new, 0))
10156 return 1;
10158 /* Insn doesn't support that constant or invariant. Copy it
10159 into a register (it will be a loop invariant). */
10160 tem = gen_reg_rtx (GET_MODE (v->new_reg));
10162 loop_insn_emit_before (loop, 0, where_insn,
10163 gen_move_insn (tem,
10164 copy_rtx (v->add_val)));
10166 /* Substitute the new register for its invariant value in
10167 the compare expression. */
10168 XEXP (new, (INTVAL (v->mult_val) < 0) ? 0 : 1) = tem;
10169 if (validate_change (insn, &SET_SRC (PATTERN (insn)), new, 0))
10170 return 1;
10173 #endif
10174 break;
10176 case COMPARE:
10177 case EQ: case NE:
10178 case GT: case GE: case GTU: case GEU:
10179 case LT: case LE: case LTU: case LEU:
10180 /* See if either argument is the biv. */
10181 if (XEXP (x, 0) == reg)
10182 arg = XEXP (x, 1), arg_operand = 1;
10183 else if (XEXP (x, 1) == reg)
10184 arg = XEXP (x, 0), arg_operand = 0;
10185 else
10186 break;
10188 if (CONSTANT_P (arg))
10190 /* First try to replace with any giv that has constant positive
10191 mult_val and constant add_val. We might be able to support
10192 negative mult_val, but it seems complex to do it in general. */
10194 for (v = bl->giv; v; v = v->next_iv)
10195 if (GET_CODE (v->mult_val) == CONST_INT
10196 && INTVAL (v->mult_val) > 0
10197 && (GET_CODE (v->add_val) == SYMBOL_REF
10198 || GET_CODE (v->add_val) == LABEL_REF
10199 || GET_CODE (v->add_val) == CONST
10200 || (REG_P (v->add_val)
10201 && REG_POINTER (v->add_val)))
10202 && ! v->ignore && ! v->maybe_dead && v->always_computable
10203 && v->mode == mode)
10205 if (! biv_elimination_giv_has_0_offset (bl->biv, v, insn))
10206 continue;
10208 /* Don't eliminate if the linear combination that makes up
10209 the giv overflows when it is applied to ARG. */
10210 if (GET_CODE (arg) == CONST_INT)
10212 rtx add_val;
10214 if (GET_CODE (v->add_val) == CONST_INT)
10215 add_val = v->add_val;
10216 else
10217 add_val = const0_rtx;
10219 if (const_mult_add_overflow_p (arg, v->mult_val,
10220 add_val, mode, 1))
10221 continue;
10224 if (! eliminate_p)
10225 return 1;
10227 /* Replace biv with the giv's reduced reg. */
10228 validate_change (insn, &XEXP (x, 1 - arg_operand), v->new_reg, 1);
10230 /* If all constants are actually constant integers and
10231 the derived constant can be directly placed in the COMPARE,
10232 do so. */
10233 if (GET_CODE (arg) == CONST_INT
10234 && GET_CODE (v->add_val) == CONST_INT)
10236 tem = expand_mult_add (arg, NULL_RTX, v->mult_val,
10237 v->add_val, mode, 1);
10239 else
10241 /* Otherwise, load it into a register. */
10242 tem = gen_reg_rtx (mode);
10243 loop_iv_add_mult_emit_before (loop, arg,
10244 v->mult_val, v->add_val,
10245 tem, where_bb, where_insn);
10248 validate_change (insn, &XEXP (x, arg_operand), tem, 1);
10250 if (apply_change_group ())
10251 return 1;
10254 /* Look for giv with positive constant mult_val and nonconst add_val.
10255 Insert insns to calculate new compare value.
10256 ??? Turn this off due to possible overflow. */
10258 for (v = bl->giv; v; v = v->next_iv)
10259 if (GET_CODE (v->mult_val) == CONST_INT
10260 && INTVAL (v->mult_val) > 0
10261 && ! v->ignore && ! v->maybe_dead && v->always_computable
10262 && v->mode == mode
10263 && 0)
10265 rtx tem;
10267 if (! biv_elimination_giv_has_0_offset (bl->biv, v, insn))
10268 continue;
10270 if (! eliminate_p)
10271 return 1;
10273 tem = gen_reg_rtx (mode);
10275 /* Replace biv with giv's reduced register. */
10276 validate_change (insn, &XEXP (x, 1 - arg_operand),
10277 v->new_reg, 1);
10279 /* Compute value to compare against. */
10280 loop_iv_add_mult_emit_before (loop, arg,
10281 v->mult_val, v->add_val,
10282 tem, where_bb, where_insn);
10283 /* Use it in this insn. */
10284 validate_change (insn, &XEXP (x, arg_operand), tem, 1);
10285 if (apply_change_group ())
10286 return 1;
10289 else if (REG_P (arg) || MEM_P (arg))
10291 if (loop_invariant_p (loop, arg) == 1)
10293 /* Look for giv with constant positive mult_val and nonconst
10294 add_val. Insert insns to compute new compare value.
10295 ??? Turn this off due to possible overflow. */
10297 for (v = bl->giv; v; v = v->next_iv)
10298 if (GET_CODE (v->mult_val) == CONST_INT && INTVAL (v->mult_val) > 0
10299 && ! v->ignore && ! v->maybe_dead && v->always_computable
10300 && v->mode == mode
10301 && 0)
10303 rtx tem;
10305 if (! biv_elimination_giv_has_0_offset (bl->biv, v, insn))
10306 continue;
10308 if (! eliminate_p)
10309 return 1;
10311 tem = gen_reg_rtx (mode);
10313 /* Replace biv with giv's reduced register. */
10314 validate_change (insn, &XEXP (x, 1 - arg_operand),
10315 v->new_reg, 1);
10317 /* Compute value to compare against. */
10318 loop_iv_add_mult_emit_before (loop, arg,
10319 v->mult_val, v->add_val,
10320 tem, where_bb, where_insn);
10321 validate_change (insn, &XEXP (x, arg_operand), tem, 1);
10322 if (apply_change_group ())
10323 return 1;
10327 /* This code has problems. Basically, when deciding whether BL can
10328 be eliminated, you can't know whether a particular giv
10329 of ARG will be reduced. If it isn't going to be reduced,
10330 we can't eliminate BL. We can try forcing it to be reduced,
10331 but that can generate poor code.
10333 The problem is that the benefit of reducing TV, below, should
10334 be increased if BL can actually be eliminated, but this means
10335 we might have to do a topological sort of the order in which
10336 we try to process biv. It doesn't seem worthwhile to do
10337 this sort of thing now. */
10339 #if 0
10340 /* Otherwise the reg compared with had better be a biv. */
10341 if (!REG_P (arg)
10342 || REG_IV_TYPE (ivs, REGNO (arg)) != BASIC_INDUCT)
10343 return 0;
10345 /* Look for a pair of givs, one for each biv,
10346 with identical coefficients. */
10347 for (v = bl->giv; v; v = v->next_iv)
10349 struct induction *tv;
10351 if (v->ignore || v->maybe_dead || v->mode != mode)
10352 continue;
10354 for (tv = REG_IV_CLASS (ivs, REGNO (arg))->giv; tv;
10355 tv = tv->next_iv)
10356 if (! tv->ignore && ! tv->maybe_dead
10357 && rtx_equal_p (tv->mult_val, v->mult_val)
10358 && rtx_equal_p (tv->add_val, v->add_val)
10359 && tv->mode == mode)
10361 if (! biv_elimination_giv_has_0_offset (bl->biv, v, insn))
10362 continue;
10364 if (! eliminate_p)
10365 return 1;
10367 /* Replace biv with its giv's reduced reg. */
10368 XEXP (x, 1 - arg_operand) = v->new_reg;
10369 /* Replace other operand with the other giv's
10370 reduced reg. */
10371 XEXP (x, arg_operand) = tv->new_reg;
10372 return 1;
10375 #endif
10378 /* If we get here, the biv can't be eliminated. */
10379 return 0;
10381 case MEM:
10382 /* If this address is a DEST_ADDR giv, it doesn't matter if the
10383 biv is used in it, since it will be replaced. */
10384 for (v = bl->giv; v; v = v->next_iv)
10385 if (v->giv_type == DEST_ADDR && v->location == &XEXP (x, 0))
10386 return 1;
10387 break;
10389 default:
10390 break;
10393 /* See if any subexpression fails elimination. */
10394 fmt = GET_RTX_FORMAT (code);
10395 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
10397 switch (fmt[i])
10399 case 'e':
10400 if (! maybe_eliminate_biv_1 (loop, XEXP (x, i), insn, bl,
10401 eliminate_p, where_bb, where_insn))
10402 return 0;
10403 break;
10405 case 'E':
10406 for (j = XVECLEN (x, i) - 1; j >= 0; j--)
10407 if (! maybe_eliminate_biv_1 (loop, XVECEXP (x, i, j), insn, bl,
10408 eliminate_p, where_bb, where_insn))
10409 return 0;
10410 break;
10414 return 1;
10417 /* Return nonzero if the last use of REG
10418 is in an insn following INSN in the same basic block. */
10420 static int
10421 last_use_this_basic_block (rtx reg, rtx insn)
10423 rtx n;
10424 for (n = insn;
10425 n && !LABEL_P (n) && !JUMP_P (n);
10426 n = NEXT_INSN (n))
10428 if (REGNO_LAST_UID (REGNO (reg)) == INSN_UID (n))
10429 return 1;
10431 return 0;
10434 /* Called via `note_stores' to record the initial value of a biv. Here we
10435 just record the location of the set and process it later. */
10437 static void
10438 record_initial (rtx dest, rtx set, void *data ATTRIBUTE_UNUSED)
10440 struct loop_ivs *ivs = (struct loop_ivs *) data;
10441 struct iv_class *bl;
10443 if (!REG_P (dest)
10444 || REGNO (dest) >= ivs->n_regs
10445 || REG_IV_TYPE (ivs, REGNO (dest)) != BASIC_INDUCT)
10446 return;
10448 bl = REG_IV_CLASS (ivs, REGNO (dest));
10450 /* If this is the first set found, record it. */
10451 if (bl->init_insn == 0)
10453 bl->init_insn = note_insn;
10454 bl->init_set = set;
10458 /* If any of the registers in X are "old" and currently have a last use earlier
10459 than INSN, update them to have a last use of INSN. Their actual last use
10460 will be the previous insn but it will not have a valid uid_luid so we can't
10461 use it. X must be a source expression only. */
10463 static void
10464 update_reg_last_use (rtx x, rtx insn)
10466 /* Check for the case where INSN does not have a valid luid. In this case,
10467 there is no need to modify the regno_last_uid, as this can only happen
10468 when code is inserted after the loop_end to set a pseudo's final value,
10469 and hence this insn will never be the last use of x.
10470 ??? This comment is not correct. See for example loop_givs_reduce.
10471 This may insert an insn before another new insn. */
10472 if (REG_P (x) && REGNO (x) < max_reg_before_loop
10473 && INSN_UID (insn) < max_uid_for_loop
10474 && REGNO_LAST_LUID (REGNO (x)) < INSN_LUID (insn))
10476 REGNO_LAST_UID (REGNO (x)) = INSN_UID (insn);
10478 else
10480 int i, j;
10481 const char *fmt = GET_RTX_FORMAT (GET_CODE (x));
10482 for (i = GET_RTX_LENGTH (GET_CODE (x)) - 1; i >= 0; i--)
10484 if (fmt[i] == 'e')
10485 update_reg_last_use (XEXP (x, i), insn);
10486 else if (fmt[i] == 'E')
10487 for (j = XVECLEN (x, i) - 1; j >= 0; j--)
10488 update_reg_last_use (XVECEXP (x, i, j), insn);
10493 /* Similar to rtlanal.c:get_condition, except that we also put an
10494 invariant last unless both operands are invariants. */
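/* For instance (illustrative): a condition (lt (reg n) (reg biv))
   where (reg n) is loop-invariant and (reg biv) is not would be
   canonicalized to (gt (reg biv) (reg n)), so callers can rely on an
   invariant operand appearing second when only one side is
   invariant.  */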
10496 static rtx
10497 get_condition_for_loop (const struct loop *loop, rtx x)
10499 rtx comparison = get_condition (x, (rtx*) 0, false, true);
10501 if (comparison == 0
10502 || ! loop_invariant_p (loop, XEXP (comparison, 0))
10503 || loop_invariant_p (loop, XEXP (comparison, 1)))
10504 return comparison;
10506 return gen_rtx_fmt_ee (swap_condition (GET_CODE (comparison)), VOIDmode,
10507 XEXP (comparison, 1), XEXP (comparison, 0));
10510 /* Scan the function and determine whether it has indirect (computed) jumps.
10512 This is taken mostly from flow.c; similar code exists elsewhere
10513 in the compiler. It may be useful to put this into rtlanal.c. */
10514 static int
10515 indirect_jump_in_function_p (rtx start)
10517 rtx insn;
10519 for (insn = start; insn; insn = NEXT_INSN (insn))
10520 if (computed_jump_p (insn))
10521 return 1;
10523 return 0;
10526 /* Add MEM to the LOOP_MEMS array, if appropriate. See the
10527 documentation for LOOP_MEMS for the definition of `appropriate'.
10528 This function is called from prescan_loop via for_each_rtx. */
10530 static int
10531 insert_loop_mem (rtx *mem, void *data ATTRIBUTE_UNUSED)
10533 struct loop_info *loop_info = data;
10534 int i;
10535 rtx m = *mem;
10537 if (m == NULL_RTX)
10538 return 0;
10540 switch (GET_CODE (m))
10542 case MEM:
10543 break;
10545 case CLOBBER:
10546 /* We're not interested in MEMs that are only clobbered. */
10547 return -1;
10549 case CONST_DOUBLE:
10550 /* We're not interested in the MEM associated with a
10551 CONST_DOUBLE, so there's no need to traverse into this. */
10552 return -1;
10554 case EXPR_LIST:
10555 /* We're not interested in any MEMs that only appear in notes. */
10556 return -1;
10558 default:
10559 /* This is not a MEM. */
10560 return 0;
10563 /* See if we've already seen this MEM. */
10564 for (i = 0; i < loop_info->mems_idx; ++i)
10565 if (rtx_equal_p (m, loop_info->mems[i].mem))
10567 if (MEM_VOLATILE_P (m) && !MEM_VOLATILE_P (loop_info->mems[i].mem))
10568 loop_info->mems[i].mem = m;
10569 if (GET_MODE (m) != GET_MODE (loop_info->mems[i].mem))
10570 /* The modes of the two memory accesses are different. If
10571 this happens, something tricky is going on, and we just
10572 don't optimize accesses to this MEM. */
10573 loop_info->mems[i].optimize = 0;
10575 return 0;
10578 /* Resize the array, if necessary. */
10579 if (loop_info->mems_idx == loop_info->mems_allocated)
10581 if (loop_info->mems_allocated != 0)
10582 loop_info->mems_allocated *= 2;
10583 else
10584 loop_info->mems_allocated = 32;
10586 loop_info->mems = xrealloc (loop_info->mems,
10587 loop_info->mems_allocated * sizeof (loop_mem_info));
10590 /* Actually insert the MEM. */
10591 loop_info->mems[loop_info->mems_idx].mem = m;
10592 /* We can't hoist this MEM out of the loop if it's a BLKmode MEM
10593 because we can't put it in a register. We still store it in the
10594 table, though, so that if we see the same address later, but in a
10595 non-BLK mode, we'll not think we can optimize it at that point. */
10596 loop_info->mems[loop_info->mems_idx].optimize = (GET_MODE (m) != BLKmode);
10597 loop_info->mems[loop_info->mems_idx].reg = NULL_RTX;
10598 ++loop_info->mems_idx;
10600 return 0;
10604 /* Allocate REGS->ARRAY or reallocate it if it is too small.
10606 Increment REGS->ARRAY[I].SET_IN_LOOP at the index I of each
10607 register that is modified by an insn between FROM and TO. If the
10608 value of an element of REGS->array[I].SET_IN_LOOP becomes 127 or
10609 more, stop incrementing it, to avoid overflow.
10611 Store in REGS->ARRAY[I].SINGLE_USAGE the single insn in which
10612 register I is used, if it is only used once. Otherwise, it is set
10613 to 0 (for no uses) or const0_rtx for more than one use. This
10614 parameter may be zero, in which case this processing is not done.
10616 Set REGS->ARRAY[I].MAY_NOT_OPTIMIZE nonzero if we should not
10617 optimize register I. */
10619 static void
10620 loop_regs_scan (const struct loop *loop, int extra_size)
10622 struct loop_regs *regs = LOOP_REGS (loop);
10623 int old_nregs;
10624 /* last_set[n] is nonzero iff reg n has been set in the current
10625 basic block. In that case, it is the insn that last set reg n. */
10626 rtx *last_set;
10627 rtx insn;
10628 int i;
10630 old_nregs = regs->num;
10631 regs->num = max_reg_num ();
10633 /* Grow the regs array if not allocated or too small. */
10634 if (regs->num >= regs->size)
10636 regs->size = regs->num + extra_size;
10638 regs->array = xrealloc (regs->array, regs->size * sizeof (*regs->array));
10640 /* Zero the new elements. */
10641 memset (regs->array + old_nregs, 0,
10642 (regs->size - old_nregs) * sizeof (*regs->array));
10645 /* Clear previously scanned fields but do not clear n_times_set. */
10646 for (i = 0; i < old_nregs; i++)
10648 regs->array[i].set_in_loop = 0;
10649 regs->array[i].may_not_optimize = 0;
10650 regs->array[i].single_usage = NULL_RTX;
10653 last_set = xcalloc (regs->num, sizeof (rtx));
10655 /* Scan the loop, recording register usage. */
10656 for (insn = loop->top ? loop->top : loop->start; insn != loop->end;
10657 insn = NEXT_INSN (insn))
10659 if (INSN_P (insn))
10661 /* Record registers that have exactly one use. */
10662 find_single_use_in_loop (regs, insn, PATTERN (insn));
10664 /* Include uses in REG_EQUAL notes. */
10665 if (REG_NOTES (insn))
10666 find_single_use_in_loop (regs, insn, REG_NOTES (insn));
10668 if (GET_CODE (PATTERN (insn)) == SET
10669 || GET_CODE (PATTERN (insn)) == CLOBBER)
10670 count_one_set (regs, insn, PATTERN (insn), last_set);
10671 else if (GET_CODE (PATTERN (insn)) == PARALLEL)
10673 int i;
10674 for (i = XVECLEN (PATTERN (insn), 0) - 1; i >= 0; i--)
10675 count_one_set (regs, insn, XVECEXP (PATTERN (insn), 0, i),
10676 last_set);
10680 if (LABEL_P (insn) || JUMP_P (insn))
10681 memset (last_set, 0, regs->num * sizeof (rtx));
10683 /* Invalidate all registers used for function argument passing.
10684 We check rtx_varies_p for the same reason as below, to allow
10685 optimizing PIC calculations. */
10686 if (CALL_P (insn))
10688 rtx link;
10689 for (link = CALL_INSN_FUNCTION_USAGE (insn);
10690 link;
10691 link = XEXP (link, 1))
10693 rtx op, reg;
10695 if (GET_CODE (op = XEXP (link, 0)) == USE
10696 && REG_P (reg = XEXP (op, 0))
10697 && rtx_varies_p (reg, 1))
10698 regs->array[REGNO (reg)].may_not_optimize = 1;
10703 /* Invalidate all hard registers clobbered by calls. With one exception:
10704 a call-clobbered PIC register is still function-invariant for our
10705 purposes, since we can hoist any PIC calculations out of the loop.
10706 Thus the call to rtx_varies_p. */
10707 if (LOOP_INFO (loop)->has_call)
10708 for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
10709 if (TEST_HARD_REG_BIT (regs_invalidated_by_call, i)
10710 && rtx_varies_p (regno_reg_rtx[i], 1))
10712 regs->array[i].may_not_optimize = 1;
10713 regs->array[i].set_in_loop = 1;
10716 #ifdef AVOID_CCMODE_COPIES
10717 /* Don't try to move insns which set CC registers if we should not
10718 create CCmode register copies. */
10719 for (i = regs->num - 1; i >= FIRST_PSEUDO_REGISTER; i--)
10720 if (GET_MODE_CLASS (GET_MODE (regno_reg_rtx[i])) == MODE_CC)
10721 regs->array[i].may_not_optimize = 1;
10722 #endif
10724 /* Set regs->array[I].n_times_set for the new registers. */
10725 for (i = old_nregs; i < regs->num; i++)
10726 regs->array[i].n_times_set = regs->array[i].set_in_loop;
10728 free (last_set);
10731 /* Returns the number of real INSNs in the LOOP. */
10733 static int
10734 count_insns_in_loop (const struct loop *loop)
10736 int count = 0;
10737 rtx insn;
10739 for (insn = loop->top ? loop->top : loop->start; insn != loop->end;
10740 insn = NEXT_INSN (insn))
10741 if (INSN_P (insn))
10742 ++count;
10744 return count;
10747 /* Move MEMs into registers for the duration of the loop. */
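/* Source-level sketch (illustrative): for a loop-invariant address p,

	while (c)
	  {
	    ... *p ...;
	    *p = v;
	  }

   in effect becomes

	reg = *p;
	while (c)
	  {
	    ... reg ...;
	    reg = v;
	  }
	*p = reg;

   where the store back through p after the loop is emitted only when
   the MEM is actually written inside the loop.  */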
10749 static void
10750 load_mems (const struct loop *loop)
10752 struct loop_info *loop_info = LOOP_INFO (loop);
10753 struct loop_regs *regs = LOOP_REGS (loop);
10754 int maybe_never = 0;
10755 int i;
10756 rtx p, prev_ebb_head;
10757 rtx label = NULL_RTX;
10758 rtx end_label;
10759 /* Nonzero if the next instruction may never be executed. */
10760 int next_maybe_never = 0;
10761 unsigned int last_max_reg = max_reg_num ();
10763 if (loop_info->mems_idx == 0)
10764 return;
10766 /* We cannot use next_label here because it skips over normal insns. */
10767 end_label = next_nonnote_insn (loop->end);
10768 if (end_label && !LABEL_P (end_label))
10769 end_label = NULL_RTX;
10771 /* Check to see if it's possible that some instructions in the loop are
10772 never executed. Also check if there is a goto out of the loop other
10773 than right after the end of the loop. */
10774 for (p = next_insn_in_loop (loop, loop->scan_start);
10775 p != NULL_RTX;
10776 p = next_insn_in_loop (loop, p))
10778 if (LABEL_P (p))
10779 maybe_never = 1;
10780 else if (JUMP_P (p)
10781 /* If we enter the loop in the middle, and scan
10782 around to the beginning, don't set maybe_never
10783 for that. This must be an unconditional jump,
10784 otherwise the code at the top of the loop might
10785 never be executed. Unconditional jumps are
10786 followed by a barrier and then the loop end. */
10787 && ! (JUMP_P (p)
10788 && JUMP_LABEL (p) == loop->top
10789 && NEXT_INSN (NEXT_INSN (p)) == loop->end
10790 && any_uncondjump_p (p)))
10792 /* If this is a jump outside of the loop but not right
10793 after the end of the loop, we would have to emit new fixup
10794 sequences for each such label. */
10795 if (/* If we can't tell where control might go when this
10796 JUMP_INSN is executed, we must be conservative. */
10797 !JUMP_LABEL (p)
10798 || (JUMP_LABEL (p) != end_label
10799 && (INSN_UID (JUMP_LABEL (p)) >= max_uid_for_loop
10800 || INSN_LUID (JUMP_LABEL (p)) < INSN_LUID (loop->start)
10801 || INSN_LUID (JUMP_LABEL (p)) > INSN_LUID (loop->end))))
10802 return;
10804 if (!any_condjump_p (p))
10805 /* Something complicated. */
10806 maybe_never = 1;
10807 else
10808 /* If there are any more instructions in the loop, they
10809 might not be reached. */
10810 next_maybe_never = 1;
10812 else if (next_maybe_never)
10813 maybe_never = 1;
10816 /* Find start of the extended basic block that enters the loop. */
10817 for (p = loop->start;
10818 PREV_INSN (p) && !LABEL_P (p);
10819 p = PREV_INSN (p))
10821 prev_ebb_head = p;
10823 cselib_init (true);
10825 /* Build table of mems that get set to constant values before the
10826 loop. */
10827 for (; p != loop->start; p = NEXT_INSN (p))
10828 cselib_process_insn (p);
10830 /* Actually move the MEMs. */
10831 for (i = 0; i < loop_info->mems_idx; ++i)
10833 regset_head load_copies;
10834 regset_head store_copies;
10835 int written = 0;
10836 rtx reg;
10837 rtx mem = loop_info->mems[i].mem;
10838 rtx mem_list_entry;
10840 if (MEM_VOLATILE_P (mem)
10841 || loop_invariant_p (loop, XEXP (mem, 0)) != 1)
10842 /* There's no telling whether or not MEM is modified. */
10843 loop_info->mems[i].optimize = 0;
10845 /* Go through the MEMs written to in the loop to see if this
10846 one is aliased by one of them. */
10847 mem_list_entry = loop_info->store_mems;
10848 while (mem_list_entry)
10850 if (rtx_equal_p (mem, XEXP (mem_list_entry, 0)))
10851 written = 1;
10852 else if (true_dependence (XEXP (mem_list_entry, 0), VOIDmode,
10853 mem, rtx_varies_p))
10855 /* MEM is indeed aliased by this store. */
10856 loop_info->mems[i].optimize = 0;
10857 break;
10859 mem_list_entry = XEXP (mem_list_entry, 1);
10862 if (flag_float_store && written
10863 && GET_MODE_CLASS (GET_MODE (mem)) == MODE_FLOAT)
10864 loop_info->mems[i].optimize = 0;
10866 /* If this MEM is written to, we must be sure that there
10867 are no reads from another MEM that aliases this one. */
10868 if (loop_info->mems[i].optimize && written)
10870 int j;
10872 for (j = 0; j < loop_info->mems_idx; ++j)
10874 if (j == i)
10875 continue;
10876 else if (true_dependence (mem,
10877 VOIDmode,
10878 loop_info->mems[j].mem,
10879 rtx_varies_p))
10881 /* It's not safe to hoist loop_info->mems[i] out of
10882 the loop because writes to it might not be
10883 seen by reads from loop_info->mems[j]. */
10884 loop_info->mems[i].optimize = 0;
10885 break;
10890 if (maybe_never && may_trap_p (mem))
10891 /* We can't access the MEM outside the loop; it might
10892 cause a trap that wouldn't have happened otherwise. */
10893 loop_info->mems[i].optimize = 0;
10895 if (!loop_info->mems[i].optimize)
10896 /* We thought we were going to lift this MEM out of the
10897 loop, but later discovered that we could not. */
10898 continue;
      INIT_REG_SET (&load_copies);
      INIT_REG_SET (&store_copies);

      /* Allocate a pseudo for this MEM.  We set REG_USERVAR_P in
         order to keep scan_loop from moving stores to this MEM
         out of the loop just because this REG is neither a
         user-variable nor used in the loop test.  */
      reg = gen_reg_rtx (GET_MODE (mem));
      REG_USERVAR_P (reg) = 1;
      loop_info->mems[i].reg = reg;

      /* Now, replace all references to the MEM with the
         corresponding pseudos.  */
      maybe_never = 0;
      for (p = next_insn_in_loop (loop, loop->scan_start);
           p != NULL_RTX;
           p = next_insn_in_loop (loop, p))
        {
          if (INSN_P (p))
            {
              rtx set;

              set = single_set (p);

              /* See if this copies the mem into a register that isn't
                 modified afterwards.  We'll try to do copy propagation
                 a little further on.  */
              if (set
                  /* @@@ This test is _way_ too conservative.  */
                  && ! maybe_never
                  && REG_P (SET_DEST (set))
                  && REGNO (SET_DEST (set)) >= FIRST_PSEUDO_REGISTER
                  && REGNO (SET_DEST (set)) < last_max_reg
                  && regs->array[REGNO (SET_DEST (set))].n_times_set == 1
                  && rtx_equal_p (SET_SRC (set), mem))
                SET_REGNO_REG_SET (&load_copies, REGNO (SET_DEST (set)));

              /* See if this copies the mem from a register that isn't
                 modified afterwards.  We'll try to remove the
                 redundant copy later on by doing a little register
                 renaming and copy propagation.  This will help
                 to untangle things for the BIV detection code.  */
              if (set
                  && ! maybe_never
                  && REG_P (SET_SRC (set))
                  && REGNO (SET_SRC (set)) >= FIRST_PSEUDO_REGISTER
                  && REGNO (SET_SRC (set)) < last_max_reg
                  && regs->array[REGNO (SET_SRC (set))].n_times_set == 1
                  && rtx_equal_p (SET_DEST (set), mem))
                SET_REGNO_REG_SET (&store_copies, REGNO (SET_SRC (set)));

              /* If this is a call which uses / clobbers this memory
                 location, we must not change the interface here.  */
              if (CALL_P (p)
                  && reg_mentioned_p (loop_info->mems[i].mem,
                                      CALL_INSN_FUNCTION_USAGE (p)))
                {
                  cancel_changes (0);
                  loop_info->mems[i].optimize = 0;
                  break;
                }
              else
                /* Replace the memory reference with the shadow register.  */
                replace_loop_mems (p, loop_info->mems[i].mem,
                                   loop_info->mems[i].reg, written);
            }

          if (LABEL_P (p)
              || JUMP_P (p))
            maybe_never = 1;
        }

      if (! loop_info->mems[i].optimize)
        ; /* We found we couldn't do the replacement, so do nothing.  */
      else if (! apply_change_group ())
        /* We couldn't replace all occurrences of the MEM.  */
        loop_info->mems[i].optimize = 0;
      else
        {
          /* Load the memory immediately before LOOP->START, which is
             the NOTE_LOOP_BEG.  */
          cselib_val *e = cselib_lookup (mem, VOIDmode, 0);
          rtx set;
          rtx best = mem;
          unsigned j;
          struct elt_loc_list *const_equiv = 0;
          reg_set_iterator rsi;

          if (e)
            {
              struct elt_loc_list *equiv;
              struct elt_loc_list *best_equiv = 0;
              for (equiv = e->locs; equiv; equiv = equiv->next)
                {
                  if (CONSTANT_P (equiv->loc))
                    const_equiv = equiv;
                  else if (REG_P (equiv->loc)
                           /* Extending hard register lifetimes causes a
                              crash on SRC targets.  Doing so on non-SRC
                              targets is probably not a good idea either,
                              since we most probably have a pseudo-register
                              equivalence as well.  */
                           && REGNO (equiv->loc) >= FIRST_PSEUDO_REGISTER)
                    best_equiv = equiv;
                }

              /* Use the constant equivalence if that is cheap enough.  */
              if (! best_equiv)
                best_equiv = const_equiv;
              else if (const_equiv
                       && (rtx_cost (const_equiv->loc, SET)
                           <= rtx_cost (best_equiv->loc, SET)))
                {
                  best_equiv = const_equiv;
                  const_equiv = 0;
                }

              /* If best_equiv is nonzero, we know that MEM is set to a
                 constant or register before the loop.  We will use this
                 knowledge to initialize the shadow register with that
                 constant or reg rather than by loading from MEM.  */
              if (best_equiv)
                best = copy_rtx (best_equiv->loc);
            }

          set = gen_move_insn (reg, best);
          set = loop_insn_hoist (loop, set);
          if (REG_P (best))
            {
              for (p = prev_ebb_head; p != loop->start; p = NEXT_INSN (p))
                if (REGNO_LAST_UID (REGNO (best)) == INSN_UID (p))
                  {
                    REGNO_LAST_UID (REGNO (best)) = INSN_UID (set);
                    break;
                  }
            }

          if (const_equiv)
            set_unique_reg_note (set, REG_EQUAL, copy_rtx (const_equiv->loc));

          if (written)
            {
              if (label == NULL_RTX)
                {
                  label = gen_label_rtx ();
                  emit_label_after (label, loop->end);
                }

              /* Store the memory immediately after END, which is
                 the NOTE_LOOP_END.  */
              set = gen_move_insn (copy_rtx (mem), reg);
              loop_insn_emit_after (loop, 0, label, set);
            }

          if (loop_dump_stream)
            {
              fprintf (loop_dump_stream, "Hoisted regno %d %s from ",
                       REGNO (reg), (written ? "r/w" : "r/o"));
              print_rtl (loop_dump_stream, mem);
              fputc ('\n', loop_dump_stream);
            }

          /* Attempt a bit of copy propagation.  This helps untangle the
             data flow, and enables {basic,general}_induction_var to find
             more bivs/givs.  */
          EXECUTE_IF_SET_IN_REG_SET
            (&load_copies, FIRST_PSEUDO_REGISTER, j, rsi)
            {
              try_copy_prop (loop, reg, j);
            }
          CLEAR_REG_SET (&load_copies);

          EXECUTE_IF_SET_IN_REG_SET
            (&store_copies, FIRST_PSEUDO_REGISTER, j, rsi)
            {
              try_swap_copy_prop (loop, reg, j);
            }
          CLEAR_REG_SET (&store_copies);
        }
    }

  /* Now, we need to replace all references to the previous exit
     label with the new one.  */
  if (label != NULL_RTX && end_label != NULL_RTX)
    for (p = loop->start; p != loop->end; p = NEXT_INSN (p))
      if (JUMP_P (p) && JUMP_LABEL (p) == end_label)
        redirect_jump (p, label, false);

  cselib_finish ();
}

/* For communication between note_reg_stored and its caller.  */
struct note_reg_stored_arg
{
  int set_seen;
  rtx reg;
};

/* Called via note_stores; record in the SET_SEEN field of ARG whether X,
   which is written to, is equal to the REG field of ARG.  */
static void
note_reg_stored (rtx x, rtx setter ATTRIBUTE_UNUSED, void *arg)
{
  struct note_reg_stored_arg *t = (struct note_reg_stored_arg *) arg;
  if (t->reg == x)
    t->set_seen = 1;
}

/* Try to replace every occurrence of pseudo REGNO with REPLACEMENT.
   There must be exactly one insn that sets this pseudo; it will be
   deleted if all replacements succeed and we can prove that the register
   is not used after the loop.  */

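/* For illustration (the register numbers here are invented, not taken
   from a real dump): if (reg 350) is the shadow register created by
   load_mems and the loop body contains

        (set (reg 200) (reg 350))        <- the initializing insn
        (set (reg 201) (plus (reg 200) (const_int 1)))

   then try_copy_prop (loop, shadow, 200), with SHADOW being (reg 350),
   rewrites the second insn to use (reg 350) directly.  Once every use
   of reg 200 has been replaced and reg 200 is provably unused after
   the loop, the initializing insn itself is deleted.  */
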
static void
try_copy_prop (const struct loop *loop, rtx replacement, unsigned int regno)
{
  /* This is the reg that we are copying from.  */
  rtx reg_rtx = regno_reg_rtx[regno];
  rtx init_insn = 0;
  rtx insn;
  /* These help keep track of whether we replaced all uses of the reg.  */
  int replaced_last = 0;
  int store_is_first = 0;

  for (insn = next_insn_in_loop (loop, loop->scan_start);
       insn != NULL_RTX;
       insn = next_insn_in_loop (loop, insn))
    {
      rtx set;

      /* Only substitute within one extended basic block from the
         initializing insn.  */
      if (LABEL_P (insn) && init_insn)
        break;

      if (! INSN_P (insn))
        continue;

      /* Is this the initializing insn?  */
      set = single_set (insn);
      if (set
          && REG_P (SET_DEST (set))
          && REGNO (SET_DEST (set)) == regno)
        {
          gcc_assert (!init_insn);

          init_insn = insn;
          if (REGNO_FIRST_UID (regno) == INSN_UID (insn))
            store_is_first = 1;
        }

      /* Only substitute after seeing the initializing insn.  */
      if (init_insn && insn != init_insn)
        {
          struct note_reg_stored_arg arg;

          replace_loop_regs (insn, reg_rtx, replacement);
          if (REGNO_LAST_UID (regno) == INSN_UID (insn))
            replaced_last = 1;

          /* Stop replacing when REPLACEMENT is modified.  */
          arg.reg = replacement;
          arg.set_seen = 0;
          note_stores (PATTERN (insn), note_reg_stored, &arg);
          if (arg.set_seen)
            {
              rtx note = find_reg_note (insn, REG_EQUAL, NULL);

              /* It is possible that we've turned a previously valid
                 REG_EQUAL note into an invalid one: we have changed
                 REGNO to REPLACEMENT here, and since REPLACEMENT,
                 unlike REGNO, is modified after this insn, the note
                 no longer describes the value it did before.  */
              if (note && reg_mentioned_p (replacement, XEXP (note, 0)))
                remove_note (insn, note);
              break;
            }
        }
    }

  gcc_assert (init_insn);
  if (apply_change_group ())
    {
      if (loop_dump_stream)
        fprintf (loop_dump_stream, "  Replaced reg %d", regno);
      if (store_is_first && replaced_last)
        {
          rtx first;
          rtx retval_note;

          /* Assume we're just deleting INIT_INSN.  */
          first = init_insn;
          /* Look for REG_RETVAL note.  If we're deleting the end of
             the libcall sequence, the whole sequence can go.  */
          retval_note = find_reg_note (init_insn, REG_RETVAL, NULL_RTX);
          /* If we found a REG_RETVAL note, find the first instruction
             in the sequence.  */
          if (retval_note)
            first = XEXP (retval_note, 0);

          /* Delete the instructions.  */
          loop_delete_insns (first, init_insn);
        }
      if (loop_dump_stream)
        fprintf (loop_dump_stream, ".\n");
    }
}

/* Replace all the instructions from FIRST up to and including LAST
   with NOTE_INSN_DELETED notes.  */

static void
loop_delete_insns (rtx first, rtx last)
{
  while (1)
    {
      if (loop_dump_stream)
        fprintf (loop_dump_stream, ", deleting init_insn (%d)",
                 INSN_UID (first));
      delete_insn (first);

      /* If this was the LAST instruction we're supposed to delete,
         we're done.  */
      if (first == last)
        break;

      first = NEXT_INSN (first);
    }
}

/* Try to replace occurrences of pseudo REGNO with REPLACEMENT within
   loop LOOP if the order of the sets of these registers can be
   swapped.  There must be exactly one insn within the loop that sets
   this pseudo, followed immediately by a move insn that copies REGNO
   into REPLACEMENT.  */

static void
try_swap_copy_prop (const struct loop *loop, rtx replacement,
                    unsigned int regno)
{
  rtx insn;
  rtx set = NULL_RTX;
  unsigned int new_regno;

  new_regno = REGNO (replacement);

  for (insn = next_insn_in_loop (loop, loop->scan_start);
       insn != NULL_RTX;
       insn = next_insn_in_loop (loop, insn))
    {
      /* Search for the insn that copies REGNO to NEW_REGNO.  */
      if (INSN_P (insn)
          && (set = single_set (insn))
          && REG_P (SET_DEST (set))
          && REGNO (SET_DEST (set)) == new_regno
          && REG_P (SET_SRC (set))
          && REGNO (SET_SRC (set)) == regno)
        break;
    }

  if (insn != NULL_RTX)
    {
      rtx prev_insn;
      rtx prev_set;

      /* Some DEF-USE info would come in handy here to make this
         function more general.  For now, just check the previous insn
         which is the most likely candidate for setting REGNO.  */

      prev_insn = PREV_INSN (insn);

      if (INSN_P (prev_insn)
          && (prev_set = single_set (prev_insn))
          && REG_P (SET_DEST (prev_set))
          && REGNO (SET_DEST (prev_set)) == regno)
        {
          /* We have:
             (set (reg regno) (expr))
             (set (reg new_regno) (reg regno))

             so try converting this to:
             (set (reg new_regno) (expr))
             (set (reg regno) (reg new_regno))

             The former construct is often generated when a global
             variable used for an induction variable is shadowed by a
             register (NEW_REGNO).  The latter construct improves the
             chances of GIV replacement and BIV elimination.  */

          validate_change (prev_insn, &SET_DEST (prev_set),
                           replacement, 1);
          validate_change (insn, &SET_DEST (set),
                           SET_SRC (set), 1);
          validate_change (insn, &SET_SRC (set),
                           replacement, 1);

          if (apply_change_group ())
            {
              if (loop_dump_stream)
                fprintf (loop_dump_stream,
                         "  Swapped set of reg %d at %d with reg %d at %d.\n",
                         regno, INSN_UID (insn),
                         new_regno, INSN_UID (prev_insn));

              /* Update first use of REGNO.  */
              if (REGNO_FIRST_UID (regno) == INSN_UID (prev_insn))
                REGNO_FIRST_UID (regno) = INSN_UID (insn);

              /* Now perform copy propagation to hopefully
                 remove all uses of REGNO within the loop.  */
              try_copy_prop (loop, replacement, regno);
            }
        }
    }
}

/* Worker function for find_mem_in_note, called via for_each_rtx.  */

static int
find_mem_in_note_1 (rtx *x, void *data)
{
  if (*x != NULL_RTX && MEM_P (*x))
    {
      rtx *res = (rtx *) data;
      *res = *x;
      return 1;
    }
  return 0;
}

/* Returns the first MEM found in NOTE by depth-first search.  */

static rtx
find_mem_in_note (rtx note)
{
  if (note && for_each_rtx (&note, find_mem_in_note_1, &note))
    return note;
  return NULL_RTX;
}

/* Replace MEM with its associated pseudo register.  This function is
   called from load_mems via for_each_rtx.  DATA is actually a pointer
   to a structure describing the instruction currently being scanned
   and the MEM we are currently replacing.  */

static int
replace_loop_mem (rtx *mem, void *data)
{
  loop_replace_args *args = (loop_replace_args *) data;
  rtx m = *mem;

  if (m == NULL_RTX)
    return 0;

  switch (GET_CODE (m))
    {
    case MEM:
      break;

    case CONST_DOUBLE:
      /* We're not interested in the MEM associated with a
         CONST_DOUBLE, so there's no need to traverse into one.  */
      return -1;

    default:
      /* This is not a MEM.  */
      return 0;
    }

  if (!rtx_equal_p (args->match, m))
    /* This is not the MEM we are currently replacing.  */
    return 0;

  /* Actually replace the MEM.  */
  validate_change (args->insn, mem, args->replacement, 1);

  return 0;
}

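/* Replace every occurrence of MEM within INSN with the pseudo REG,
   queuing the changes with validate_change.  If WRITTEN, the MEM is
   also stored to within the loop, so REG_EQUAL notes on INSN that
   refer to a MEM it aliases are removed: hoisting the store would
   make them invalid.  */
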
static void
replace_loop_mems (rtx insn, rtx mem, rtx reg, int written)
{
  loop_replace_args args;

  args.insn = insn;
  args.match = mem;
  args.replacement = reg;

  for_each_rtx (&insn, replace_loop_mem, &args);

  /* If we hoist a mem write out of the loop, then REG_EQUAL
     notes referring to the mem are no longer valid.  */
  if (written)
    {
      rtx note, sub;
      rtx *link;

      for (link = &REG_NOTES (insn); (note = *link); link = &XEXP (note, 1))
        {
          if (REG_NOTE_KIND (note) == REG_EQUAL
              && (sub = find_mem_in_note (note))
              && true_dependence (mem, VOIDmode, sub, rtx_varies_p))
            {
              /* Remove the note.  */
              validate_change (NULL_RTX, link, XEXP (note, 1), 1);
              break;
            }
        }
    }
}

/* Replace one register with another.  Called through for_each_rtx; PX
   points to the rtx being scanned.  DATA is actually a pointer to a
   structure of arguments.  */

static int
replace_loop_reg (rtx *px, void *data)
{
  rtx x = *px;
  loop_replace_args *args = (loop_replace_args *) data;

  if (x == NULL_RTX)
    return 0;

  if (x == args->match)
    validate_change (args->insn, px, args->replacement, 1);

  return 0;
}

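/* Replace every occurrence of REG within INSN with REPLACEMENT,
   queuing the changes with validate_change so that the caller can
   commit or cancel them as a group via apply_change_group.  */
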
static void
replace_loop_regs (rtx insn, rtx reg, rtx replacement)
{
  loop_replace_args args;

  args.insn = insn;
  args.match = reg;
  args.replacement = replacement;

  for_each_rtx (&insn, replace_loop_reg, &args);
}

/* Emit insn for PATTERN after WHERE_INSN in basic block WHERE_BB
   (ignored in the interim).  */

static rtx
loop_insn_emit_after (const struct loop *loop ATTRIBUTE_UNUSED,
                      basic_block where_bb ATTRIBUTE_UNUSED, rtx where_insn,
                      rtx pattern)
{
  return emit_insn_after (pattern, where_insn);
}

/* If WHERE_INSN is nonzero, emit insn for PATTERN before WHERE_INSN
   in basic block WHERE_BB (ignored in the interim) within the loop;
   otherwise hoist PATTERN into the loop pre-header.  */

static rtx
loop_insn_emit_before (const struct loop *loop,
                       basic_block where_bb ATTRIBUTE_UNUSED,
                       rtx where_insn, rtx pattern)
{
  if (! where_insn)
    return loop_insn_hoist (loop, pattern);
  return emit_insn_before (pattern, where_insn);
}

/* Emit call insn for PATTERN before WHERE_INSN in basic block
   WHERE_BB (ignored in the interim) within the loop.  */

static rtx
loop_call_insn_emit_before (const struct loop *loop ATTRIBUTE_UNUSED,
                            basic_block where_bb ATTRIBUTE_UNUSED,
                            rtx where_insn, rtx pattern)
{
  return emit_call_insn_before (pattern, where_insn);
}

/* Hoist insn for PATTERN into the loop pre-header.  */

static rtx
loop_insn_hoist (const struct loop *loop, rtx pattern)
{
  return loop_insn_emit_before (loop, 0, loop->start, pattern);
}

/* Hoist call insn for PATTERN into the loop pre-header.  */

static rtx
loop_call_insn_hoist (const struct loop *loop, rtx pattern)
{
  return loop_call_insn_emit_before (loop, 0, loop->start, pattern);
}

/* Sink insn for PATTERN after the loop end.  */

static rtx
loop_insn_sink (const struct loop *loop, rtx pattern)
{
  return loop_insn_emit_before (loop, 0, loop->sink, pattern);
}

/* bl->final_value can be either a general_operand or a PLUS of a
   general_operand and a constant.  Emit a sequence of instructions to
   load it into REG.  */

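/* For example (an invented value, purely illustrative): a final value
   such as (plus (reg 100) (const_int 8)) is not a valid move source on
   most targets, so force_operand below emits the addition as one or
   more separate insns and returns the register holding the result.  */
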
static rtx
gen_load_of_final_value (rtx reg, rtx final_value)
{
  rtx seq;

  start_sequence ();
  final_value = force_operand (final_value, reg);
  if (final_value != reg)
    emit_move_insn (reg, final_value);
  seq = get_insns ();
  end_sequence ();
  return seq;
}

/* If the loop has multiple exits, emit insn for PATTERN before the
   loop to ensure that it will always be executed no matter how the
   loop exits.  Otherwise, emit the insn for PATTERN after the loop,
   since this is slightly more efficient.  */

static rtx
loop_insn_sink_or_swim (const struct loop *loop, rtx pattern)
{
  if (loop->exit_count)
    return loop_insn_hoist (loop, pattern);
  else
    return loop_insn_sink (loop, pattern);
}

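/* Dump the induction variable information for LOOP to FILE.  */
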
static void
loop_ivs_dump (const struct loop *loop, FILE *file, int verbose)
{
  struct iv_class *bl;
  int iv_num = 0;

  if (! loop || ! file)
    return;

  for (bl = LOOP_IVS (loop)->list; bl; bl = bl->next)
    iv_num++;

  fprintf (file, "Loop %d: %d IV classes\n", loop->num, iv_num);

  for (bl = LOOP_IVS (loop)->list; bl; bl = bl->next)
    {
      loop_iv_class_dump (bl, file, verbose);
      fputc ('\n', file);
    }
}

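/* Dump information about the IV class BL to FILE.  */
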
static void
loop_iv_class_dump (const struct iv_class *bl, FILE *file,
                    int verbose ATTRIBUTE_UNUSED)
{
  struct induction *v;
  rtx incr;
  int i;

  if (! bl || ! file)
    return;

  fprintf (file, "IV class for reg %d, benefit %d\n",
           bl->regno, bl->total_benefit);

  fprintf (file, " Init insn %d", INSN_UID (bl->init_insn));
  if (bl->initial_value)
    {
      fprintf (file, ", init val: ");
      print_simple_rtl (file, bl->initial_value);
    }
  if (bl->initial_test)
    {
      fprintf (file, ", init test: ");
      print_simple_rtl (file, bl->initial_test);
    }
  fputc ('\n', file);

  if (bl->final_value)
    {
      fprintf (file, " Final val: ");
      print_simple_rtl (file, bl->final_value);
      fputc ('\n', file);
    }

  if ((incr = biv_total_increment (bl)))
    {
      fprintf (file, " Total increment: ");
      print_simple_rtl (file, incr);
      fputc ('\n', file);
    }

  /* List the increments.  */
  for (i = 0, v = bl->biv; v; v = v->next_iv, i++)
    {
      fprintf (file, " Inc%d: insn %d, incr: ", i, INSN_UID (v->insn));
      print_simple_rtl (file, v->add_val);
      fputc ('\n', file);
    }

  /* List the givs.  */
  for (i = 0, v = bl->giv; v; v = v->next_iv, i++)
    {
      fprintf (file, " Giv%d: insn %d, benefit %d, ",
               i, INSN_UID (v->insn), v->benefit);
      if (v->giv_type == DEST_ADDR)
        print_simple_rtl (file, v->mem);
      else
        print_simple_rtl (file, single_set (v->insn));
      fputc ('\n', file);
    }
}

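/* Dump information about the biv V to FILE.  */
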
static void
loop_biv_dump (const struct induction *v, FILE *file, int verbose)
{
  if (! v || ! file)
    return;

  fprintf (file,
           "Biv %d: insn %d",
           REGNO (v->dest_reg), INSN_UID (v->insn));
  fprintf (file, " const ");
  print_simple_rtl (file, v->add_val);

  if (verbose && v->final_value)
    {
      fputc ('\n', file);
      fprintf (file, " final ");
      print_simple_rtl (file, v->final_value);
    }

  fputc ('\n', file);
}

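/* Dump information about the giv V to FILE.  */
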
static void
loop_giv_dump (const struct induction *v, FILE *file, int verbose)
{
  if (! v || ! file)
    return;

  if (v->giv_type == DEST_REG)
    fprintf (file, "Giv %d: insn %d",
             REGNO (v->dest_reg), INSN_UID (v->insn));
  else
    fprintf (file, "Dest address: insn %d",
             INSN_UID (v->insn));

  fprintf (file, " src reg %d benefit %d",
           REGNO (v->src_reg), v->benefit);
  fprintf (file, " lifetime %d",
           v->lifetime);

  if (v->replaceable)
    fprintf (file, " replaceable");

  if (v->no_const_addval)
    fprintf (file, " ncav");

  if (v->ext_dependent)
    switch (GET_CODE (v->ext_dependent))
      {
      case SIGN_EXTEND:
        fprintf (file, " ext se");
        break;
      case ZERO_EXTEND:
        fprintf (file, " ext ze");
        break;
      case TRUNCATE:
        fprintf (file, " ext tr");
        break;
      default:
        gcc_unreachable ();
      }

  fputc ('\n', file);
  fprintf (file, " mult ");
  print_simple_rtl (file, v->mult_val);

  fputc ('\n', file);
  fprintf (file, " add ");
  print_simple_rtl (file, v->add_val);

  if (verbose && v->final_value)
    {
      fputc ('\n', file);
      fprintf (file, " final ");
      print_simple_rtl (file, v->final_value);
    }

  fputc ('\n', file);
}

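/* Call this function from the debugger to dump the induction
   variables of LOOP.  */
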
void
debug_ivs (const struct loop *loop)
{
  loop_ivs_dump (loop, stderr, 1);
}

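/* Call this function from the debugger to dump the IV class BL.  */
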
void
debug_iv_class (const struct iv_class *bl)
{
  loop_iv_class_dump (bl, stderr, 1);
}

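/* Call this function from the debugger to dump the biv V.  */
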
void
debug_biv (const struct induction *v)
{
  loop_biv_dump (v, stderr, 1);
}

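/* Call this function from the debugger to dump the giv V.  */
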
void
debug_giv (const struct induction *v)
{
  loop_giv_dump (v, stderr, 1);
}

#define LOOP_BLOCK_NUM_1(INSN) \
((INSN) ? (BLOCK_FOR_INSN (INSN) ? BLOCK_NUM (INSN) : -1) : -1)

/* The notes do not have an assigned block, so look at the next insn.  */
#define LOOP_BLOCK_NUM(INSN) \
((INSN) ? (NOTE_P (INSN) \
           ? LOOP_BLOCK_NUM_1 (next_nonnote_insn (INSN)) \
           : LOOP_BLOCK_NUM_1 (INSN)) \
 : -1)

#define LOOP_INSN_UID(INSN) ((INSN) ? INSN_UID (INSN) : -1)

static void
loop_dump_aux (const struct loop *loop, FILE *file,
               int verbose ATTRIBUTE_UNUSED)
{
  rtx label;

  if (! loop || ! file || !BB_HEAD (loop->first))
    return;

  /* Print diagnostics to compare our concept of a loop with
     what the loop notes say.  */
  if (! PREV_INSN (BB_HEAD (loop->first))
      || !NOTE_P (PREV_INSN (BB_HEAD (loop->first)))
      || NOTE_LINE_NUMBER (PREV_INSN (BB_HEAD (loop->first)))
         != NOTE_INSN_LOOP_BEG)
    fprintf (file, ";;  No NOTE_INSN_LOOP_BEG at %d\n",
             INSN_UID (PREV_INSN (BB_HEAD (loop->first))));
  if (! NEXT_INSN (BB_END (loop->last))
      || !NOTE_P (NEXT_INSN (BB_END (loop->last)))
      || NOTE_LINE_NUMBER (NEXT_INSN (BB_END (loop->last)))
         != NOTE_INSN_LOOP_END)
    fprintf (file, ";;  No NOTE_INSN_LOOP_END at %d\n",
             INSN_UID (NEXT_INSN (BB_END (loop->last))));

  if (loop->start)
    {
      fprintf (file,
               ";;  start %d (%d), end %d (%d)\n",
               LOOP_BLOCK_NUM (loop->start),
               LOOP_INSN_UID (loop->start),
               LOOP_BLOCK_NUM (loop->end),
               LOOP_INSN_UID (loop->end));
      fprintf (file, ";;  top %d (%d), scan start %d (%d)\n",
               LOOP_BLOCK_NUM (loop->top),
               LOOP_INSN_UID (loop->top),
               LOOP_BLOCK_NUM (loop->scan_start),
               LOOP_INSN_UID (loop->scan_start));
      fprintf (file, ";;  exit_count %d", loop->exit_count);
      if (loop->exit_count)
        {
          fputs (", labels:", file);
          for (label = loop->exit_labels; label; label = LABEL_NEXTREF (label))
            fprintf (file, " %d ",
                     LOOP_INSN_UID (XEXP (label, 0)));
        }
      fputs ("\n", file);
    }
}

/* Call this function from the debugger to dump LOOP.  */

void
debug_loop (const struct loop *loop)
{
  flow_loop_dump (loop, stderr, loop_dump_aux, 1);
}

/* Call this function from the debugger to dump LOOPS.  */

void
debug_loops (const struct loops *loops)
{
  flow_loops_dump (loops, stderr, loop_dump_aux, 1);
}