[official-gcc.git] / gcc / loop.c
1 /* Perform various loop optimizations, including strength reduction.
2 Copyright (C) 1987, 1988, 1989, 1991, 1992, 1993, 1994, 1995, 1996, 1997,
3 1998, 1999, 2000, 2001, 2002 Free Software Foundation, Inc.
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 2, or (at your option) any later
10 version.
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
15 for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING. If not, write to the Free
19 Software Foundation, 59 Temple Place - Suite 330, Boston, MA
20 02111-1307, USA. */
22 /* This is the loop optimization pass of the compiler.
23 It finds invariant computations within loops and moves them
24 to the beginning of the loop. Then it identifies basic and
25 general induction variables. Strength reduction is applied to the general
26 induction variables, and induction variable elimination is applied to
27 the basic induction variables.
29 It also finds cases where
30 a register is set within the loop by zero-extending a narrower value
31 and changes these to zero the entire register once before the loop
32 and merely copy the low part within the loop.
34 Most of the complexity is in heuristics to decide when it is
35 worthwhile to do these things. */
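/* A minimal before/after sketch (illustrative only, not part of the
   original sources) of the transformations described above, applied to
   a simple source-level loop; `t' and `p' stand for the pseudo
   registers the pass would introduce. */
#if 0
/* Before loop optimization: `x * y' is loop-invariant and `i * 4' is a
   general induction variable based on the biv `i'.  */
for (i = 0; i < n; i++)
  a[i] = x * y + i * 4;

/* After: the invariant product is hoisted ahead of the loop, and the
   multiplication is strength-reduced to an addition on `p'.  */
t = x * y;
for (i = 0, p = 0; i < n; i++, p += 4)
  a[i] = t + p;
#endif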
37 #include "config.h"
38 #include "system.h"
39 #include "rtl.h"
40 #include "tm_p.h"
41 #include "obstack.h"
42 #include "function.h"
43 #include "expr.h"
44 #include "hard-reg-set.h"
45 #include "basic-block.h"
46 #include "insn-config.h"
47 #include "regs.h"
48 #include "recog.h"
49 #include "flags.h"
50 #include "real.h"
51 #include "loop.h"
52 #include "cselib.h"
53 #include "except.h"
54 #include "toplev.h"
55 #include "predict.h"
56 #include "insn-flags.h"
57 #include "optabs.h"
59 /* Not really meaningful values, but at least something. */
60 #ifndef SIMULTANEOUS_PREFETCHES
61 #define SIMULTANEOUS_PREFETCHES 3
62 #endif
63 #ifndef PREFETCH_BLOCK
64 #define PREFETCH_BLOCK 32
65 #endif
66 #ifndef HAVE_prefetch
67 #define HAVE_prefetch 0
68 #define CODE_FOR_prefetch 0
69 #define gen_prefetch(a,b,c) (abort(), NULL_RTX)
70 #endif
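/* Note that the fallback definitions above make an accidental use fail
   loudly: with HAVE_prefetch 0 the prefetch code is never reached, so
   gen_prefetch aborts if it is ever called.  */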
72 /* Give up the prefetch optimizations once we exceed a given threshold.
73 It is unlikely that we would be able to optimize something in a loop
74 with so many detected prefetches. */
75 #define MAX_PREFETCHES 100
76 /* The number of prefetch blocks that are beneficial to fetch at once before
77 a loop with a known (and low) iteration count. */
78 #define PREFETCH_BLOCKS_BEFORE_LOOP_MAX 6
79 /* For very tiny loops it is not worthwhile to prefetch even before the loop,
80 since it is likely that the data are already in the cache. */
81 #define PREFETCH_BLOCKS_BEFORE_LOOP_MIN 2
82 /* The minimum number of prefetch blocks that a loop must consume to make
83 emitting prefetch instructions in the loop body worthwhile. */
84 #define PREFETCH_BLOCKS_IN_LOOP_MIN 6
86 /* Parameterize some prefetch heuristics so they can be turned on and off
87 easily for performance testing on new architectures. These can be
88 defined in target-dependent files. */
90 /* Prefetch is worthwhile only when loads/stores are dense. */
91 #ifndef PREFETCH_ONLY_DENSE_MEM
92 #define PREFETCH_ONLY_DENSE_MEM 1
93 #endif
95 /* Define what we mean by "dense" loads and stores; this value divided by 256
96 is the minimum percentage of memory references that are worth prefetching. */
97 #ifndef PREFETCH_DENSE_MEM
98 #define PREFETCH_DENSE_MEM 220
99 #endif
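/* For example, the default of 220 corresponds to a density threshold of
   220/256, i.e. roughly 86%.  */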
101 /* Do not prefetch for a loop whose iteration count is known to be low. */
102 #ifndef PREFETCH_NO_LOW_LOOPCNT
103 #define PREFETCH_NO_LOW_LOOPCNT 1
104 #endif
106 /* Define what we mean by a "low" iteration count. */
107 #ifndef PREFETCH_LOW_LOOPCNT
108 #define PREFETCH_LOW_LOOPCNT 32
109 #endif
111 /* Do not prefetch for a loop that contains a function call; such a loop is
112 probably not an internal loop. */
113 #ifndef PREFETCH_NO_CALL
114 #define PREFETCH_NO_CALL 1
115 #endif
117 /* Do not prefetch accesses with an extreme stride. */
118 #ifndef PREFETCH_NO_EXTREME_STRIDE
119 #define PREFETCH_NO_EXTREME_STRIDE 1
120 #endif
122 /* Define what we mean by an "extreme" stride. */
123 #ifndef PREFETCH_EXTREME_STRIDE
124 #define PREFETCH_EXTREME_STRIDE 4096
125 #endif
127 /* Do not handle reversed order prefetches (negative stride). */
128 #ifndef PREFETCH_NO_REVERSE_ORDER
129 #define PREFETCH_NO_REVERSE_ORDER 1
130 #endif
132 /* Prefetch even if the GIV is not always executed. */
133 #ifndef PREFETCH_NOT_ALWAYS
134 #define PREFETCH_NOT_ALWAYS 0
135 #endif
137 /* If the loop requires more prefetches than the target can process in
138 parallel then don't prefetch anything in that loop. */
139 #ifndef PREFETCH_LIMIT_TO_SIMULTANEOUS
140 #define PREFETCH_LIMIT_TO_SIMULTANEOUS 1
141 #endif
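/* A hedged sketch of how these knobs gate prefetching (the real tests
   live in emit_prefetch_instructions later in this file; the shape
   below is simplified and the `give_up' label is hypothetical).  */
#if 0
if (PREFETCH_NO_CALL && loop_info->has_call)
  goto give_up;
if (PREFETCH_NO_LOW_LOOPCNT
    && loop_info->n_iterations
    && loop_info->n_iterations <= PREFETCH_LOW_LOOPCNT)
  goto give_up;
if (PREFETCH_NO_EXTREME_STRIDE && stride > PREFETCH_EXTREME_STRIDE)
  goto give_up;
#endif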
143 #define LOOP_REG_LIFETIME(LOOP, REGNO) \
144 ((REGNO_LAST_LUID (REGNO) - REGNO_FIRST_LUID (REGNO)))
146 #define LOOP_REG_GLOBAL_P(LOOP, REGNO) \
147 ((REGNO_LAST_LUID (REGNO) > INSN_LUID ((LOOP)->end) \
148 || REGNO_FIRST_LUID (REGNO) < INSN_LUID ((LOOP)->start)))
150 #define LOOP_REGNO_NREGS(REGNO, SET_DEST) \
151 ((REGNO) < FIRST_PSEUDO_REGISTER \
152 ? HARD_REGNO_NREGS ((REGNO), GET_MODE (SET_DEST)) : 1)
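/* For instance, if REGNO_FIRST_LUID (R) is 10 and REGNO_LAST_LUID (R)
   is 25, LOOP_REG_LIFETIME evaluates to 15; LOOP_REG_GLOBAL_P is
   nonzero when either luid falls outside those of the loop's START and
   END insns, i.e. when the register is also used outside the loop.  */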
155 /* Vector mapping INSN_UIDs to luids.
156 The luids are like uids but always increase monotonically.
157 We use them to see whether a jump comes from outside a given loop. */
159 int *uid_luid;
161 /* Indexed by INSN_UID, contains the ordinal giving the (innermost) loop
162 number the insn is contained in. */
164 struct loop **uid_loop;
166 /* 1 + largest uid of any insn. */
168 int max_uid_for_loop;
170 /* 1 + luid of last insn. */
172 static int max_luid;
174 /* Number of loops detected in current function. Used as index to the
175 next few tables. */
177 static int max_loop_num;
179 /* Bound on pseudo register number before loop optimization.
180 A pseudo has valid regscan info if its number is < max_reg_before_loop. */
181 unsigned int max_reg_before_loop;
183 /* The value to pass to the next call of reg_scan_update. */
184 static int loop_max_reg;
186 #define obstack_chunk_alloc xmalloc
187 #define obstack_chunk_free free
189 /* During the analysis of a loop, a chain of `struct movable's
190 is made to record all the movable insns found.
191 Then the entire chain can be scanned to decide which to move. */
193 struct movable
194 {
195 rtx insn; /* A movable insn */
196 rtx set_src; /* The expression this reg is set from. */
197 rtx set_dest; /* The destination of this SET. */
198 rtx dependencies; /* When INSN is libcall, this is an EXPR_LIST
199 of any registers used within the LIBCALL. */
200 int consec; /* Number of consecutive following insns
201 that must be moved with this one. */
202 unsigned int regno; /* The register it sets */
203 short lifetime; /* lifetime of that register;
204 may be adjusted when matching movables
205 that load the same value are found. */
206 short savings; /* Number of insns we can move for this reg,
207 including other movables that force this
208 or match this one. */
209 unsigned int cond : 1; /* 1 if only conditionally movable */
210 unsigned int force : 1; /* 1 means MUST move this insn */
211 unsigned int global : 1; /* 1 means reg is live outside this loop */
212 /* If PARTIAL is 1, GLOBAL means something different:
213 that the reg is live outside the range from where it is set
214 to the following label. */
215 unsigned int done : 1; /* 1 inhibits further processing of this */
217 unsigned int partial : 1; /* 1 means this reg is used for zero-extending.
218 In particular, moving it does not make it
219 invariant. */
220 unsigned int move_insn : 1; /* 1 means that we call emit_move_insn to
221 load SRC, rather than copying INSN. */
222 unsigned int move_insn_first:1;/* Same as above, if this is necessary for the
223 first insn of a consecutive sets group. */
224 unsigned int is_equiv : 1; /* 1 means a REG_EQUIV is present on INSN. */
225 enum machine_mode savemode; /* Nonzero means it is a mode for a low part
226 that we should avoid changing when clearing
227 the rest of the reg. */
228 struct movable *match; /* First entry for same value */
229 struct movable *forces; /* An insn that must be moved if this is */
230 struct movable *next;
231 };
234 FILE *loop_dump_stream;
236 /* Forward declarations. */
238 static void find_and_verify_loops PARAMS ((rtx, struct loops *));
239 static void mark_loop_jump PARAMS ((rtx, struct loop *));
240 static void prescan_loop PARAMS ((struct loop *));
241 static int reg_in_basic_block_p PARAMS ((rtx, rtx));
242 static int consec_sets_invariant_p PARAMS ((const struct loop *,
243 rtx, int, rtx));
244 static int labels_in_range_p PARAMS ((rtx, int));
245 static void count_one_set PARAMS ((struct loop_regs *, rtx, rtx, rtx *));
246 static void note_addr_stored PARAMS ((rtx, rtx, void *));
247 static void note_set_pseudo_multiple_uses PARAMS ((rtx, rtx, void *));
248 static int loop_reg_used_before_p PARAMS ((const struct loop *, rtx, rtx));
249 static void scan_loop PARAMS ((struct loop*, int));
250 #if 0
251 static void replace_call_address PARAMS ((rtx, rtx, rtx));
252 #endif
253 static rtx skip_consec_insns PARAMS ((rtx, int));
254 static int libcall_benefit PARAMS ((rtx));
255 static void ignore_some_movables PARAMS ((struct loop_movables *));
256 static void force_movables PARAMS ((struct loop_movables *));
257 static void combine_movables PARAMS ((struct loop_movables *,
258 struct loop_regs *));
259 static int num_unmoved_movables PARAMS ((const struct loop *));
260 static int regs_match_p PARAMS ((rtx, rtx, struct loop_movables *));
261 static int rtx_equal_for_loop_p PARAMS ((rtx, rtx, struct loop_movables *,
262 struct loop_regs *));
263 static void add_label_notes PARAMS ((rtx, rtx));
264 static void move_movables PARAMS ((struct loop *loop, struct loop_movables *,
265 int, int));
266 static void loop_movables_add PARAMS((struct loop_movables *,
267 struct movable *));
268 static void loop_movables_free PARAMS((struct loop_movables *));
269 static int count_nonfixed_reads PARAMS ((const struct loop *, rtx));
270 static void loop_bivs_find PARAMS((struct loop *));
271 static void loop_bivs_init_find PARAMS((struct loop *));
272 static void loop_bivs_check PARAMS((struct loop *));
273 static void loop_givs_find PARAMS((struct loop *));
274 static void loop_givs_check PARAMS((struct loop *));
275 static int loop_biv_eliminable_p PARAMS((struct loop *, struct iv_class *,
276 int, int));
277 static int loop_giv_reduce_benefit PARAMS((struct loop *, struct iv_class *,
278 struct induction *, rtx));
279 static void loop_givs_dead_check PARAMS((struct loop *, struct iv_class *));
280 static void loop_givs_reduce PARAMS((struct loop *, struct iv_class *));
281 static void loop_givs_rescan PARAMS((struct loop *, struct iv_class *,
282 rtx *));
283 static void loop_ivs_free PARAMS((struct loop *));
284 static void strength_reduce PARAMS ((struct loop *, int));
285 static void find_single_use_in_loop PARAMS ((struct loop_regs *, rtx, rtx));
286 static int valid_initial_value_p PARAMS ((rtx, rtx, int, rtx));
287 static void find_mem_givs PARAMS ((const struct loop *, rtx, rtx, int, int));
288 static void record_biv PARAMS ((struct loop *, struct induction *,
289 rtx, rtx, rtx, rtx, rtx *,
290 int, int));
291 static void check_final_value PARAMS ((const struct loop *,
292 struct induction *));
293 static void loop_ivs_dump PARAMS((const struct loop *, FILE *, int));
294 static void loop_iv_class_dump PARAMS((const struct iv_class *, FILE *, int));
295 static void loop_biv_dump PARAMS((const struct induction *, FILE *, int));
296 static void loop_giv_dump PARAMS((const struct induction *, FILE *, int));
297 static void record_giv PARAMS ((const struct loop *, struct induction *,
298 rtx, rtx, rtx, rtx, rtx, rtx, int,
299 enum g_types, int, int, rtx *));
300 static void update_giv_derive PARAMS ((const struct loop *, rtx));
301 static void check_ext_dependent_givs PARAMS ((struct iv_class *,
302 struct loop_info *));
303 static int basic_induction_var PARAMS ((const struct loop *, rtx,
304 enum machine_mode, rtx, rtx,
305 rtx *, rtx *, rtx **));
306 static rtx simplify_giv_expr PARAMS ((const struct loop *, rtx, rtx *, int *));
307 static int general_induction_var PARAMS ((const struct loop *loop, rtx, rtx *,
308 rtx *, rtx *, rtx *, int, int *,
309 enum machine_mode));
310 static int consec_sets_giv PARAMS ((const struct loop *, int, rtx,
311 rtx, rtx, rtx *, rtx *, rtx *, rtx *));
312 static int check_dbra_loop PARAMS ((struct loop *, int));
313 static rtx express_from_1 PARAMS ((rtx, rtx, rtx));
314 static rtx combine_givs_p PARAMS ((struct induction *, struct induction *));
315 static int cmp_combine_givs_stats PARAMS ((const PTR, const PTR));
316 static void combine_givs PARAMS ((struct loop_regs *, struct iv_class *));
317 static int product_cheap_p PARAMS ((rtx, rtx));
318 static int maybe_eliminate_biv PARAMS ((const struct loop *, struct iv_class *,
319 int, int, int));
320 static int maybe_eliminate_biv_1 PARAMS ((const struct loop *, rtx, rtx,
321 struct iv_class *, int,
322 basic_block, rtx));
323 static int last_use_this_basic_block PARAMS ((rtx, rtx));
324 static void record_initial PARAMS ((rtx, rtx, void *));
325 static void update_reg_last_use PARAMS ((rtx, rtx));
326 static rtx next_insn_in_loop PARAMS ((const struct loop *, rtx));
327 static void loop_regs_scan PARAMS ((const struct loop *, int));
328 static int count_insns_in_loop PARAMS ((const struct loop *));
329 static void load_mems PARAMS ((const struct loop *));
330 static int insert_loop_mem PARAMS ((rtx *, void *));
331 static int replace_loop_mem PARAMS ((rtx *, void *));
332 static void replace_loop_mems PARAMS ((rtx, rtx, rtx));
333 static int replace_loop_reg PARAMS ((rtx *, void *));
334 static void replace_loop_regs PARAMS ((rtx insn, rtx, rtx));
335 static void note_reg_stored PARAMS ((rtx, rtx, void *));
336 static void try_copy_prop PARAMS ((const struct loop *, rtx, unsigned int));
337 static void try_swap_copy_prop PARAMS ((const struct loop *, rtx,
338 unsigned int));
339 static int replace_label PARAMS ((rtx *, void *));
340 static rtx check_insn_for_givs PARAMS((struct loop *, rtx, int, int));
341 static rtx check_insn_for_bivs PARAMS((struct loop *, rtx, int, int));
342 static rtx gen_add_mult PARAMS ((rtx, rtx, rtx, rtx));
343 static void loop_regs_update PARAMS ((const struct loop *, rtx));
344 static int iv_add_mult_cost PARAMS ((rtx, rtx, rtx, rtx));
346 static rtx loop_insn_emit_after PARAMS((const struct loop *, basic_block,
347 rtx, rtx));
348 static rtx loop_call_insn_emit_before PARAMS((const struct loop *,
349 basic_block, rtx, rtx));
350 static rtx loop_call_insn_hoist PARAMS((const struct loop *, rtx));
351 static rtx loop_insn_sink_or_swim PARAMS((const struct loop *, rtx));
353 static void loop_dump_aux PARAMS ((const struct loop *, FILE *, int));
354 static void loop_delete_insns PARAMS ((rtx, rtx));
355 static HOST_WIDE_INT remove_constant_addition PARAMS ((rtx *));
356 void debug_ivs PARAMS ((const struct loop *));
357 void debug_iv_class PARAMS ((const struct iv_class *));
358 void debug_biv PARAMS ((const struct induction *));
359 void debug_giv PARAMS ((const struct induction *));
360 void debug_loop PARAMS ((const struct loop *));
361 void debug_loops PARAMS ((const struct loops *));
363 typedef struct rtx_pair
364 {
365 rtx r1;
366 rtx r2;
367 } rtx_pair;
369 typedef struct loop_replace_args
370 {
371 rtx match;
372 rtx replacement;
373 rtx insn;
374 } loop_replace_args;
376 /* Nonzero iff INSN is between START and END, inclusive. */
377 #define INSN_IN_RANGE_P(INSN, START, END) \
378 (INSN_UID (INSN) < max_uid_for_loop \
379 && INSN_LUID (INSN) >= INSN_LUID (START) \
380 && INSN_LUID (INSN) <= INSN_LUID (END))
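/* The uid bound is tested first because insns created by the loop pass
   itself have uids >= max_uid_for_loop and hence no valid luid; for
   those the macro conservatively yields zero.  */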
382 /* Indirect_jump_in_function is computed once per function. */
383 static int indirect_jump_in_function;
384 static int indirect_jump_in_function_p PARAMS ((rtx));
386 static int compute_luids PARAMS ((rtx, rtx, int));
388 static int biv_elimination_giv_has_0_offset PARAMS ((struct induction *,
389 struct induction *,
390 rtx));
392 /* Benefit penalty, if a giv is not replaceable, i.e. must emit an insn to
393 copy the value of the strength reduced giv to its original register. */
394 static int copy_cost;
396 /* Cost of using a register, to normalize the benefits of a giv. */
397 static int reg_address_cost;
399 void
400 init_loop ()
402 rtx reg = gen_rtx_REG (word_mode, LAST_VIRTUAL_REGISTER + 1);
404 reg_address_cost = address_cost (reg, SImode);
406 copy_cost = COSTS_N_INSNS (1);
409 /* Compute the mapping from uids to luids.
410 LUIDs are numbers assigned to insns, like uids,
411 except that luids increase monotonically through the code.
412 Start at insn START and stop just before END. Assign LUIDs
413 starting with PREV_LUID + 1. Return the last assigned LUID + 1. */
414 static int
415 compute_luids (start, end, prev_luid)
416 rtx start, end;
417 int prev_luid;
419 int i;
420 rtx insn;
422 for (insn = start, i = prev_luid; insn != end; insn = NEXT_INSN (insn))
424 if (INSN_UID (insn) >= max_uid_for_loop)
425 continue;
426 /* Don't assign luids to line-number NOTEs, so that the distance in
427 luids between two insns is not affected by -g. */
428 if (GET_CODE (insn) != NOTE
429 || NOTE_LINE_NUMBER (insn) <= 0)
430 uid_luid[INSN_UID (insn)] = ++i;
431 else
432 /* Give a line number note the same luid as preceding insn. */
433 uid_luid[INSN_UID (insn)] = i;
435 return i + 1;
438 /* Entry point of this file. Perform loop optimization
439 on the current function. F is the first insn of the function
440 and DUMPFILE is a stream for output of a trace of actions taken
441 (or 0 if none should be output). */
443 void
444 loop_optimize (f, dumpfile, flags)
445 /* f is the first instruction of a chain of insns for one function */
446 rtx f;
447 FILE *dumpfile;
448 int flags;
450 rtx insn;
451 int i;
452 struct loops loops_data;
453 struct loops *loops = &loops_data;
454 struct loop_info *loops_info;
456 loop_dump_stream = dumpfile;
458 init_recog_no_volatile ();
460 max_reg_before_loop = max_reg_num ();
461 loop_max_reg = max_reg_before_loop;
463 regs_may_share = 0;
465 /* Count the number of loops. */
467 max_loop_num = 0;
468 for (insn = f; insn; insn = NEXT_INSN (insn))
470 if (GET_CODE (insn) == NOTE
471 && NOTE_LINE_NUMBER (insn) == NOTE_INSN_LOOP_BEG)
472 max_loop_num++;
475 /* Don't waste time if no loops. */
476 if (max_loop_num == 0)
477 return;
479 loops->num = max_loop_num;
481 /* Get size to use for tables indexed by uids.
482 Leave some space for labels allocated by find_and_verify_loops. */
483 max_uid_for_loop = get_max_uid () + 1 + max_loop_num * 32;
485 uid_luid = (int *) xcalloc (max_uid_for_loop, sizeof (int));
486 uid_loop = (struct loop **) xcalloc (max_uid_for_loop,
487 sizeof (struct loop *));
489 /* Allocate storage for array of loops. */
490 loops->array = (struct loop *)
491 xcalloc (loops->num, sizeof (struct loop));
493 /* Find and process each loop.
494 First, find them, and record them in order of their beginnings. */
495 find_and_verify_loops (f, loops);
497 /* Allocate and initialize auxiliary loop information. */
498 loops_info = xcalloc (loops->num, sizeof (struct loop_info));
499 for (i = 0; i < loops->num; i++)
500 loops->array[i].aux = loops_info + i;
502 /* Now find all register lifetimes. This must be done after
503 find_and_verify_loops, because it might reorder the insns in the
504 function. */
505 reg_scan (f, max_reg_before_loop, 1);
507 /* This must occur after reg_scan so that registers created by gcse
508 will have entries in the register tables.
510 We could have added a call to reg_scan after gcse_main in toplev.c,
511 but moving this call to init_alias_analysis is more efficient. */
512 init_alias_analysis ();
514 /* See if we went too far. Note that get_max_uid already returns
515 one more than the maximum uid of all insns. */
516 if (get_max_uid () > max_uid_for_loop)
517 abort ();
518 /* Now reset it to the actual size we need. See above. */
519 max_uid_for_loop = get_max_uid ();
521 /* find_and_verify_loops has already called compute_luids, but it
522 might have rearranged code afterwards, so we need to recompute
523 the luids now. */
524 max_luid = compute_luids (f, NULL_RTX, 0);
526 /* Don't leave gaps in uid_luid for insns that have been
527 deleted. It is possible that the first or last insn
528 using some register has been deleted by cross-jumping.
529 Make sure that uid_luid for that former insn's uid
530 points to the general area where that insn used to be. */
531 for (i = 0; i < max_uid_for_loop; i++)
533 uid_luid[0] = uid_luid[i];
534 if (uid_luid[0] != 0)
535 break;
537 for (i = 0; i < max_uid_for_loop; i++)
538 if (uid_luid[i] == 0)
539 uid_luid[i] = uid_luid[i - 1];
541 /* Determine if the function has indirect jump. On some systems
542 this prevents low overhead loop instructions from being used. */
543 indirect_jump_in_function = indirect_jump_in_function_p (f);
545 /* Now scan the loops, last ones first, since this means inner ones are done
546 before outer ones. */
547 for (i = max_loop_num - 1; i >= 0; i--)
549 struct loop *loop = &loops->array[i];
551 if (! loop->invalid && loop->end)
552 scan_loop (loop, flags);
555 /* If there were lexical blocks inside the loop, they have been
556 replicated. We will now have more than one NOTE_INSN_BLOCK_BEG
557 and NOTE_INSN_BLOCK_END for each such block. We must duplicate
558 the BLOCKs as well. */
559 if (write_symbols != NO_DEBUG)
560 reorder_blocks ();
562 end_alias_analysis ();
564 /* Clean up. */
565 free (uid_luid);
566 free (uid_loop);
567 free (loops_info);
568 free (loops->array);
571 /* Returns the next insn, in execution order, after INSN. START and
572 END are the NOTE_INSN_LOOP_BEG and NOTE_INSN_LOOP_END for the loop,
573 respectively. LOOP->TOP, if non-NULL, is the top of the loop in the
574 insn-stream; it is used with loops that are entered near the
575 bottom. */
577 static rtx
578 next_insn_in_loop (loop, insn)
579 const struct loop *loop;
580 rtx insn;
582 insn = NEXT_INSN (insn);
584 if (insn == loop->end)
586 if (loop->top)
587 /* Go to the top of the loop, and continue there. */
588 insn = loop->top;
589 else
590 /* We're done. */
591 insn = NULL_RTX;
594 if (insn == loop->scan_start)
595 /* We're done. */
596 insn = NULL_RTX;
598 return insn;
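/* Typical traversal of a loop body with this helper (this exact
   pattern is used by scan_loop below).  */
#if 0
for (p = next_insn_in_loop (loop, loop->scan_start);
     p != NULL_RTX;
     p = next_insn_in_loop (loop, p))
  ...;
#endif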
601 /* Optimize one loop described by LOOP. */
603 /* ??? Could also move memory writes out of loops if the destination address
604 is invariant, the source is invariant, the memory write is not volatile,
605 and if we can prove that no read inside the loop can read this address
606 before the write occurs. If there is a read of this address after the
607 write, then we can also mark the memory read as invariant. */
609 static void
610 scan_loop (loop, flags)
611 struct loop *loop;
612 int flags;
614 struct loop_info *loop_info = LOOP_INFO (loop);
615 struct loop_regs *regs = LOOP_REGS (loop);
616 int i;
617 rtx loop_start = loop->start;
618 rtx loop_end = loop->end;
619 rtx p;
620 /* 1 if we are scanning insns that could be executed zero times. */
621 int maybe_never = 0;
622 /* 1 if we are scanning insns that might never be executed
623 due to a subroutine call which might exit before they are reached. */
624 int call_passed = 0;
625 /* Jump insn that enters the loop, or 0 if control drops in. */
626 rtx loop_entry_jump = 0;
627 /* Number of insns in the loop. */
628 int insn_count;
629 int tem;
630 rtx temp, update_start, update_end;
631 /* The SET from an insn, if it is the only SET in the insn. */
632 rtx set, set1;
633 /* Chain describing insns movable in current loop. */
634 struct loop_movables *movables = LOOP_MOVABLES (loop);
635 /* Ratio of extra register life span we can justify
636 for saving an instruction. More if loop doesn't call subroutines
637 since in that case saving an insn makes more difference
638 and more registers are available. */
639 int threshold;
640 /* Nonzero if we are scanning instructions in a sub-loop. */
641 int loop_depth = 0;
643 loop->top = 0;
645 movables->head = 0;
646 movables->last = 0;
648 /* Determine whether this loop starts with a jump down to a test at
649 the end. This will occur for a small number of loops with a test
650 that is too complex to duplicate in front of the loop.
652 We search for the first insn or label in the loop, skipping NOTEs.
653 However, we must be careful not to skip past a NOTE_INSN_LOOP_BEG
654 (because we might have a loop executed only once that contains a
655 loop which starts with a jump to its exit test) or a NOTE_INSN_LOOP_END
656 (in case we have a degenerate loop).
658 Note that if we mistakenly think that a loop is entered at the top
659 when, in fact, it is entered at the exit test, the only effect will be
660 slightly poorer optimization. Making the opposite error can generate
661 incorrect code. Since very few loops now start with a jump to the
662 exit test, the code here to detect that case is very conservative. */
664 for (p = NEXT_INSN (loop_start);
665 p != loop_end
666 && GET_CODE (p) != CODE_LABEL && ! INSN_P (p)
667 && (GET_CODE (p) != NOTE
668 || (NOTE_LINE_NUMBER (p) != NOTE_INSN_LOOP_BEG
669 && NOTE_LINE_NUMBER (p) != NOTE_INSN_LOOP_END));
670 p = NEXT_INSN (p))
673 loop->scan_start = p;
675 /* If loop end is the end of the current function, then emit a
676 NOTE_INSN_DELETED after loop_end and set loop->sink to the dummy
677 note insn. This is the position we use when sinking insns out of
678 the loop. */
679 if (NEXT_INSN (loop->end) != 0)
680 loop->sink = NEXT_INSN (loop->end);
681 else
682 loop->sink = emit_note_after (NOTE_INSN_DELETED, loop->end);
684 /* Set up variables describing this loop. */
685 prescan_loop (loop);
686 threshold = (loop_info->has_call ? 1 : 2) * (1 + n_non_fixed_regs);
688 /* If loop has a jump before the first label,
689 the true entry is the target of that jump.
690 Start scan from there.
691 But record in LOOP->TOP the place where the end-test jumps
692 back to so we can scan that after the end of the loop. */
693 if (GET_CODE (p) == JUMP_INSN)
695 loop_entry_jump = p;
697 /* Loop entry must be unconditional jump (and not a RETURN) */
698 if (any_uncondjump_p (p)
699 && JUMP_LABEL (p) != 0
700 /* Check to see whether the jump actually
701 jumps out of the loop (meaning it's no loop).
702 This case can happen for things like
703 do {..} while (0). If this label was generated previously
704 by loop, we can't tell anything about it and have to reject
705 the loop. */
706 && INSN_IN_RANGE_P (JUMP_LABEL (p), loop_start, loop_end))
708 loop->top = next_label (loop->scan_start);
709 loop->scan_start = JUMP_LABEL (p);
713 /* If LOOP->SCAN_START was an insn created by loop, we don't know its luid
714 as required by loop_reg_used_before_p. So skip such loops. (This
715 test may never be true, but it's best to play it safe.)
717 Also, skip loops where we do not start scanning at a label. This
718 test also rejects loops starting with a JUMP_INSN that failed the
719 test above. */
721 if (INSN_UID (loop->scan_start) >= max_uid_for_loop
722 || GET_CODE (loop->scan_start) != CODE_LABEL)
724 if (loop_dump_stream)
725 fprintf (loop_dump_stream, "\nLoop from %d to %d is phony.\n\n",
726 INSN_UID (loop_start), INSN_UID (loop_end));
727 return;
730 /* Allocate extra space for REGs that might be created by load_mems.
731 We allocate a little extra slop as well, in the hopes that we
732 won't have to reallocate the regs array. */
733 loop_regs_scan (loop, loop_info->mems_idx + 16);
734 insn_count = count_insns_in_loop (loop);
736 if (loop_dump_stream)
738 fprintf (loop_dump_stream, "\nLoop from %d to %d: %d real insns.\n",
739 INSN_UID (loop_start), INSN_UID (loop_end), insn_count);
740 if (loop->cont)
741 fprintf (loop_dump_stream, "Continue at insn %d.\n",
742 INSN_UID (loop->cont));
745 /* Scan through the loop finding insns that are safe to move.
746 Set REGS->ARRAY[I].SET_IN_LOOP negative for the reg I being set, so that
747 this reg will be considered invariant for subsequent insns.
748 We consider whether subsequent insns use the reg
749 in deciding whether it is worth actually moving.
751 MAYBE_NEVER is nonzero if we have passed a conditional jump insn
752 and therefore it is possible that the insns we are scanning
753 would never be executed. At such times, we must make sure
754 that it is safe to execute the insn once instead of zero times.
755 When MAYBE_NEVER is 0, all insns will be executed at least once
756 so that is not a problem. */
758 for (p = next_insn_in_loop (loop, loop->scan_start);
759 p != NULL_RTX;
760 p = next_insn_in_loop (loop, p))
762 if (GET_CODE (p) == INSN
763 && (set = single_set (p))
764 && GET_CODE (SET_DEST (set)) == REG
765 #ifdef PIC_OFFSET_TABLE_REG_CALL_CLOBBERED
766 && SET_DEST (set) != pic_offset_table_rtx
767 #endif
768 && ! regs->array[REGNO (SET_DEST (set))].may_not_optimize)
770 int tem1 = 0;
771 int tem2 = 0;
772 int move_insn = 0;
773 rtx src = SET_SRC (set);
774 rtx dependencies = 0;
776 /* Figure out what to use as a source of this insn. If a REG_EQUIV
777 note is given or if a REG_EQUAL note with a constant operand is
778 specified, use it as the source and mark that we should move
779 this insn by calling emit_move_insn rather than duplicating the
780 insn.
782 Otherwise, only use the REG_EQUAL contents if a REG_RETVAL note
783 is present. */
784 temp = find_reg_note (p, REG_EQUIV, NULL_RTX);
785 if (temp)
786 src = XEXP (temp, 0), move_insn = 1;
787 else
789 temp = find_reg_note (p, REG_EQUAL, NULL_RTX);
790 if (temp && CONSTANT_P (XEXP (temp, 0)))
791 src = XEXP (temp, 0), move_insn = 1;
792 if (temp && find_reg_note (p, REG_RETVAL, NULL_RTX))
794 src = XEXP (temp, 0);
795 /* A libcall block can use regs that don't appear in
796 the equivalent expression. To move the libcall,
797 we must move those regs too. */
798 dependencies = libcall_other_reg (p, src);
802 /* For parallels, add any possible uses to the dependencies, as we can't move
803 the insn without resolving them first. */
804 if (GET_CODE (PATTERN (p)) == PARALLEL)
806 for (i = 0; i < XVECLEN (PATTERN (p), 0); i++)
808 rtx x = XVECEXP (PATTERN (p), 0, i);
809 if (GET_CODE (x) == USE)
810 dependencies = gen_rtx_EXPR_LIST (VOIDmode, XEXP (x, 0), dependencies);
814 /* Don't try to optimize a register that was made
815 by loop-optimization for an inner loop.
816 We don't know its life-span, so we can't compute the benefit. */
817 if (REGNO (SET_DEST (set)) >= max_reg_before_loop)
819 else if (/* The register is used in basic blocks other
820 than the one where it is set (meaning that
821 something after this point in the loop might
822 depend on its value before the set). */
823 ! reg_in_basic_block_p (p, SET_DEST (set))
824 /* And the set is not guaranteed to be executed once
825 the loop starts, or the value before the set is
826 needed before the set occurs...
828 ??? Note we have quadratic behaviour here, mitigated
829 by the fact that the previous test will often fail for
830 large loops. Rather than re-scanning the entire loop
831 each time for register usage, we should build tables
832 of the register usage and use them here instead. */
833 && (maybe_never
834 || loop_reg_used_before_p (loop, set, p)))
835 /* It is unsafe to move the set.
837 This code used to consider it OK to move a set of a variable
838 which was not created by the user and not used in an exit test.
839 That behavior is incorrect and was removed. */
841 else if ((tem = loop_invariant_p (loop, src))
842 && (dependencies == 0
843 || (tem2 = loop_invariant_p (loop, dependencies)) != 0)
844 && (regs->array[REGNO (SET_DEST (set))].set_in_loop == 1
845 || (tem1
846 = consec_sets_invariant_p
847 (loop, SET_DEST (set),
848 regs->array[REGNO (SET_DEST (set))].set_in_loop,
849 p)))
850 /* If the insn can cause a trap (such as divide by zero),
851 can't move it unless it's guaranteed to be executed
852 once loop is entered. Even a function call might
853 prevent the trap insn from being reached
854 (since it might exit!) */
855 && ! ((maybe_never || call_passed)
856 && may_trap_p (src)))
858 struct movable *m;
859 int regno = REGNO (SET_DEST (set));
861 /* A potential lossage is where we have a case where two insns
862 can be combined as long as they are both in the loop, but
863 we move one of them outside the loop. For large loops,
864 this can lose. The most common case of this is the address
865 of a function being called.
867 Therefore, if this register is marked as being used exactly
868 once if we are in a loop with calls (a "large loop"), see if
869 we can replace the usage of this register with the source
870 of this SET. If we can, delete this insn.
872 Don't do this if P has a REG_RETVAL note or if we have
873 SMALL_REGISTER_CLASSES and SET_SRC is a hard register. */
875 if (loop_info->has_call
876 && regs->array[regno].single_usage != 0
877 && regs->array[regno].single_usage != const0_rtx
878 && REGNO_FIRST_UID (regno) == INSN_UID (p)
879 && (REGNO_LAST_UID (regno)
880 == INSN_UID (regs->array[regno].single_usage))
881 && regs->array[regno].set_in_loop == 1
882 && GET_CODE (SET_SRC (set)) != ASM_OPERANDS
883 && ! side_effects_p (SET_SRC (set))
884 && ! find_reg_note (p, REG_RETVAL, NULL_RTX)
885 && (! SMALL_REGISTER_CLASSES
886 || (! (GET_CODE (SET_SRC (set)) == REG
887 && REGNO (SET_SRC (set)) < FIRST_PSEUDO_REGISTER)))
888 /* This test is not redundant; SET_SRC (set) might be
889 a call-clobbered register and the life of REGNO
890 might span a call. */
891 && ! modified_between_p (SET_SRC (set), p,
892 regs->array[regno].single_usage)
893 && no_labels_between_p (p, regs->array[regno].single_usage)
894 && validate_replace_rtx (SET_DEST (set), SET_SRC (set),
895 regs->array[regno].single_usage))
897 /* Replace any usage in a REG_EQUAL note. Must copy the
898 new source, so that we don't get rtx sharing between the
899 SET_SOURCE and REG_NOTES of insn p. */
900 REG_NOTES (regs->array[regno].single_usage)
901 = replace_rtx (REG_NOTES (regs->array[regno].single_usage),
902 SET_DEST (set), copy_rtx (SET_SRC (set)));
904 delete_insn (p);
905 for (i = 0; i < LOOP_REGNO_NREGS (regno, SET_DEST (set)); i++)
906 regs->array[regno+i].set_in_loop = 0;
907 continue;
910 m = (struct movable *) xmalloc (sizeof (struct movable));
911 m->next = 0;
912 m->insn = p;
913 m->set_src = src;
914 m->dependencies = dependencies;
915 m->set_dest = SET_DEST (set);
916 m->force = 0;
917 m->consec = regs->array[REGNO (SET_DEST (set))].set_in_loop - 1;
918 m->done = 0;
919 m->forces = 0;
920 m->partial = 0;
921 m->move_insn = move_insn;
922 m->move_insn_first = 0;
923 m->is_equiv = (find_reg_note (p, REG_EQUIV, NULL_RTX) != 0);
924 m->savemode = VOIDmode;
925 m->regno = regno;
926 /* Set M->cond if either loop_invariant_p
927 or consec_sets_invariant_p returned 2
928 (only conditionally invariant). */
929 m->cond = ((tem | tem1 | tem2) > 1);
930 m->global = LOOP_REG_GLOBAL_P (loop, regno);
931 m->match = 0;
932 m->lifetime = LOOP_REG_LIFETIME (loop, regno);
933 m->savings = regs->array[regno].n_times_set;
934 if (find_reg_note (p, REG_RETVAL, NULL_RTX))
935 m->savings += libcall_benefit (p);
936 for (i = 0; i < LOOP_REGNO_NREGS (regno, SET_DEST (set)); i++)
937 regs->array[regno+i].set_in_loop = move_insn ? -2 : -1;
938 /* Add M to the end of the chain MOVABLES. */
939 loop_movables_add (movables, m);
941 if (m->consec > 0)
943 /* It is possible for the first instruction to have a
944 REG_EQUAL note but a non-invariant SET_SRC, so we must
945 remember the status of the first instruction in case
946 the last instruction doesn't have a REG_EQUAL note. */
947 m->move_insn_first = m->move_insn;
949 /* Skip this insn, not checking REG_LIBCALL notes. */
950 p = next_nonnote_insn (p);
951 /* Skip the consecutive insns, if there are any. */
952 p = skip_consec_insns (p, m->consec);
953 /* Back up to the last insn of the consecutive group. */
954 p = prev_nonnote_insn (p);
956 /* We must now reset m->move_insn, m->is_equiv, and possibly
957 m->set_src to correspond to the effects of all the
958 insns. */
959 temp = find_reg_note (p, REG_EQUIV, NULL_RTX);
960 if (temp)
961 m->set_src = XEXP (temp, 0), m->move_insn = 1;
962 else
964 temp = find_reg_note (p, REG_EQUAL, NULL_RTX);
965 if (temp && CONSTANT_P (XEXP (temp, 0)))
966 m->set_src = XEXP (temp, 0), m->move_insn = 1;
967 else
968 m->move_insn = 0;
971 m->is_equiv = (find_reg_note (p, REG_EQUIV, NULL_RTX) != 0);
974 /* If this register is always set within a STRICT_LOW_PART
975 or set to zero, then its high bytes are constant.
976 So clear them outside the loop and within the loop
977 just load the low bytes.
978 We must check that the machine has an instruction to do so.
979 Also, if the value loaded into the register
980 depends on the same register, this cannot be done. */
981 else if (SET_SRC (set) == const0_rtx
982 && GET_CODE (NEXT_INSN (p)) == INSN
983 && (set1 = single_set (NEXT_INSN (p)))
984 && GET_CODE (set1) == SET
985 && (GET_CODE (SET_DEST (set1)) == STRICT_LOW_PART)
986 && (GET_CODE (XEXP (SET_DEST (set1), 0)) == SUBREG)
987 && (SUBREG_REG (XEXP (SET_DEST (set1), 0))
988 == SET_DEST (set))
989 && !reg_mentioned_p (SET_DEST (set), SET_SRC (set1)))
991 int regno = REGNO (SET_DEST (set));
992 if (regs->array[regno].set_in_loop == 2)
994 struct movable *m;
995 m = (struct movable *) xmalloc (sizeof (struct movable));
996 m->next = 0;
997 m->insn = p;
998 m->set_dest = SET_DEST (set);
999 m->dependencies = 0;
1000 m->force = 0;
1001 m->consec = 0;
1002 m->done = 0;
1003 m->forces = 0;
1004 m->move_insn = 0;
1005 m->move_insn_first = 0;
1006 m->partial = 1;
1007 /* If the insn may not be executed on some cycles,
1008 we can't clear the whole reg; clear just high part.
1009 Not even if the reg is used only within this loop.
1010 Consider this:
1011 while (1)
1012 while (s != t) {
1013 if (foo ()) x = *s;
1014 use (x);
1015 }
1016 Clearing x before the inner loop could clobber a value
1017 being saved from the last time around the outer loop.
1018 However, if the reg is not used outside this loop
1019 and all uses of the register are in the same
1020 basic block as the store, there is no problem.
1022 If this insn was made by loop, we don't know its
1023 INSN_LUID and hence must make a conservative
1024 assumption. */
1025 m->global = (INSN_UID (p) >= max_uid_for_loop
1026 || LOOP_REG_GLOBAL_P (loop, regno)
1027 || (labels_in_range_p
1028 (p, REGNO_FIRST_LUID (regno))));
1029 if (maybe_never && m->global)
1030 m->savemode = GET_MODE (SET_SRC (set1));
1031 else
1032 m->savemode = VOIDmode;
1033 m->regno = regno;
1034 m->cond = 0;
1035 m->match = 0;
1036 m->lifetime = LOOP_REG_LIFETIME (loop, regno);
1037 m->savings = 1;
1038 for (i = 0; i < LOOP_REGNO_NREGS (regno, SET_DEST (set)); i++)
1039 regs->array[regno+i].set_in_loop = -1;
1040 /* Add M to the end of the chain MOVABLES. */
1041 loop_movables_add (movables, m);
1045 /* Past a call insn, we get to insns which might not be executed
1046 because the call might exit. This matters for insns that trap.
1047 Constant and pure call insns always return, so they don't count. */
1048 else if (GET_CODE (p) == CALL_INSN && ! CONST_OR_PURE_CALL_P (p))
1049 call_passed = 1;
1050 /* Past a label or a jump, we get to insns for which we
1051 can't count on whether or how many times they will be
1052 executed during each iteration. Therefore, we can
1053 only move out sets of trivial variables
1054 (those not used after the loop). */
1055 /* Similar code appears twice in strength_reduce. */
1056 else if ((GET_CODE (p) == CODE_LABEL || GET_CODE (p) == JUMP_INSN)
1057 /* If we enter the loop in the middle, and scan around to the
1058 beginning, don't set maybe_never for that. This must be an
1059 unconditional jump, otherwise the code at the top of the
1060 loop might never be executed. Unconditional jumps are
1061 followed by a barrier then the loop_end. */
1062 && ! (GET_CODE (p) == JUMP_INSN && JUMP_LABEL (p) == loop->top
1063 && NEXT_INSN (NEXT_INSN (p)) == loop_end
1064 && any_uncondjump_p (p)))
1065 maybe_never = 1;
1066 else if (GET_CODE (p) == NOTE)
1068 /* At the virtual top of a converted loop, insns are again known to
1069 be executed: logically, the loop begins here even though the exit
1070 code has been duplicated. */
1071 if (NOTE_LINE_NUMBER (p) == NOTE_INSN_LOOP_VTOP && loop_depth == 0)
1072 maybe_never = call_passed = 0;
1073 else if (NOTE_LINE_NUMBER (p) == NOTE_INSN_LOOP_BEG)
1074 loop_depth++;
1075 else if (NOTE_LINE_NUMBER (p) == NOTE_INSN_LOOP_END)
1076 loop_depth--;
1080 /* If one movable subsumes another, ignore that other. */
1082 ignore_some_movables (movables);
1084 /* For each movable insn, see if the reg that it loads
1085 leads when it dies right into another conditionally movable insn.
1086 If so, record that the second insn "forces" the first one,
1087 since the second can be moved only if the first is. */
1089 force_movables (movables);
1091 /* See if there are multiple movable insns that load the same value.
1092 If there are, make all but the first point at the first one
1093 through the `match' field, and add the priorities of them
1094 all together as the priority of the first. */
1096 combine_movables (movables, regs);
1098 /* Now consider each movable insn to decide whether it is worth moving.
1099 Store 0 in regs->array[I].set_in_loop for each reg I that is moved.
1101 Generally this increases code size, so do not move movables when
1102 optimizing for code size. */
1104 if (! optimize_size)
1106 move_movables (loop, movables, threshold, insn_count);
1108 /* Recalculate regs->array if move_movables has created new
1109 registers. */
1110 if (max_reg_num () > regs->num)
1112 loop_regs_scan (loop, 0);
1113 for (update_start = loop_start;
1114 PREV_INSN (update_start)
1115 && GET_CODE (PREV_INSN (update_start)) != CODE_LABEL;
1116 update_start = PREV_INSN (update_start))
1118 update_end = NEXT_INSN (loop_end);
1120 reg_scan_update (update_start, update_end, loop_max_reg);
1121 loop_max_reg = max_reg_num ();
1125 /* Now candidates that still are negative are those not moved.
1126 Change regs->array[I].set_in_loop to indicate that those are not actually
1127 invariant. */
1128 for (i = 0; i < regs->num; i++)
1129 if (regs->array[i].set_in_loop < 0)
1130 regs->array[i].set_in_loop = regs->array[i].n_times_set;
1132 /* Now that we've moved some things out of the loop, we might be able to
1133 hoist even more memory references. */
1134 load_mems (loop);
1136 /* Recalculate regs->array if load_mems has created new registers. */
1137 if (max_reg_num () > regs->num)
1138 loop_regs_scan (loop, 0);
1140 for (update_start = loop_start;
1141 PREV_INSN (update_start)
1142 && GET_CODE (PREV_INSN (update_start)) != CODE_LABEL;
1143 update_start = PREV_INSN (update_start))
1145 update_end = NEXT_INSN (loop_end);
1147 reg_scan_update (update_start, update_end, loop_max_reg);
1148 loop_max_reg = max_reg_num ();
1150 if (flag_strength_reduce)
1152 if (update_end && GET_CODE (update_end) == CODE_LABEL)
1153 /* Ensure our label doesn't go away. */
1154 LABEL_NUSES (update_end)++;
1156 strength_reduce (loop, flags);
1158 reg_scan_update (update_start, update_end, loop_max_reg);
1159 loop_max_reg = max_reg_num ();
1161 if (update_end && GET_CODE (update_end) == CODE_LABEL
1162 && --LABEL_NUSES (update_end) == 0)
1163 delete_related_insns (update_end);
1167 /* The movable information is required for strength reduction. */
1168 loop_movables_free (movables);
1170 free (regs->array);
1171 regs->array = 0;
1172 regs->num = 0;
1175 /* Add elements to *OUTPUT to record all the pseudo-regs
1176 mentioned in IN_THIS but not mentioned in NOT_IN_THIS. */
1178 void
1179 record_excess_regs (in_this, not_in_this, output)
1180 rtx in_this, not_in_this;
1181 rtx *output;
1183 enum rtx_code code;
1184 const char *fmt;
1185 int i;
1187 code = GET_CODE (in_this);
1189 switch (code)
1191 case PC:
1192 case CC0:
1193 case CONST_INT:
1194 case CONST_DOUBLE:
1195 case CONST:
1196 case SYMBOL_REF:
1197 case LABEL_REF:
1198 return;
1200 case REG:
1201 if (REGNO (in_this) >= FIRST_PSEUDO_REGISTER
1202 && ! reg_mentioned_p (in_this, not_in_this))
1203 *output = gen_rtx_EXPR_LIST (VOIDmode, in_this, *output);
1204 return;
1206 default:
1207 break;
1210 fmt = GET_RTX_FORMAT (code);
1211 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
1213 int j;
1215 switch (fmt[i])
1217 case 'E':
1218 for (j = 0; j < XVECLEN (in_this, i); j++)
1219 record_excess_regs (XVECEXP (in_this, i, j), not_in_this, output);
1220 break;
1222 case 'e':
1223 record_excess_regs (XEXP (in_this, i), not_in_this, output);
1224 break;
1229 /* Check what regs are referred to in the libcall block ending with INSN,
1230 aside from those mentioned in the equivalent value.
1231 If there are none, return 0.
1232 If there are one or more, return an EXPR_LIST containing all of them. */
1234 rtx
1235 libcall_other_reg (insn, equiv)
1236 rtx insn, equiv;
1238 rtx note = find_reg_note (insn, REG_RETVAL, NULL_RTX);
1239 rtx p = XEXP (note, 0);
1240 rtx output = 0;
1242 /* First, find all the regs used in the libcall block
1243 that are not mentioned as inputs to the result. */
1245 while (p != insn)
1247 if (GET_CODE (p) == INSN || GET_CODE (p) == JUMP_INSN
1248 || GET_CODE (p) == CALL_INSN)
1249 record_excess_regs (PATTERN (p), equiv, &output);
1250 p = NEXT_INSN (p);
1253 return output;
1256 /* Return 1 if all uses of REG
1257 are between INSN and the end of the basic block. */
1259 static int
1260 reg_in_basic_block_p (insn, reg)
1261 rtx insn, reg;
1263 int regno = REGNO (reg);
1264 rtx p;
1266 if (REGNO_FIRST_UID (regno) != INSN_UID (insn))
1267 return 0;
1269 /* Search this basic block for the already recorded last use of the reg. */
1270 for (p = insn; p; p = NEXT_INSN (p))
1272 switch (GET_CODE (p))
1274 case NOTE:
1275 break;
1277 case INSN:
1278 case CALL_INSN:
1279 /* Ordinary insn: if this is the last use, we win. */
1280 if (REGNO_LAST_UID (regno) == INSN_UID (p))
1281 return 1;
1282 break;
1284 case JUMP_INSN:
1285 /* Jump insn: if this is the last use, we win. */
1286 if (REGNO_LAST_UID (regno) == INSN_UID (p))
1287 return 1;
1288 /* Otherwise, it's the end of the basic block, so we lose. */
1289 return 0;
1291 case CODE_LABEL:
1292 case BARRIER:
1293 /* It's the end of the basic block, so we lose. */
1294 return 0;
1296 default:
1297 break;
1301 /* The "last use" that was recorded can't be found after the first
1302 use. This can happen when the last use was deleted while
1303 processing an inner loop, this inner loop was then completely
1304 unrolled, and the outer loop is always exited after the inner loop,
1305 so that everything after the first use becomes a single basic block. */
1306 return 1;
1309 /* Compute the benefit of eliminating the insns in the block whose
1310 last insn is LAST. This may be a group of insns used to compute a
1311 value directly, or it can contain a library call. */
1313 static int
1314 libcall_benefit (last)
1315 rtx last;
1317 rtx insn;
1318 int benefit = 0;
1320 for (insn = XEXP (find_reg_note (last, REG_RETVAL, NULL_RTX), 0);
1321 insn != last; insn = NEXT_INSN (insn))
1323 if (GET_CODE (insn) == CALL_INSN)
1324 benefit += 10; /* Assume at least this many insns in a library
1325 routine. */
1326 else if (GET_CODE (insn) == INSN
1327 && GET_CODE (PATTERN (insn)) != USE
1328 && GET_CODE (PATTERN (insn)) != CLOBBER)
1329 benefit++;
1332 return benefit;
1335 /* Skip COUNT insns from INSN, counting library calls as 1 insn. */
1337 static rtx
1338 skip_consec_insns (insn, count)
1339 rtx insn;
1340 int count;
1342 for (; count > 0; count--)
1344 rtx temp;
1346 /* If first insn of libcall sequence, skip to end. */
1347 /* Do this at start of loop, since INSN is guaranteed to
1348 be an insn here. */
1349 if (GET_CODE (insn) != NOTE
1350 && (temp = find_reg_note (insn, REG_LIBCALL, NULL_RTX)))
1351 insn = XEXP (temp, 0);
1354 insn = NEXT_INSN (insn);
1355 while (GET_CODE (insn) == NOTE);
1358 return insn;
1361 /* Ignore any movable whose insn falls within a libcall
1362 which is part of another movable.
1363 We make use of the fact that the movable for the libcall value
1364 was made later and so appears later on the chain. */
1366 static void
1367 ignore_some_movables (movables)
1368 struct loop_movables *movables;
1370 struct movable *m, *m1;
1372 for (m = movables->head; m; m = m->next)
1374 /* Is this a movable for the value of a libcall? */
1375 rtx note = find_reg_note (m->insn, REG_RETVAL, NULL_RTX);
1376 if (note)
1378 rtx insn;
1379 /* Check for earlier movables inside that range,
1380 and mark them invalid. We cannot use LUIDs here because
1381 insns created by loop.c for prior loops don't have LUIDs.
1382 Rather than reject all such insns from movables, we just
1383 explicitly check each insn in the libcall (since invariant
1384 libcalls aren't that common). */
1385 for (insn = XEXP (note, 0); insn != m->insn; insn = NEXT_INSN (insn))
1386 for (m1 = movables->head; m1 != m; m1 = m1->next)
1387 if (m1->insn == insn)
1388 m1->done = 1;
1393 /* For each movable insn, see if the reg that it loads
1394 leads when it dies right into another conditionally movable insn.
1395 If so, record that the second insn "forces" the first one,
1396 since the second can be moved only if the first is. */
1398 static void
1399 force_movables (movables)
1400 struct loop_movables *movables;
1402 struct movable *m, *m1;
1404 for (m1 = movables->head; m1; m1 = m1->next)
1405 /* Omit this if moving just the (SET (REG) 0) of a zero-extend. */
1406 if (!m1->partial && !m1->done)
1408 int regno = m1->regno;
1409 for (m = m1->next; m; m = m->next)
1410 /* ??? Could this be a bug? What if CSE caused the
1411 register of M1 to be used after this insn?
1412 Since CSE does not update regno_last_uid,
1413 this insn M->insn might not be where it dies.
1414 But very likely this doesn't matter; what matters is
1415 that M's reg is computed from M1's reg. */
1416 if (INSN_UID (m->insn) == REGNO_LAST_UID (regno)
1417 && !m->done)
1418 break;
1419 if (m != 0 && m->set_src == m1->set_dest
1420 /* If m->consec, m->set_src isn't valid. */
1421 && m->consec == 0)
1422 m = 0;
1424 /* Increase the priority of the moving the first insn
1425 since it permits the second to be moved as well. */
1426 if (m != 0)
1428 m->forces = m1;
1429 m1->lifetime += m->lifetime;
1430 m1->savings += m->savings;
1435 /* Find invariant expressions that are equal and can be combined into
1436 one register. */
1438 static void
1439 combine_movables (movables, regs)
1440 struct loop_movables *movables;
1441 struct loop_regs *regs;
1443 struct movable *m;
1444 char *matched_regs = (char *) xmalloc (regs->num);
1445 enum machine_mode mode;
1447 /* Regs that are set more than once are not allowed to match
1448 or be matched. I'm no longer sure why not. */
1449 /* Perhaps testing m->consec_sets would be more appropriate here? */
1451 for (m = movables->head; m; m = m->next)
1452 if (m->match == 0 && regs->array[m->regno].n_times_set == 1
1453 && !m->partial)
1455 struct movable *m1;
1456 int regno = m->regno;
1458 memset (matched_regs, 0, regs->num);
1459 matched_regs[regno] = 1;
1461 /* We want later insns to match the first one. Don't make the first
1462 one match any later ones. So start this loop at m->next. */
1463 for (m1 = m->next; m1; m1 = m1->next)
1464 /* ??? HACK! move_movables does not verify that the replacement
1465 is valid, which can have disastrous effects with hard regs
1466 and match_dup. Turn combination off for now. */
1467 if (0 && m != m1 && m1->match == 0
1468 && regs->array[m1->regno].n_times_set == 1
1469 /* A reg used outside the loop mustn't be eliminated. */
1470 && !m1->global
1471 /* A reg used for zero-extending mustn't be eliminated. */
1472 && !m1->partial
1473 && (matched_regs[m1->regno]
1476 /* Can combine regs with different modes loaded from the
1477 same constant only if the modes are the same or
1478 if both are integer modes with M wider or the same
1479 width as M1. The check for integer is redundant, but
1480 safe, since the only case of differing destination
1481 modes with equal sources is when both sources are
1482 VOIDmode, i.e., CONST_INT. */
1483 (GET_MODE (m->set_dest) == GET_MODE (m1->set_dest)
1484 || (GET_MODE_CLASS (GET_MODE (m->set_dest)) == MODE_INT
1485 && GET_MODE_CLASS (GET_MODE (m1->set_dest)) == MODE_INT
1486 && (GET_MODE_BITSIZE (GET_MODE (m->set_dest))
1487 >= GET_MODE_BITSIZE (GET_MODE (m1->set_dest)))))
1488 /* See if the source of M1 says it matches M. */
1489 && ((GET_CODE (m1->set_src) == REG
1490 && matched_regs[REGNO (m1->set_src)])
1491 || rtx_equal_for_loop_p (m->set_src, m1->set_src,
1492 movables, regs))))
1493 && ((m->dependencies == m1->dependencies)
1494 || rtx_equal_p (m->dependencies, m1->dependencies)))
1496 m->lifetime += m1->lifetime;
1497 m->savings += m1->savings;
1498 m1->done = 1;
1499 m1->match = m;
1500 matched_regs[m1->regno] = 1;
1504 /* Now combine the regs used for zero-extension.
1505 This can be done for those not marked `global'
1506 provided their lives don't overlap. */
1508 for (mode = GET_CLASS_NARROWEST_MODE (MODE_INT); mode != VOIDmode;
1509 mode = GET_MODE_WIDER_MODE (mode))
1511 struct movable *m0 = 0;
1513 /* Combine all the registers for extension from mode MODE.
1514 Don't combine any that are used outside this loop. */
1515 for (m = movables->head; m; m = m->next)
1516 if (m->partial && ! m->global
1517 && mode == GET_MODE (SET_SRC (PATTERN (NEXT_INSN (m->insn)))))
1519 struct movable *m1;
1521 int first = REGNO_FIRST_LUID (m->regno);
1522 int last = REGNO_LAST_LUID (m->regno);
1524 if (m0 == 0)
1526 /* First one: don't check for overlap, just record it. */
1527 m0 = m;
1528 continue;
1531 /* Make sure they extend to the same mode.
1532 (Almost always true.) */
1533 if (GET_MODE (m->set_dest) != GET_MODE (m0->set_dest))
1534 continue;
1536 /* We already have one: check for overlap with those
1537 already combined together. */
1538 for (m1 = movables->head; m1 != m; m1 = m1->next)
1539 if (m1 == m0 || (m1->partial && m1->match == m0))
1540 if (! (REGNO_FIRST_LUID (m1->regno) > last
1541 || REGNO_LAST_LUID (m1->regno) < first))
1542 goto overlap;
1544 /* No overlap: we can combine this with the others. */
1545 m0->lifetime += m->lifetime;
1546 m0->savings += m->savings;
1547 m->done = 1;
1548 m->match = m0;
1550 overlap:
1555 /* Clean up. */
1556 free (matched_regs);
1559 /* Returns the number of movable instructions in LOOP that were not
1560 moved outside the loop. */
1562 static int
1563 num_unmoved_movables (loop)
1564 const struct loop *loop;
1566 int num = 0;
1567 struct movable *m;
1569 for (m = LOOP_MOVABLES (loop)->head; m; m = m->next)
1570 if (!m->done)
1571 ++num;
1573 return num;
1577 /* Return 1 if regs X and Y will become the same if moved. */
1579 static int
1580 regs_match_p (x, y, movables)
1581 rtx x, y;
1582 struct loop_movables *movables;
1584 unsigned int xn = REGNO (x);
1585 unsigned int yn = REGNO (y);
1586 struct movable *mx, *my;
1588 for (mx = movables->head; mx; mx = mx->next)
1589 if (mx->regno == xn)
1590 break;
1592 for (my = movables->head; my; my = my->next)
1593 if (my->regno == yn)
1594 break;
1596 return (mx && my
1597 && ((mx->match == my->match && mx->match != 0)
1598 || mx->match == my
1599 || mx == my->match));
1602 /* Return 1 if X and Y are identical-looking rtx's.
1603 This is the Lisp function EQUAL for rtx arguments.
1605 If two registers are matching movables or a movable register and an
1606 equivalent constant, consider them equal. */
1608 static int
1609 rtx_equal_for_loop_p (x, y, movables, regs)
1610 rtx x, y;
1611 struct loop_movables *movables;
1612 struct loop_regs *regs;
1614 int i;
1615 int j;
1616 struct movable *m;
1617 enum rtx_code code;
1618 const char *fmt;
1620 if (x == y)
1621 return 1;
1622 if (x == 0 || y == 0)
1623 return 0;
1625 code = GET_CODE (x);
1627 /* If we have a register and a constant, they may sometimes be
1628 equal. */
1629 if (GET_CODE (x) == REG && regs->array[REGNO (x)].set_in_loop == -2
1630 && CONSTANT_P (y))
1632 for (m = movables->head; m; m = m->next)
1633 if (m->move_insn && m->regno == REGNO (x)
1634 && rtx_equal_p (m->set_src, y))
1635 return 1;
1637 else if (GET_CODE (y) == REG && regs->array[REGNO (y)].set_in_loop == -2
1638 && CONSTANT_P (x))
1640 for (m = movables->head; m; m = m->next)
1641 if (m->move_insn && m->regno == REGNO (y)
1642 && rtx_equal_p (m->set_src, x))
1643 return 1;
1646 /* Otherwise, rtx's of different codes cannot be equal. */
1647 if (code != GET_CODE (y))
1648 return 0;
1650 /* (MULT:SI x y) and (MULT:HI x y) are NOT equivalent.
1651 (REG:SI x) and (REG:HI x) are NOT equivalent. */
1653 if (GET_MODE (x) != GET_MODE (y))
1654 return 0;
1656 /* These three types of rtx's can be compared nonrecursively. */
1657 if (code == REG)
1658 return (REGNO (x) == REGNO (y) || regs_match_p (x, y, movables));
1660 if (code == LABEL_REF)
1661 return XEXP (x, 0) == XEXP (y, 0);
1662 if (code == SYMBOL_REF)
1663 return XSTR (x, 0) == XSTR (y, 0);
1665 /* Compare the elements. If any pair of corresponding elements
1666 fails to match, return 0 for the whole thing. */
1668 fmt = GET_RTX_FORMAT (code);
1669 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
1671 switch (fmt[i])
1673 case 'w':
1674 if (XWINT (x, i) != XWINT (y, i))
1675 return 0;
1676 break;
1678 case 'i':
1679 if (XINT (x, i) != XINT (y, i))
1680 return 0;
1681 break;
1683 case 'E':
1684 /* Two vectors must have the same length. */
1685 if (XVECLEN (x, i) != XVECLEN (y, i))
1686 return 0;
1688 /* And the corresponding elements must match. */
1689 for (j = 0; j < XVECLEN (x, i); j++)
1690 if (rtx_equal_for_loop_p (XVECEXP (x, i, j), XVECEXP (y, i, j),
1691 movables, regs) == 0)
1692 return 0;
1693 break;
1695 case 'e':
1696 if (rtx_equal_for_loop_p (XEXP (x, i), XEXP (y, i), movables, regs)
1697 == 0)
1698 return 0;
1699 break;
1701 case 's':
1702 if (strcmp (XSTR (x, i), XSTR (y, i)))
1703 return 0;
1704 break;
1706 case 'u':
1707 /* These are just backpointers, so they don't matter. */
1708 break;
1710 case '0':
1711 break;
1713 /* It is believed that rtx's at this level will never
1714 contain anything but integers and other rtx's,
1715 except for within LABEL_REFs and SYMBOL_REFs. */
1716 default:
1717 abort ();
1720 return 1;
1723 /* If X contains any LABEL_REF's, add REG_LABEL notes for them to all
1724 insns in INSNS which use the reference. LABEL_NUSES for CODE_LABEL
1725 references is incremented once for each added note. */
1727 static void
1728 add_label_notes (x, insns)
1729 rtx x;
1730 rtx insns;
1732 enum rtx_code code = GET_CODE (x);
1733 int i, j;
1734 const char *fmt;
1735 rtx insn;
1737 if (code == LABEL_REF && !LABEL_REF_NONLOCAL_P (x))
1739 /* This code used to ignore labels that referred to dispatch tables to
1740 avoid flow generating (slightly) worse code.
1742 We no longer ignore such label references (see LABEL_REF handling in
1743 mark_jump_label for additional information). */
1744 for (insn = insns; insn; insn = NEXT_INSN (insn))
1745 if (reg_mentioned_p (XEXP (x, 0), insn))
1747 REG_NOTES (insn) = gen_rtx_INSN_LIST (REG_LABEL, XEXP (x, 0),
1748 REG_NOTES (insn));
1749 if (LABEL_P (XEXP (x, 0)))
1750 LABEL_NUSES (XEXP (x, 0))++;
1754 fmt = GET_RTX_FORMAT (code);
1755 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
1757 if (fmt[i] == 'e')
1758 add_label_notes (XEXP (x, i), insns);
1759 else if (fmt[i] == 'E')
1760 for (j = XVECLEN (x, i) - 1; j >= 0; j--)
1761 add_label_notes (XVECEXP (x, i, j), insns);
1765 /* Scan MOVABLES, and move the insns that deserve to be moved.
1766 If two matching movables are combined, replace one reg with the
1767 other throughout. */
1769 static void
1770 move_movables (loop, movables, threshold, insn_count)
1771 struct loop *loop;
1772 struct loop_movables *movables;
1773 int threshold;
1774 int insn_count;
1776 struct loop_regs *regs = LOOP_REGS (loop);
1777 int nregs = regs->num;
1778 rtx new_start = 0;
1779 struct movable *m;
1780 rtx p;
1781 rtx loop_start = loop->start;
1782 rtx loop_end = loop->end;
1783 /* Map of pseudo-register replacements to handle combining
1784 when we move several insns that load the same value
1785 into different pseudo-registers. */
1786 rtx *reg_map = (rtx *) xcalloc (nregs, sizeof (rtx));
1787 char *already_moved = (char *) xcalloc (nregs, sizeof (char));
1789 for (m = movables->head; m; m = m->next)
1791 /* Describe this movable insn. */
1793 if (loop_dump_stream)
1795 fprintf (loop_dump_stream, "Insn %d: regno %d (life %d), ",
1796 INSN_UID (m->insn), m->regno, m->lifetime);
1797 if (m->consec > 0)
1798 fprintf (loop_dump_stream, "consec %d, ", m->consec);
1799 if (m->cond)
1800 fprintf (loop_dump_stream, "cond ");
1801 if (m->force)
1802 fprintf (loop_dump_stream, "force ");
1803 if (m->global)
1804 fprintf (loop_dump_stream, "global ");
1805 if (m->done)
1806 fprintf (loop_dump_stream, "done ");
1807 if (m->move_insn)
1808 fprintf (loop_dump_stream, "move-insn ");
1809 if (m->match)
1810 fprintf (loop_dump_stream, "matches %d ",
1811 INSN_UID (m->match->insn));
1812 if (m->forces)
1813 fprintf (loop_dump_stream, "forces %d ",
1814 INSN_UID (m->forces->insn));
1817 /* Ignore the insn if it's already done (it matched something else).
1818 Otherwise, see if it is now safe to move. */
1820 if (!m->done
1821 && (! m->cond
1822 || (1 == loop_invariant_p (loop, m->set_src)
1823 && (m->dependencies == 0
1824 || 1 == loop_invariant_p (loop, m->dependencies))
1825 && (m->consec == 0
1826 || 1 == consec_sets_invariant_p (loop, m->set_dest,
1827 m->consec + 1,
1828 m->insn))))
1829 && (! m->forces || m->forces->done))
1831 int regno;
1832 rtx p;
1833 int savings = m->savings;
1835 /* We have an insn that is safe to move.
1836 Compute its desirability. */
1838 p = m->insn;
1839 regno = m->regno;
1841 if (loop_dump_stream)
1842 fprintf (loop_dump_stream, "savings %d ", savings);
1844 if (regs->array[regno].moved_once && loop_dump_stream)
1845 fprintf (loop_dump_stream, "halved since already moved ");
1847 /* An insn MUST be moved if we already moved something else
1848 which is safe only if this one is moved too: that is,
1849 if already_moved[REGNO] is nonzero. */
1851 /* An insn is desirable to move if the new lifetime of the
1852 register is no more than THRESHOLD times the old lifetime.
1853 If it's not desirable, it means the loop is so big
1854 that moving won't speed things up much,
1855 and it is liable to make register usage worse. */
1857 /* It is also desirable to move if it can be moved at no
1858 extra cost because something else was already moved. */
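/* Worked example of the test below (hypothetical numbers): with
   THRESHOLD 6, SAVINGS 2 and a lifetime of 10 insns, the score
   6 * 2 * 10 = 120 beats an INSN_COUNT of 100 and the insn is moved;
   had the reg already been moved out of another loop, the bar would
   double to 200 and the move would be rejected.  */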
1860 if (already_moved[regno]
1861 || flag_move_all_movables
1862 || (threshold * savings * m->lifetime) >=
1863 (regs->array[regno].moved_once ? insn_count * 2 : insn_count)
1864 || (m->forces && m->forces->done
1865 && regs->array[m->forces->regno].n_times_set == 1))
1867 int count;
1868 struct movable *m1;
1869 rtx first = NULL_RTX;
1871 /* Now move the insns that set the reg. */
1873 if (m->partial && m->match)
1875 rtx newpat, i1;
1876 rtx r1, r2;
1877 /* Find the end of this chain of matching regs.
1878 Thus, we load each reg in the chain from that one reg.
1879 And that reg is loaded with 0 directly,
1880 since it has ->match == 0. */
1881 for (m1 = m; m1->match; m1 = m1->match);
1882 newpat = gen_move_insn (SET_DEST (PATTERN (m->insn)),
1883 SET_DEST (PATTERN (m1->insn)));
1884 i1 = loop_insn_hoist (loop, newpat);
1886 /* Mark the moved, invariant reg as being allowed to
1887 share a hard reg with the other matching invariant. */
1888 REG_NOTES (i1) = REG_NOTES (m->insn);
1889 r1 = SET_DEST (PATTERN (m->insn));
1890 r2 = SET_DEST (PATTERN (m1->insn));
1891 regs_may_share
1892 = gen_rtx_EXPR_LIST (VOIDmode, r1,
1893 gen_rtx_EXPR_LIST (VOIDmode, r2,
1894 regs_may_share));
1895 delete_insn (m->insn);
1897 if (new_start == 0)
1898 new_start = i1;
1900 if (loop_dump_stream)
1901 fprintf (loop_dump_stream, " moved to %d", INSN_UID (i1));
1903 /* If we are to re-generate the item being moved with a
1904 new move insn, first delete what we have and then emit
1905 the move insn before the loop. */
1906 else if (m->move_insn)
1908 rtx i1, temp, seq;
1910 for (count = m->consec; count >= 0; count--)
1912 /* If this is the first insn of a library call sequence,
1913 skip to the end. */
1914 if (GET_CODE (p) != NOTE
1915 && (temp = find_reg_note (p, REG_LIBCALL, NULL_RTX)))
1916 p = XEXP (temp, 0);
1918 /* If this is the last insn of a libcall sequence, then
1919 delete every insn in the sequence except the last.
1920 The last insn is handled in the normal manner. */
1921 if (GET_CODE (p) != NOTE
1922 && (temp = find_reg_note (p, REG_RETVAL, NULL_RTX)))
1924 temp = XEXP (temp, 0);
1925 while (temp != p)
1926 temp = delete_insn (temp);
1929 temp = p;
1930 p = delete_insn (p);
1932 /* simplify_giv_expr expects that it can walk the insns
1933 at m->insn forwards and see this old sequence we are
1934 tossing here. delete_insn does preserve the next
1935 pointers, but when we skip over a NOTE we must fix
1936 it up. Otherwise that code walks into the non-deleted
1937 insn stream. */
1938 while (p && GET_CODE (p) == NOTE)
1939 p = NEXT_INSN (temp) = NEXT_INSN (p);
1942 start_sequence ();
1943 emit_move_insn (m->set_dest, m->set_src);
1944 temp = get_insns ();
1945 seq = gen_sequence ();
1946 end_sequence ();
1948 add_label_notes (m->set_src, temp);
1950 i1 = loop_insn_hoist (loop, seq);
1951 if (! find_reg_note (i1, REG_EQUAL, NULL_RTX))
1952 set_unique_reg_note (i1,
1953 m->is_equiv ? REG_EQUIV : REG_EQUAL,
1954 m->set_src);
1956 if (loop_dump_stream)
1957 fprintf (loop_dump_stream, " moved to %d", INSN_UID (i1));
1959 /* The more regs we move, the less we like moving them. */
1960 threshold -= 3;
1962 else
1964 for (count = m->consec; count >= 0; count--)
1966 rtx i1, temp;
1968 /* If first insn of libcall sequence, skip to end. */
1969 /* Do this at start of loop, since p is guaranteed to
1970 be an insn here. */
1971 if (GET_CODE (p) != NOTE
1972 && (temp = find_reg_note (p, REG_LIBCALL, NULL_RTX)))
1973 p = XEXP (temp, 0);
1975 /* If last insn of libcall sequence, move all
1976 insns except the last before the loop. The last
1977 insn is handled in the normal manner. */
1978 if (GET_CODE (p) != NOTE
1979 && (temp = find_reg_note (p, REG_RETVAL, NULL_RTX)))
1981 rtx fn_address = 0;
1982 rtx fn_reg = 0;
1983 rtx fn_address_insn = 0;
1985 first = 0;
1986 for (temp = XEXP (temp, 0); temp != p;
1987 temp = NEXT_INSN (temp))
1989 rtx body;
1990 rtx n;
1991 rtx next;
1993 if (GET_CODE (temp) == NOTE)
1994 continue;
1996 body = PATTERN (temp);
1998 /* Find the next insn after TEMP,
1999 not counting USE or NOTE insns. */
2000 for (next = NEXT_INSN (temp); next != p;
2001 next = NEXT_INSN (next))
2002 if (! (GET_CODE (next) == INSN
2003 && GET_CODE (PATTERN (next)) == USE)
2004 && GET_CODE (next) != NOTE)
2005 break;
2007 /* If that is the call, this may be the insn
2008 that loads the function address.
2010 Extract the function address from the insn
2011 that loads it into a register.
2012 If this insn was cse'd, we get incorrect code.
2014 So emit a new move insn that copies the
2015 function address into the register that the
2016 call insn will use. flow.c will delete any
2017 redundant stores that we have created. */
2018 if (GET_CODE (next) == CALL_INSN
2019 && GET_CODE (body) == SET
2020 && GET_CODE (SET_DEST (body)) == REG
2021 && (n = find_reg_note (temp, REG_EQUAL,
2022 NULL_RTX)))
2024 fn_reg = SET_SRC (body);
2025 if (GET_CODE (fn_reg) != REG)
2026 fn_reg = SET_DEST (body);
2027 fn_address = XEXP (n, 0);
2028 fn_address_insn = temp;
2030 /* We have the call insn.
2031 If it uses the register we suspect it might,
2032 load it with the correct address directly. */
2033 if (GET_CODE (temp) == CALL_INSN
2034 && fn_address != 0
2035 && reg_referenced_p (fn_reg, body))
2036 loop_insn_emit_after (loop, 0, fn_address_insn,
2037 gen_move_insn
2038 (fn_reg, fn_address));
2040 if (GET_CODE (temp) == CALL_INSN)
2042 i1 = loop_call_insn_hoist (loop, body);
2043 /* Because the USAGE information potentially
2044 contains objects other than hard registers
2045 we need to copy it. */
2046 if (CALL_INSN_FUNCTION_USAGE (temp))
2047 CALL_INSN_FUNCTION_USAGE (i1)
2048 = copy_rtx (CALL_INSN_FUNCTION_USAGE (temp));
2050 else
2051 i1 = loop_insn_hoist (loop, body);
2052 if (first == 0)
2053 first = i1;
2054 if (temp == fn_address_insn)
2055 fn_address_insn = i1;
2056 REG_NOTES (i1) = REG_NOTES (temp);
2057 REG_NOTES (temp) = NULL;
2058 delete_insn (temp);
2060 if (new_start == 0)
2061 new_start = first;
2063 if (m->savemode != VOIDmode)
2065 /* P sets REG to zero; but we should clear only
2066 the bits that are not covered by the mode
2067 m->savemode. */
2068 rtx reg = m->set_dest;
2069 rtx sequence;
2070 rtx tem;
2072 start_sequence ();
2073 tem = expand_simple_binop
2074 (GET_MODE (reg), AND, reg,
2075 GEN_INT ((((HOST_WIDE_INT) 1
2076 << GET_MODE_BITSIZE (m->savemode)))
2077 - 1),
2078 reg, 1, OPTAB_LIB_WIDEN);
2079 if (tem == 0)
2080 abort ();
2081 if (tem != reg)
2082 emit_move_insn (reg, tem);
2083 sequence = gen_sequence ();
2084 end_sequence ();
2085 i1 = loop_insn_hoist (loop, sequence);
2087 else if (GET_CODE (p) == CALL_INSN)
2089 i1 = loop_call_insn_hoist (loop, PATTERN (p));
2090 /* Because the USAGE information potentially
2091 contains objects other than hard registers
2092 we need to copy it. */
2093 if (CALL_INSN_FUNCTION_USAGE (p))
2094 CALL_INSN_FUNCTION_USAGE (i1)
2095 = copy_rtx (CALL_INSN_FUNCTION_USAGE (p));
2097 else if (count == m->consec && m->move_insn_first)
2099 rtx seq;
2100 /* The SET_SRC might not be invariant, so we must
2101 use the REG_EQUAL note. */
2102 start_sequence ();
2103 emit_move_insn (m->set_dest, m->set_src);
2104 temp = get_insns ();
2105 seq = gen_sequence ();
2106 end_sequence ();
2108 add_label_notes (m->set_src, temp);
2110 i1 = loop_insn_hoist (loop, seq);
2111 if (! find_reg_note (i1, REG_EQUAL, NULL_RTX))
2112 set_unique_reg_note (i1, m->is_equiv ? REG_EQUIV
2113 : REG_EQUAL, m->set_src);
2115 else
2116 i1 = loop_insn_hoist (loop, PATTERN (p));
2118 if (REG_NOTES (i1) == 0)
2120 REG_NOTES (i1) = REG_NOTES (p);
2121 REG_NOTES (p) = NULL;
2123 /* If there is a REG_EQUAL note present whose value
2124 is not loop invariant, then delete it, since it
2125 may cause problems with later optimization passes.
2126 It is possible for cse to create such notes
2127 as a result of record_jump_cond. */
2129 if ((temp = find_reg_note (i1, REG_EQUAL, NULL_RTX))
2130 && ! loop_invariant_p (loop, XEXP (temp, 0)))
2131 remove_note (i1, temp);
2134 if (new_start == 0)
2135 new_start = i1;
2137 if (loop_dump_stream)
2138 fprintf (loop_dump_stream, " moved to %d",
2139 INSN_UID (i1));
2141 /* If library call, now fix the REG_NOTES that contain
2142 insn pointers, namely REG_LIBCALL on FIRST
2143 and REG_RETVAL on I1. */
2144 if ((temp = find_reg_note (i1, REG_RETVAL, NULL_RTX)))
2146 XEXP (temp, 0) = first;
2147 temp = find_reg_note (first, REG_LIBCALL, NULL_RTX);
2148 XEXP (temp, 0) = i1;
2151 temp = p;
2152 delete_insn (p);
2153 p = NEXT_INSN (p);
2155 /* simplify_giv_expr expects that it can walk the insns
2156 at m->insn forwards and see this old sequence we are
2157 tossing here. delete_insn does preserve the next
2158 pointers, but when we skip over a NOTE we must fix
2159 it up. Otherwise that code walks into the non-deleted
2160 insn stream. */
2161 while (p && GET_CODE (p) == NOTE)
2162 p = NEXT_INSN (temp) = NEXT_INSN (p);
2165 /* The more regs we move, the less we like moving them. */
2166 threshold -= 3;
2169 /* Any other movable that loads the same register
2170 MUST be moved. */
2171 already_moved[regno] = 1;
2173 /* This reg has been moved out of one loop. */
2174 regs->array[regno].moved_once = 1;
2176 /* The reg set here is now invariant. */
2177 if (! m->partial)
2179 int i;
2180 for (i = 0; i < LOOP_REGNO_NREGS (regno, m->set_dest); i++)
2181 regs->array[regno+i].set_in_loop = 0;
2184 m->done = 1;
2186 /* Change the length-of-life info for the register
2187 to say it lives at least the full length of this loop.
2188 This will help guide optimizations in outer loops. */
2190 if (REGNO_FIRST_LUID (regno) > INSN_LUID (loop_start))
2191 /* This is the old insn before all the moved insns.
2192 We can't use the moved insn because it is out of range
2193 in uid_luid. Only the old insns have luids. */
2194 REGNO_FIRST_UID (regno) = INSN_UID (loop_start);
2195 if (REGNO_LAST_LUID (regno) < INSN_LUID (loop_end))
2196 REGNO_LAST_UID (regno) = INSN_UID (loop_end);
2198 /* Combine with this moved insn any other matching movables. */
2200 if (! m->partial)
2201 for (m1 = movables->head; m1; m1 = m1->next)
2202 if (m1->match == m)
2204 rtx temp;
2206 /* Schedule the reg loaded by M1
2207 for replacement so that it shares the reg of M.
2208 If the modes differ (only possible in restricted
2209 circumstances), make a SUBREG.
2211 Note this assumes that the target dependent files
2212 treat REG and SUBREG equally, including within
2213 GO_IF_LEGITIMATE_ADDRESS and in all the
2214 predicates since we never verify that replacing the
2215 original register with a SUBREG results in a
2216 recognizable insn. */
2217 if (GET_MODE (m->set_dest) == GET_MODE (m1->set_dest))
2218 reg_map[m1->regno] = m->set_dest;
2219 else
2220 reg_map[m1->regno]
2221 = gen_lowpart_common (GET_MODE (m1->set_dest),
2222 m->set_dest);
2224 /* Get rid of the matching insn
2225 and prevent further processing of it. */
2226 m1->done = 1;
2228 /* If this is a library call, delete all its insns. */
2229 if ((temp = find_reg_note (m1->insn, REG_RETVAL,
2230 NULL_RTX)))
2231 delete_insn_chain (XEXP (temp, 0), m1->insn);
2232 else
2233 delete_insn (m1->insn);
2235 /* Any other movable that loads the same register
2236 MUST be moved. */
2237 already_moved[m1->regno] = 1;
2239 /* The reg merged here is now invariant,
2240 if the reg it matches is invariant. */
2241 if (! m->partial)
2243 int i;
2244 for (i = 0;
2245 i < LOOP_REGNO_NREGS (regno, m1->set_dest);
2246 i++)
2247 regs->array[m1->regno+i].set_in_loop = 0;
2251 else if (loop_dump_stream)
2252 fprintf (loop_dump_stream, "not desirable");
2254 else if (loop_dump_stream && !m->match)
2255 fprintf (loop_dump_stream, "not safe");
2257 if (loop_dump_stream)
2258 fprintf (loop_dump_stream, "\n");
2261 if (new_start == 0)
2262 new_start = loop_start;
2264 /* Go through all the instructions in the loop, making
2265 all the register substitutions scheduled in REG_MAP. */
2266 for (p = new_start; p != loop_end; p = NEXT_INSN (p))
2267 if (GET_CODE (p) == INSN || GET_CODE (p) == JUMP_INSN
2268 || GET_CODE (p) == CALL_INSN)
2270 replace_regs (PATTERN (p), reg_map, nregs, 0);
2271 replace_regs (REG_NOTES (p), reg_map, nregs, 0);
2272 INSN_CODE (p) = -1;
2275 /* Clean up. */
2276 free (reg_map);
2277 free (already_moved);
2281 static void
2282 loop_movables_add (movables, m)
2283 struct loop_movables *movables;
2284 struct movable *m;
2286 if (movables->head == 0)
2287 movables->head = m;
2288 else
2289 movables->last->next = m;
2290 movables->last = m;
2294 static void
2295 loop_movables_free (movables)
2296 struct loop_movables *movables;
2298 struct movable *m;
2299 struct movable *m_next;
2301 for (m = movables->head; m; m = m_next)
2303 m_next = m->next;
2304 free (m);
2308 #if 0
2309 /* Scan X and replace the address of any MEM in it with ADDR.
2310 REG is the address that MEM should have before the replacement. */
2312 static void
2313 replace_call_address (x, reg, addr)
2314 rtx x, reg, addr;
2316 enum rtx_code code;
2317 int i;
2318 const char *fmt;
2320 if (x == 0)
2321 return;
2322 code = GET_CODE (x);
2323 switch (code)
2325 case PC:
2326 case CC0:
2327 case CONST_INT:
2328 case CONST_DOUBLE:
2329 case CONST:
2330 case SYMBOL_REF:
2331 case LABEL_REF:
2332 case REG:
2333 return;
2335 case SET:
2336 /* Short cut for very common case. */
2337 replace_call_address (XEXP (x, 1), reg, addr);
2338 return;
2340 case CALL:
2341 /* Short cut for very common case. */
2342 replace_call_address (XEXP (x, 0), reg, addr);
2343 return;
2345 case MEM:
2346 /* If this MEM uses a reg other than the one we expected,
2347 something is wrong. */
2348 if (XEXP (x, 0) != reg)
2349 abort ();
2350 XEXP (x, 0) = addr;
2351 return;
2353 default:
2354 break;
2357 fmt = GET_RTX_FORMAT (code);
2358 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
2360 if (fmt[i] == 'e')
2361 replace_call_address (XEXP (x, i), reg, addr);
2362 else if (fmt[i] == 'E')
2364 int j;
2365 for (j = 0; j < XVECLEN (x, i); j++)
2366 replace_call_address (XVECEXP (x, i, j), reg, addr);
2370 #endif
2372 /* Return the number of memory refs to addresses that vary
2373 in the rtx X. */
2375 static int
2376 count_nonfixed_reads (loop, x)
2377 const struct loop *loop;
2378 rtx x;
2380 enum rtx_code code;
2381 int i;
2382 const char *fmt;
2383 int value;
2385 if (x == 0)
2386 return 0;
2388 code = GET_CODE (x);
2389 switch (code)
2391 case PC:
2392 case CC0:
2393 case CONST_INT:
2394 case CONST_DOUBLE:
2395 case CONST:
2396 case SYMBOL_REF:
2397 case LABEL_REF:
2398 case REG:
2399 return 0;
2401 case MEM:
2402 return ((loop_invariant_p (loop, XEXP (x, 0)) != 1)
2403 + count_nonfixed_reads (loop, XEXP (x, 0)));
2405 default:
2406 break;
2409 value = 0;
2410 fmt = GET_RTX_FORMAT (code);
2411 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
2413 if (fmt[i] == 'e')
2414 value += count_nonfixed_reads (loop, XEXP (x, i));
2415 if (fmt[i] == 'E')
2417 int j;
2418 for (j = 0; j < XVECLEN (x, i); j++)
2419 value += count_nonfixed_reads (loop, XVECEXP (x, i, j));
2422 return value;
2425 /* Scan a loop setting the elements `cont', `vtop', `loops_enclosed',
2426 `has_call', `has_nonconst_call', `has_volatile', `has_tablejump',
2427 `unknown_address_altered', `unknown_constant_address_altered', and
2428 `num_mem_sets' in LOOP. Also, fill in the array `mems' and the
2429 list `store_mems' in LOOP. */
2431 static void
2432 prescan_loop (loop)
2433 struct loop *loop;
2435 int level = 1;
2436 rtx insn;
2437 struct loop_info *loop_info = LOOP_INFO (loop);
2438 rtx start = loop->start;
2439 rtx end = loop->end;
2440 /* The label after END. Jumping here is just like falling off the
2441 end of the loop. We use next_nonnote_insn instead of next_label
2442 as a hedge against the (pathological) case where some actual insn
2443 might end up between the two. */
2444 rtx exit_target = next_nonnote_insn (end);
2446 loop_info->has_indirect_jump = indirect_jump_in_function;
2447 loop_info->pre_header_has_call = 0;
2448 loop_info->has_call = 0;
2449 loop_info->has_nonconst_call = 0;
2450 loop_info->has_volatile = 0;
2451 loop_info->has_tablejump = 0;
2452 loop_info->has_multiple_exit_targets = 0;
2453 loop->level = 1;
2455 loop_info->unknown_address_altered = 0;
2456 loop_info->unknown_constant_address_altered = 0;
2457 loop_info->store_mems = NULL_RTX;
2458 loop_info->first_loop_store_insn = NULL_RTX;
2459 loop_info->mems_idx = 0;
2460 loop_info->num_mem_sets = 0;
2463 for (insn = start; insn && GET_CODE (insn) != CODE_LABEL;
2464 insn = PREV_INSN (insn))
2466 if (GET_CODE (insn) == CALL_INSN)
2468 loop_info->pre_header_has_call = 1;
2469 break;
2473 for (insn = NEXT_INSN (start); insn != NEXT_INSN (end);
2474 insn = NEXT_INSN (insn))
2476 switch (GET_CODE (insn))
2478 case NOTE:
2479 if (NOTE_LINE_NUMBER (insn) == NOTE_INSN_LOOP_BEG)
2481 ++level;
2482 /* Count number of loops contained in this one. */
2483 loop->level++;
2485 else if (NOTE_LINE_NUMBER (insn) == NOTE_INSN_LOOP_END)
2486 --level;
2487 break;
2489 case CALL_INSN:
2490 if (! CONST_OR_PURE_CALL_P (insn))
2492 loop_info->unknown_address_altered = 1;
2493 loop_info->has_nonconst_call = 1;
2495 loop_info->has_call = 1;
2496 if (can_throw_internal (insn))
2497 loop_info->has_multiple_exit_targets = 1;
2498 break;
2500 case JUMP_INSN:
2501 if (! loop_info->has_multiple_exit_targets)
2503 rtx set = pc_set (insn);
2505 if (set)
2507 rtx src = SET_SRC (set);
2508 rtx label1, label2;
2510 if (GET_CODE (src) == IF_THEN_ELSE)
2512 label1 = XEXP (src, 1);
2513 label2 = XEXP (src, 2);
2515 else
2517 label1 = src;
2518 label2 = NULL_RTX;
2523 if (label1 && label1 != pc_rtx)
2525 if (GET_CODE (label1) != LABEL_REF)
2527 /* Something tricky. */
2528 loop_info->has_multiple_exit_targets = 1;
2529 break;
2531 else if (XEXP (label1, 0) != exit_target
2532 && LABEL_OUTSIDE_LOOP_P (label1))
2534 /* A jump outside the current loop. */
2535 loop_info->has_multiple_exit_targets = 1;
2536 break;
2540 label1 = label2;
2541 label2 = NULL_RTX;
2543 while (label1);
2545 else
2547 /* A return, or something tricky. */
2548 loop_info->has_multiple_exit_targets = 1;
2551 /* FALLTHRU */
2553 case INSN:
2554 if (volatile_refs_p (PATTERN (insn)))
2555 loop_info->has_volatile = 1;
2557 if (GET_CODE (insn) == JUMP_INSN
2558 && (GET_CODE (PATTERN (insn)) == ADDR_DIFF_VEC
2559 || GET_CODE (PATTERN (insn)) == ADDR_VEC))
2560 loop_info->has_tablejump = 1;
2562 note_stores (PATTERN (insn), note_addr_stored, loop_info);
2563 if (! loop_info->first_loop_store_insn && loop_info->store_mems)
2564 loop_info->first_loop_store_insn = insn;
2566 if (flag_non_call_exceptions && can_throw_internal (insn))
2567 loop_info->has_multiple_exit_targets = 1;
2568 break;
2570 default:
2571 break;
2575 /* Now, rescan the loop, setting up the LOOP_MEMS array. */
2576 if (/* An exception thrown by a called function might land us
2577 anywhere. */
2578 ! loop_info->has_nonconst_call
2579 /* We don't want loads for MEMs moved to a location before the
2580 one at which their stack memory becomes allocated. (Note
2581 that this is not a problem for malloc, etc., since those
2582 require actual function calls.) */
2583 && ! current_function_calls_alloca
2584 /* There are ways to leave the loop other than falling off the
2585 end. */
2586 && ! loop_info->has_multiple_exit_targets)
2587 for (insn = NEXT_INSN (start); insn != NEXT_INSN (end);
2588 insn = NEXT_INSN (insn))
2589 for_each_rtx (&insn, insert_loop_mem, loop_info);
2591 /* BLKmode MEMs are added to LOOP_STORE_MEM as necessary so
2592 that loop_invariant_p and load_mems can use true_dependence
2593 to determine what is really clobbered. */
2594 if (loop_info->unknown_address_altered)
2596 rtx mem = gen_rtx_MEM (BLKmode, const0_rtx);
2598 loop_info->store_mems
2599 = gen_rtx_EXPR_LIST (VOIDmode, mem, loop_info->store_mems);
2601 if (loop_info->unknown_constant_address_altered)
2603 rtx mem = gen_rtx_MEM (BLKmode, const0_rtx);
2605 RTX_UNCHANGING_P (mem) = 1;
2606 loop_info->store_mems
2607 = gen_rtx_EXPR_LIST (VOIDmode, mem, loop_info->store_mems);
2611 /* Scan the function looking for loops. Record the start and end of each loop.
2612 Also mark as invalid loops any loops that contain a setjmp or are branched
2613 to from outside the loop. */
2615 static void
2616 find_and_verify_loops (f, loops)
2617 rtx f;
2618 struct loops *loops;
2620 rtx insn;
2621 rtx label;
2622 int num_loops;
2623 struct loop *current_loop;
2624 struct loop *next_loop;
2625 struct loop *loop;
2627 num_loops = loops->num;
2629 compute_luids (f, NULL_RTX, 0);
2631 /* If there are jumps to undefined labels,
2632 treat them as jumps out of any/all loops.
2633 This also avoids writing past end of tables when there are no loops. */
2634 uid_loop[0] = NULL;
2636 /* Find boundaries of loops, mark which loops are contained within
2637 loops, and invalidate loops that have setjmp. */
2639 num_loops = 0;
2640 current_loop = NULL;
2641 for (insn = f; insn; insn = NEXT_INSN (insn))
2643 if (GET_CODE (insn) == NOTE)
2644 switch (NOTE_LINE_NUMBER (insn))
2646 case NOTE_INSN_LOOP_BEG:
2647 next_loop = loops->array + num_loops;
2648 next_loop->num = num_loops;
2649 num_loops++;
2650 next_loop->start = insn;
2651 next_loop->outer = current_loop;
2652 current_loop = next_loop;
2653 break;
2655 case NOTE_INSN_LOOP_CONT:
2656 current_loop->cont = insn;
2657 break;
2659 case NOTE_INSN_LOOP_VTOP:
2660 current_loop->vtop = insn;
2661 break;
2663 case NOTE_INSN_LOOP_END:
2664 if (! current_loop)
2665 abort ();
2667 current_loop->end = insn;
2668 current_loop = current_loop->outer;
2669 break;
2671 default:
2672 break;
2675 if (GET_CODE (insn) == CALL_INSN
2676 && find_reg_note (insn, REG_SETJMP, NULL))
2678 /* In this case, we must invalidate our current loop and any
2679 enclosing loop. */
2680 for (loop = current_loop; loop; loop = loop->outer)
2682 loop->invalid = 1;
2683 if (loop_dump_stream)
2684 fprintf (loop_dump_stream,
2685 "\nLoop at %d ignored due to setjmp.\n",
2686 INSN_UID (loop->start));
2690 /* Note that this will mark the NOTE_INSN_LOOP_END note as being in the
2691 enclosing loop, but this doesn't matter. */
2692 uid_loop[INSN_UID (insn)] = current_loop;
2695 /* Any loop containing a label used in an initializer must be invalidated,
2696 because it can be jumped into from anywhere. */
2698 for (label = forced_labels; label; label = XEXP (label, 1))
2700 for (loop = uid_loop[INSN_UID (XEXP (label, 0))];
2701 loop; loop = loop->outer)
2702 loop->invalid = 1;
2705 /* Any loop containing a label used for an exception handler must be
2706 invalidated, because it can be jumped into from anywhere. */
2708 for (label = exception_handler_labels; label; label = XEXP (label, 1))
2710 for (loop = uid_loop[INSN_UID (XEXP (label, 0))];
2711 loop; loop = loop->outer)
2712 loop->invalid = 1;
2715 /* Now scan all insn's in the function. If any JUMP_INSN branches into a
2716 loop that it is not contained within, that loop is marked invalid.
2717 If any INSN or CALL_INSN uses a label's address, then the loop containing
2718 that label is marked invalid, because it could be jumped into from
2719 anywhere.
2721 Also look for blocks of code ending in an unconditional branch that
2722 exits the loop. If such a block is surrounded by a conditional
2723 branch around the block, move the block elsewhere (see below) and
2724 invert the jump to point to the code block. This may eliminate a
2725 label in our loop and will simplify processing by both us and a
2726 possible second cse pass. */
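/* Schematically (labels are hypothetical), a loop body containing

	  beq L1		; conditional branch around the block
	  <block>
	  jmp Lexit		; unconditional branch out of the loop
	L1:

   becomes

	  bne Lnew		; inverted jump to the relocated block
	L1:

   with the block re-emitted after a BARRIER outside the loop:

	Lnew:
	  <block>
	  jmp Lexit  */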
2728 for (insn = f; insn; insn = NEXT_INSN (insn))
2729 if (INSN_P (insn))
2731 struct loop *this_loop = uid_loop[INSN_UID (insn)];
2733 if (GET_CODE (insn) == INSN || GET_CODE (insn) == CALL_INSN)
2735 rtx note = find_reg_note (insn, REG_LABEL, NULL_RTX);
2736 if (note)
2738 for (loop = uid_loop[INSN_UID (XEXP (note, 0))];
2739 loop; loop = loop->outer)
2740 loop->invalid = 1;
2744 if (GET_CODE (insn) != JUMP_INSN)
2745 continue;
2747 mark_loop_jump (PATTERN (insn), this_loop);
2749 /* See if this is an unconditional branch outside the loop. */
2750 if (this_loop
2751 && (GET_CODE (PATTERN (insn)) == RETURN
2752 || (any_uncondjump_p (insn)
2753 && onlyjump_p (insn)
2754 && (uid_loop[INSN_UID (JUMP_LABEL (insn))]
2755 != this_loop)))
2756 && get_max_uid () < max_uid_for_loop)
2758 rtx p;
2759 rtx our_next = next_real_insn (insn);
2760 rtx last_insn_to_move = NEXT_INSN (insn);
2761 struct loop *dest_loop;
2762 struct loop *outer_loop = NULL;
2764 /* Go backwards until we reach the start of the loop, a label,
2765 or a JUMP_INSN. */
2766 for (p = PREV_INSN (insn);
2767 GET_CODE (p) != CODE_LABEL
2768 && ! (GET_CODE (p) == NOTE
2769 && NOTE_LINE_NUMBER (p) == NOTE_INSN_LOOP_BEG)
2770 && GET_CODE (p) != JUMP_INSN;
2771 p = PREV_INSN (p))
2774 /* Check for the case where we have a jump to an inner nested
2775 loop, and do not perform the optimization in that case. */
2777 if (JUMP_LABEL (insn))
2779 dest_loop = uid_loop[INSN_UID (JUMP_LABEL (insn))];
2780 if (dest_loop)
2782 for (outer_loop = dest_loop; outer_loop;
2783 outer_loop = outer_loop->outer)
2784 if (outer_loop == this_loop)
2785 break;
2789 /* Make sure that the target of P is within the current loop. */
2791 if (GET_CODE (p) == JUMP_INSN && JUMP_LABEL (p)
2792 && uid_loop[INSN_UID (JUMP_LABEL (p))] != this_loop)
2793 outer_loop = this_loop;
2795 /* If we stopped on a JUMP_INSN to the next insn after INSN,
2796 we have a block of code to try to move.
2798 We look backward and then forward from the target of INSN
2799 to find a BARRIER at the same loop depth as the target.
2800 If we find such a BARRIER, we make a new label for the start
2801 of the block, invert the jump in P and point it to that label,
2802 and move the block of code to the spot we found. */
2804 if (! outer_loop
2805 && GET_CODE (p) == JUMP_INSN
2806 && JUMP_LABEL (p) != 0
2807 /* Just ignore jumps to labels that were never emitted.
2808 These always indicate compilation errors. */
2809 && INSN_UID (JUMP_LABEL (p)) != 0
2810 && any_condjump_p (p) && onlyjump_p (p)
2811 && next_real_insn (JUMP_LABEL (p)) == our_next
2812 /* If it's not safe to move the sequence, then we
2813 mustn't try. */
2814 && insns_safe_to_move_p (p, NEXT_INSN (insn),
2815 &last_insn_to_move))
2817 rtx target
2818 = JUMP_LABEL (insn) ? JUMP_LABEL (insn) : get_last_insn ();
2819 struct loop *target_loop = uid_loop[INSN_UID (target)];
2820 rtx loc, loc2;
2821 rtx tmp;
2823 /* Search for possible garbage past the conditional jumps
2824 and look for the last barrier. */
2825 for (tmp = last_insn_to_move;
2826 tmp && GET_CODE (tmp) != CODE_LABEL; tmp = NEXT_INSN (tmp))
2827 if (GET_CODE (tmp) == BARRIER)
2828 last_insn_to_move = tmp;
2830 for (loc = target; loc; loc = PREV_INSN (loc))
2831 if (GET_CODE (loc) == BARRIER
2832 /* Don't move things inside a tablejump. */
2833 && ((loc2 = next_nonnote_insn (loc)) == 0
2834 || GET_CODE (loc2) != CODE_LABEL
2835 || (loc2 = next_nonnote_insn (loc2)) == 0
2836 || GET_CODE (loc2) != JUMP_INSN
2837 || (GET_CODE (PATTERN (loc2)) != ADDR_VEC
2838 && GET_CODE (PATTERN (loc2)) != ADDR_DIFF_VEC))
2839 && uid_loop[INSN_UID (loc)] == target_loop)
2840 break;
2842 if (loc == 0)
2843 for (loc = target; loc; loc = NEXT_INSN (loc))
2844 if (GET_CODE (loc) == BARRIER
2845 /* Don't move things inside a tablejump. */
2846 && ((loc2 = next_nonnote_insn (loc)) == 0
2847 || GET_CODE (loc2) != CODE_LABEL
2848 || (loc2 = next_nonnote_insn (loc2)) == 0
2849 || GET_CODE (loc2) != JUMP_INSN
2850 || (GET_CODE (PATTERN (loc2)) != ADDR_VEC
2851 && GET_CODE (PATTERN (loc2)) != ADDR_DIFF_VEC))
2852 && uid_loop[INSN_UID (loc)] == target_loop)
2853 break;
2855 if (loc)
2857 rtx cond_label = JUMP_LABEL (p);
2858 rtx new_label = get_label_after (p);
2860 /* Ensure our label doesn't go away. */
2861 LABEL_NUSES (cond_label)++;
2863 /* Verify that uid_loop is large enough and that
2864 we can invert P. */
2865 if (invert_jump (p, new_label, 1))
2867 rtx q, r;
2869 /* If no suitable BARRIER was found, create a suitable
2870 one before TARGET. Since TARGET is a fall through
2871 path, we'll need to insert a jump around our block
2872 and add a BARRIER before TARGET.
2874 This creates an extra unconditional jump outside
2875 the loop. However, the benefits of removing rarely
2876 executed instructions from inside the loop usually
2877 outweigh the cost of the extra unconditional jump
2878 outside the loop. */
2879 if (loc == 0)
2881 rtx temp;
2883 temp = gen_jump (JUMP_LABEL (insn));
2884 temp = emit_jump_insn_before (temp, target);
2885 JUMP_LABEL (temp) = JUMP_LABEL (insn);
2886 LABEL_NUSES (JUMP_LABEL (insn))++;
2887 loc = emit_barrier_before (target);
2890 /* Include the BARRIER after INSN and copy the
2891 block after LOC. */
2892 if (squeeze_notes (&new_label, &last_insn_to_move))
2893 abort ();
2894 reorder_insns (new_label, last_insn_to_move, loc);
2896 /* All those insns are now in TARGET_LOOP. */
2897 for (q = new_label;
2898 q != NEXT_INSN (last_insn_to_move);
2899 q = NEXT_INSN (q))
2900 uid_loop[INSN_UID (q)] = target_loop;
2902 /* The label jumped to by INSN is no longer a loop
2903 exit. Unless INSN does not have a label (e.g.,
2904 it is a RETURN insn), search loop->exit_labels
2905 to find its label_ref, and remove it. Also turn
2906 off LABEL_OUTSIDE_LOOP_P bit. */
2907 if (JUMP_LABEL (insn))
2909 for (q = 0, r = this_loop->exit_labels;
2910 r;
2911 q = r, r = LABEL_NEXTREF (r))
2912 if (XEXP (r, 0) == JUMP_LABEL (insn))
2914 LABEL_OUTSIDE_LOOP_P (r) = 0;
2915 if (q)
2916 LABEL_NEXTREF (q) = LABEL_NEXTREF (r);
2917 else
2918 this_loop->exit_labels = LABEL_NEXTREF (r);
2919 break;
2922 for (loop = this_loop; loop && loop != target_loop;
2923 loop = loop->outer)
2924 loop->exit_count--;
2926 /* If we didn't find it, then something is
2927 wrong. */
2928 if (! r)
2929 abort ();
2932 /* P is now a jump outside the loop, so it must be put
2933 in loop->exit_labels, and marked as such.
2934 The easiest way to do this is to just call
2935 mark_loop_jump again for P. */
2936 mark_loop_jump (PATTERN (p), this_loop);
2938 /* If INSN now jumps to the insn after it,
2939 delete INSN. */
2940 if (JUMP_LABEL (insn) != 0
2941 && (next_real_insn (JUMP_LABEL (insn))
2942 == next_real_insn (insn)))
2943 delete_related_insns (insn);
2946 /* Continue the loop after where the conditional
2947 branch used to jump, since the only branch insn
2948 in the block (if it still remains) is an inter-loop
2949 branch and hence needs no processing. */
2950 insn = NEXT_INSN (cond_label);
2952 if (--LABEL_NUSES (cond_label) == 0)
2953 delete_related_insns (cond_label);
2955 /* This loop will be continued with NEXT_INSN (insn). */
2956 insn = PREV_INSN (insn);
2963 /* If any label in X branches to a loop different from LOOP and from any
2964 of the loops enclosing LOOP, mark the target loop invalid.
2966 For speed, we assume that X is part of a pattern of a JUMP_INSN. */
2968 static void
2969 mark_loop_jump (x, loop)
2970 rtx x;
2971 struct loop *loop;
2973 struct loop *dest_loop;
2974 struct loop *outer_loop;
2975 int i;
2977 switch (GET_CODE (x))
2979 case PC:
2980 case USE:
2981 case CLOBBER:
2982 case REG:
2983 case MEM:
2984 case CONST_INT:
2985 case CONST_DOUBLE:
2986 case RETURN:
2987 return;
2989 case CONST:
2990 /* There could be a label reference in here. */
2991 mark_loop_jump (XEXP (x, 0), loop);
2992 return;
2994 case PLUS:
2995 case MINUS:
2996 case MULT:
2997 mark_loop_jump (XEXP (x, 0), loop);
2998 mark_loop_jump (XEXP (x, 1), loop);
2999 return;
3001 case LO_SUM:
3002 /* This may refer to a LABEL_REF or SYMBOL_REF. */
3003 mark_loop_jump (XEXP (x, 1), loop);
3004 return;
3006 case SIGN_EXTEND:
3007 case ZERO_EXTEND:
3008 mark_loop_jump (XEXP (x, 0), loop);
3009 return;
3011 case LABEL_REF:
3012 dest_loop = uid_loop[INSN_UID (XEXP (x, 0))];
3014 /* Link together all labels that branch outside the loop. This
3015 is used by final_[bg]iv_value and the loop unrolling code. Also
3016 mark this LABEL_REF so we know that this branch should predict
3017 false. */
3019 /* A check to make sure the label is not in an inner nested loop,
3020 since this does not count as a loop exit. */
3021 if (dest_loop)
3023 for (outer_loop = dest_loop; outer_loop;
3024 outer_loop = outer_loop->outer)
3025 if (outer_loop == loop)
3026 break;
3028 else
3029 outer_loop = NULL;
3031 if (loop && ! outer_loop)
3033 LABEL_OUTSIDE_LOOP_P (x) = 1;
3034 LABEL_NEXTREF (x) = loop->exit_labels;
3035 loop->exit_labels = x;
3037 for (outer_loop = loop;
3038 outer_loop && outer_loop != dest_loop;
3039 outer_loop = outer_loop->outer)
3040 outer_loop->exit_count++;
3043 /* If this is inside a loop, but not in the current loop or one enclosed
3044 by it, it invalidates at least one loop. */
3046 if (! dest_loop)
3047 return;
3049 /* We must invalidate every nested loop containing the target of this
3050 label, except those that also contain the jump insn. */
3052 for (; dest_loop; dest_loop = dest_loop->outer)
3054 /* Stop when we reach a loop that also contains the jump insn. */
3055 for (outer_loop = loop; outer_loop; outer_loop = outer_loop->outer)
3056 if (dest_loop == outer_loop)
3057 return;
3059 /* If we get here, we know we need to invalidate a loop. */
3060 if (loop_dump_stream && ! dest_loop->invalid)
3061 fprintf (loop_dump_stream,
3062 "\nLoop at %d ignored due to multiple entry points.\n",
3063 INSN_UID (dest_loop->start));
3065 dest_loop->invalid = 1;
3067 return;
3069 case SET:
3070 /* If this is not setting pc, ignore. */
3071 if (SET_DEST (x) == pc_rtx)
3072 mark_loop_jump (SET_SRC (x), loop);
3073 return;
3075 case IF_THEN_ELSE:
3076 mark_loop_jump (XEXP (x, 1), loop);
3077 mark_loop_jump (XEXP (x, 2), loop);
3078 return;
3080 case PARALLEL:
3081 case ADDR_VEC:
3082 for (i = 0; i < XVECLEN (x, 0); i++)
3083 mark_loop_jump (XVECEXP (x, 0, i), loop);
3084 return;
3086 case ADDR_DIFF_VEC:
3087 for (i = 0; i < XVECLEN (x, 1); i++)
3088 mark_loop_jump (XVECEXP (x, 1, i), loop);
3089 return;
3091 default:
3092 /* Strictly speaking this is not a jump into the loop, only a possible
3093 jump out of the loop. However, we have no way to link the destination
3094 of this jump onto the list of exit labels. To be safe we mark this
3095 loop and any containing loops as invalid. */
3096 if (loop)
3098 for (outer_loop = loop; outer_loop; outer_loop = outer_loop->outer)
3100 if (loop_dump_stream && ! outer_loop->invalid)
3101 fprintf (loop_dump_stream,
3102 "\nLoop at %d ignored due to unknown exit jump.\n",
3103 INSN_UID (outer_loop->start));
3104 outer_loop->invalid = 1;
3107 return;
3111 /* Return nonzero if there is a label in the range from
3112 insn INSN to and including the insn whose luid is END.
3113 INSN must have an assigned luid (i.e., it must not have
3114 been previously created by loop.c). */
3116 static int
3117 labels_in_range_p (insn, end)
3118 rtx insn;
3119 int end;
3121 while (insn && INSN_LUID (insn) <= end)
3123 if (GET_CODE (insn) == CODE_LABEL)
3124 return 1;
3125 insn = NEXT_INSN (insn);
3128 return 0;
3131 /* Record that a memory reference X is being set. */
3133 static void
3134 note_addr_stored (x, y, data)
3135 rtx x;
3136 rtx y ATTRIBUTE_UNUSED;
3137 void *data ATTRIBUTE_UNUSED;
3139 struct loop_info *loop_info = data;
3141 if (x == 0 || GET_CODE (x) != MEM)
3142 return;
3144 /* Count number of memory writes.
3145 This affects heuristics in strength_reduce. */
3146 loop_info->num_mem_sets++;
3148 /* BLKmode MEM means all memory is clobbered. */
3149 if (GET_MODE (x) == BLKmode)
3151 if (RTX_UNCHANGING_P (x))
3152 loop_info->unknown_constant_address_altered = 1;
3153 else
3154 loop_info->unknown_address_altered = 1;
3156 return;
3159 loop_info->store_mems = gen_rtx_EXPR_LIST (VOIDmode, x,
3160 loop_info->store_mems);
3163 /* X is a value modified by an INSN that references a biv inside a loop
3164 exit test (i.e., X is somehow related to the value of the biv). If X
3165 is a pseudo that is used more than once, then the biv is (effectively)
3166 used more than once. DATA is a pointer to a loop_regs structure. */
3168 static void
3169 note_set_pseudo_multiple_uses (x, y, data)
3170 rtx x;
3171 rtx y ATTRIBUTE_UNUSED;
3172 void *data;
3174 struct loop_regs *regs = (struct loop_regs *) data;
3176 if (x == 0)
3177 return;
3179 while (GET_CODE (x) == STRICT_LOW_PART
3180 || GET_CODE (x) == SIGN_EXTRACT
3181 || GET_CODE (x) == ZERO_EXTRACT
3182 || GET_CODE (x) == SUBREG)
3183 x = XEXP (x, 0);
3185 if (GET_CODE (x) != REG || REGNO (x) < FIRST_PSEUDO_REGISTER)
3186 return;
3188 /* If we do not have usage information, or if we know the register
3189 is used more than once, note that fact for check_dbra_loop. */
3190 if (REGNO (x) >= max_reg_before_loop
3191 || ! regs->array[REGNO (x)].single_usage
3192 || regs->array[REGNO (x)].single_usage == const0_rtx)
3193 regs->multiple_uses = 1;
3196 /* Return nonzero if the rtx X is invariant over the current loop.
3198 The value is 2 if we refer to something only conditionally invariant.
3200 A memory ref is invariant if it is not volatile and does not conflict
3201 with anything stored in `loop_info->store_mems'. */
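/* Illustrative example: in (plus (reg 60) (const_int 4)), if reg 60 is
   set only by an insn we have conditionally decided to move
   (set_in_loop < 0), the REG scores 2 below, so the whole PLUS is
   conditionally invariant and we return 2.  */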
3203 int
3204 loop_invariant_p (loop, x)
3205 const struct loop *loop;
3206 rtx x;
3208 struct loop_info *loop_info = LOOP_INFO (loop);
3209 struct loop_regs *regs = LOOP_REGS (loop);
3210 int i;
3211 enum rtx_code code;
3212 const char *fmt;
3213 int conditional = 0;
3214 rtx mem_list_entry;
3216 if (x == 0)
3217 return 1;
3218 code = GET_CODE (x);
3219 switch (code)
3221 case CONST_INT:
3222 case CONST_DOUBLE:
3223 case SYMBOL_REF:
3224 case CONST:
3225 return 1;
3227 case LABEL_REF:
3228 /* A LABEL_REF is normally invariant, however, if we are unrolling
3229 loops, and this label is inside the loop, then it isn't invariant.
3230 This is because each unrolled copy of the loop body will have
3231 a copy of this label. If this was invariant, then an insn loading
3232 the address of this label into a register might get moved outside
3233 the loop, and then each loop body would end up using the same label.
3235 We don't know the loop bounds here though, so just fail for all
3236 labels. */
3237 if (flag_unroll_loops)
3238 return 0;
3239 else
3240 return 1;
3242 case PC:
3243 case CC0:
3244 case UNSPEC_VOLATILE:
3245 return 0;
3247 case REG:
3248 /* We used to check RTX_UNCHANGING_P (x) here, but that is invalid
3249 since the reg might be set by initialization within the loop. */
3251 if ((x == frame_pointer_rtx || x == hard_frame_pointer_rtx
3252 || x == arg_pointer_rtx || x == pic_offset_table_rtx)
3253 && ! current_function_has_nonlocal_goto)
3254 return 1;
3256 if (LOOP_INFO (loop)->has_call
3257 && REGNO (x) < FIRST_PSEUDO_REGISTER && call_used_regs[REGNO (x)])
3258 return 0;
3260 if (regs->array[REGNO (x)].set_in_loop < 0)
3261 return 2;
3263 return regs->array[REGNO (x)].set_in_loop == 0;
3265 case MEM:
3266 /* Volatile memory references must be rejected. Do this before
3267 checking for read-only items, so that volatile read-only items
3268 will be rejected also. */
3269 if (MEM_VOLATILE_P (x))
3270 return 0;
3272 /* See if there is any dependence between a store and this load. */
3273 mem_list_entry = loop_info->store_mems;
3274 while (mem_list_entry)
3276 if (true_dependence (XEXP (mem_list_entry, 0), VOIDmode,
3277 x, rtx_varies_p))
3278 return 0;
3280 mem_list_entry = XEXP (mem_list_entry, 1);
3283 /* It's not invalidated by a store in memory
3284 but we must still verify that the address is invariant. */
3285 break;
3287 case ASM_OPERANDS:
3288 /* Don't mess with insns declared volatile. */
3289 if (MEM_VOLATILE_P (x))
3290 return 0;
3291 break;
3293 default:
3294 break;
3297 fmt = GET_RTX_FORMAT (code);
3298 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
3300 if (fmt[i] == 'e')
3302 int tem = loop_invariant_p (loop, XEXP (x, i));
3303 if (tem == 0)
3304 return 0;
3305 if (tem == 2)
3306 conditional = 1;
3308 else if (fmt[i] == 'E')
3310 int j;
3311 for (j = 0; j < XVECLEN (x, i); j++)
3313 int tem = loop_invariant_p (loop, XVECEXP (x, i, j));
3314 if (tem == 0)
3315 return 0;
3316 if (tem == 2)
3317 conditional = 1;
3323 return 1 + conditional;
3326 /* Return nonzero if all the insns in the loop that set REG
3327 are INSN and the immediately following insns,
3328 and if each of those insns sets REG in an invariant way
3329 (not counting uses of REG in them).
3331 The value is 2 if some of these insns are only conditionally invariant.
3333 We assume that INSN itself is the first set of REG
3334 and that its source is invariant. */
3336 static int
3337 consec_sets_invariant_p (loop, reg, n_sets, insn)
3338 const struct loop *loop;
3339 int n_sets;
3340 rtx reg, insn;
3342 struct loop_regs *regs = LOOP_REGS (loop);
3343 rtx p = insn;
3344 unsigned int regno = REGNO (reg);
3345 rtx temp;
3346 /* Number of sets we have to insist on finding after INSN. */
3347 int count = n_sets - 1;
3348 int old = regs->array[regno].set_in_loop;
3349 int value = 0;
3350 int this;
3352 /* If N_SETS hit the limit, we can't rely on its value. */
3353 if (n_sets == 127)
3354 return 0;
3356 regs->array[regno].set_in_loop = 0;
3358 while (count > 0)
3360 enum rtx_code code;
3361 rtx set;
3363 p = NEXT_INSN (p);
3364 code = GET_CODE (p);
3366 /* If library call, skip to end of it. */
3367 if (code == INSN && (temp = find_reg_note (p, REG_LIBCALL, NULL_RTX)))
3368 p = XEXP (temp, 0);
3370 this = 0;
3371 if (code == INSN
3372 && (set = single_set (p))
3373 && GET_CODE (SET_DEST (set)) == REG
3374 && REGNO (SET_DEST (set)) == regno)
3376 this = loop_invariant_p (loop, SET_SRC (set));
3377 if (this != 0)
3378 value |= this;
3379 else if ((temp = find_reg_note (p, REG_EQUAL, NULL_RTX)))
3381 /* If this is a libcall, then any invariant REG_EQUAL note is OK.
3382 If this is an ordinary insn, then only CONSTANT_P REG_EQUAL
3383 notes are OK. */
3384 this = (CONSTANT_P (XEXP (temp, 0))
3385 || (find_reg_note (p, REG_RETVAL, NULL_RTX)
3386 && loop_invariant_p (loop, XEXP (temp, 0))));
3387 if (this != 0)
3388 value |= this;
3391 if (this != 0)
3392 count--;
3393 else if (code != NOTE)
3395 regs->array[regno].set_in_loop = old;
3396 return 0;
3400 regs->array[regno].set_in_loop = old;
3401 /* If loop_invariant_p ever returned 2, we return 2. */
3402 return 1 + (value & 2);
3405 #if 0
3406 /* I don't think this condition is sufficient to allow INSN
3407 to be moved, so we no longer test it. */
3409 /* Return 1 if all insns in the basic block of INSN and following INSN
3410 that set REG are invariant according to TABLE. */
3412 static int
3413 all_sets_invariant_p (reg, insn, table)
3414 rtx reg, insn;
3415 short *table;
3417 rtx p = insn;
3418 int regno = REGNO (reg);
3420 while (1)
3422 enum rtx_code code;
3423 p = NEXT_INSN (p);
3424 code = GET_CODE (p);
3425 if (code == CODE_LABEL || code == JUMP_INSN)
3426 return 1;
3427 if (code == INSN && GET_CODE (PATTERN (p)) == SET
3428 && GET_CODE (SET_DEST (PATTERN (p))) == REG
3429 && REGNO (SET_DEST (PATTERN (p))) == regno)
3431 if (! loop_invariant_p (loop, SET_SRC (PATTERN (p)), table))
3432 return 0;
3436 #endif /* 0 */
3438 /* Look at all uses (not sets) of registers in X. For each, if it is
3439 the single use, set USAGE[REGNO] to INSN; if there was a previous use in
3440 a different insn, set USAGE[REGNO] to const0_rtx. */
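/* For example (hypothetical uids): if (reg 61) is used only in insn 42,
   USAGE[61] ends up as insn 42; a second use in a different insn
   demotes USAGE[61] to const0_rtx.  */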
3442 static void
3443 find_single_use_in_loop (regs, insn, x)
3444 struct loop_regs *regs;
3445 rtx insn;
3446 rtx x;
3448 enum rtx_code code = GET_CODE (x);
3449 const char *fmt = GET_RTX_FORMAT (code);
3450 int i, j;
3452 if (code == REG)
3453 regs->array[REGNO (x)].single_usage
3454 = (regs->array[REGNO (x)].single_usage != 0
3455 && regs->array[REGNO (x)].single_usage != insn)
3456 ? const0_rtx : insn;
3458 else if (code == SET)
3460 /* Don't count SET_DEST if it is a REG; otherwise count things
3461 in SET_DEST because if a register is partially modified, it won't
3462 show up as a potential movable so we don't care how USAGE is set
3463 for it. */
3464 if (GET_CODE (SET_DEST (x)) != REG)
3465 find_single_use_in_loop (regs, insn, SET_DEST (x));
3466 find_single_use_in_loop (regs, insn, SET_SRC (x));
3468 else
3469 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
3471 if (fmt[i] == 'e' && XEXP (x, i) != 0)
3472 find_single_use_in_loop (regs, insn, XEXP (x, i));
3473 else if (fmt[i] == 'E')
3474 for (j = XVECLEN (x, i) - 1; j >= 0; j--)
3475 find_single_use_in_loop (regs, insn, XVECEXP (x, i, j));
3479 /* Count and record any set in X which is contained in INSN. Update
3480 REGS->array[I].MAY_NOT_OPTIMIZE and LAST_SET for any register I set
3481 in X. */
3483 static void
3484 count_one_set (regs, insn, x, last_set)
3485 struct loop_regs *regs;
3486 rtx insn, x;
3487 rtx *last_set;
3489 if (GET_CODE (x) == CLOBBER && GET_CODE (XEXP (x, 0)) == REG)
3490 /* Don't move a reg that has an explicit clobber.
3491 It's not worth the pain to try to do it correctly. */
3492 regs->array[REGNO (XEXP (x, 0))].may_not_optimize = 1;
3494 if (GET_CODE (x) == SET || GET_CODE (x) == CLOBBER)
3496 rtx dest = SET_DEST (x);
3497 while (GET_CODE (dest) == SUBREG
3498 || GET_CODE (dest) == ZERO_EXTRACT
3499 || GET_CODE (dest) == SIGN_EXTRACT
3500 || GET_CODE (dest) == STRICT_LOW_PART)
3501 dest = XEXP (dest, 0);
3502 if (GET_CODE (dest) == REG)
3504 int i;
3505 int regno = REGNO (dest);
3506 for (i = 0; i < LOOP_REGNO_NREGS (regno, dest); i++)
3508 /* If this is the first setting of this reg
3509 in current basic block, and it was set before,
3510 it must be set in two basic blocks, so it cannot
3511 be moved out of the loop. */
3512 if (regs->array[regno].set_in_loop > 0
3513 && last_set[regno] == 0)
3514 regs->array[regno+i].may_not_optimize = 1;
3515 /* If this is not first setting in current basic block,
3516 see if reg was used in between previous one and this.
3517 If so, neither one can be moved. */
3518 if (last_set[regno] != 0
3519 && reg_used_between_p (dest, last_set[regno], insn))
3520 regs->array[regno+i].may_not_optimize = 1;
3521 if (regs->array[regno+i].set_in_loop < 127)
3522 ++regs->array[regno+i].set_in_loop;
3523 last_set[regno+i] = insn;
3529 /* Given a loop that is bounded by LOOP->START and LOOP->END and that
3530 is entered at LOOP->SCAN_START, return 1 if the register set in SET
3531 contained in insn INSN is used by any insn that precedes INSN in
3532 cyclic order starting from the loop entry point.
3534 We don't want to use INSN_LUID here because if we restrict INSN to those
3535 that have a valid INSN_LUID, it means we cannot move an invariant out
3536 from an inner loop past two loops. */
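/* For example: if the loop is entered at SCAN_START in the middle of
   its body, an insn textually earlier than SCAN_START executes later
   in cyclic order, and is only reached here after wrapping from
   LOOP->END back to LOOP->START.  */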
3538 static int
3539 loop_reg_used_before_p (loop, set, insn)
3540 const struct loop *loop;
3541 rtx set, insn;
3543 rtx reg = SET_DEST (set);
3544 rtx p;
3546 /* Scan forward checking for register usage. If we hit INSN, we
3547 are done. Otherwise, if we hit LOOP->END, wrap around to LOOP->START. */
3548 for (p = loop->scan_start; p != insn; p = NEXT_INSN (p))
3550 if (INSN_P (p) && reg_overlap_mentioned_p (reg, PATTERN (p)))
3551 return 1;
3553 if (p == loop->end)
3554 p = loop->start;
3557 return 0;
3561 /* Information we collect about arrays that we might want to prefetch. */
3562 struct prefetch_info
3564 struct iv_class *class; /* Class this prefetch is based on. */
3565 struct induction *giv; /* GIV this prefetch is based on. */
3566 rtx base_address; /* Start prefetching from this address plus
3567 index. */
3568 HOST_WIDE_INT index;
3569 HOST_WIDE_INT stride; /* Prefetch stride in bytes in each
3570 iteration. */
3571 unsigned int bytes_accesed; /* Sum of sizes of all accesses to this
3572 prefetch area in one iteration. */
3573 unsigned int total_bytes; /* Total bytes loop will access in this block.
3574 This is set only for loops with known
3575 iteration counts and is 0xffffffff
3576 otherwise. */
3577 unsigned int write : 1; /* 1 if this block is written to (needs a read/write prefetch). */
3578 unsigned int prefetch_in_loop : 1;
3579 /* 1 if chosen to prefetch inside the loop body. */
3580 unsigned int prefetch_before_loop : 1;
3581 /* 1 if chosen to prefetch before the loop. */
3584 /* Data used by check_store function. */
3585 struct check_store_data
3587 rtx mem_address;
3588 int mem_write;
3591 static void check_store PARAMS ((rtx, rtx, void *));
3592 static void emit_prefetch_instructions PARAMS ((struct loop *));
3593 static int rtx_equal_for_prefetch_p PARAMS ((rtx, rtx));
3595 /* Set mem_write when mem_address is found. Used as callback to
3596 note_stores. */
3597 static void
3598 check_store (x, pat, data)
3599 rtx x, pat ATTRIBUTE_UNUSED;
3600 void *data;
3602 struct check_store_data *d = (struct check_store_data *) data;
3604 if ((GET_CODE (x) == MEM) && rtx_equal_p (d->mem_address, XEXP (x, 0)))
3605 d->mem_write = 1;
3608 /* Like rtx_equal_p, but attempts to swap commutative operands. This is
3609 important to get some addresses combined. Later more sophisticated
3610 transformations can be added when necessary.
3612 ??? The same operand-swapping trick is done in several other places;
3613 it would be nice to develop some common way to handle this. */
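/* For example (hypothetical regs): (plus (reg 60) (reg 61)) is
   considered equal to (plus (reg 61) (reg 60)) here, whereas plain
   rtx_equal_p would reject that pair.  */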
3615 static int
3616 rtx_equal_for_prefetch_p (x, y)
3617 rtx x, y;
3619 int i;
3620 int j;
3621 enum rtx_code code = GET_CODE (x);
3622 const char *fmt;
3624 if (x == y)
3625 return 1;
3626 if (code != GET_CODE (y))
3627 return 0;
3629 code = GET_CODE (x);
3631 if (GET_RTX_CLASS (code) == 'c')
3633 return ((rtx_equal_for_prefetch_p (XEXP (x, 0), XEXP (y, 0))
3634 && rtx_equal_for_prefetch_p (XEXP (x, 1), XEXP (y, 1)))
3635 || (rtx_equal_for_prefetch_p (XEXP (x, 0), XEXP (y, 1))
3636 && rtx_equal_for_prefetch_p (XEXP (x, 1), XEXP (y, 0))));
3638 /* Compare the elements. If any pair of corresponding elements fails to
3639 match, return 0 for the whole thing. */
3641 fmt = GET_RTX_FORMAT (code);
3642 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
3644 switch (fmt[i])
3646 case 'w':
3647 if (XWINT (x, i) != XWINT (y, i))
3648 return 0;
3649 break;
3651 case 'i':
3652 if (XINT (x, i) != XINT (y, i))
3653 return 0;
3654 break;
3656 case 'E':
3657 /* Two vectors must have the same length. */
3658 if (XVECLEN (x, i) != XVECLEN (y, i))
3659 return 0;
3661 /* And the corresponding elements must match. */
3662 for (j = 0; j < XVECLEN (x, i); j++)
3663 if (rtx_equal_for_prefetch_p (XVECEXP (x, i, j),
3664 XVECEXP (y, i, j)) == 0)
3665 return 0;
3666 break;
3668 case 'e':
3669 if (rtx_equal_for_prefetch_p (XEXP (x, i), XEXP (y, i)) == 0)
3670 return 0;
3671 break;
3673 case 's':
3674 if (strcmp (XSTR (x, i), XSTR (y, i)))
3675 return 0;
3676 break;
3678 case 'u':
3679 /* These are just backpointers, so they don't matter. */
3680 break;
3682 case '0':
3683 break;
3685 /* It is believed that rtx's at this level will never
3686 contain anything but integers and other rtx's,
3687 except for within LABEL_REFs and SYMBOL_REFs. */
3688 default:
3689 abort ();
3692 return 1;
3695 /* Remove constant addition value from the expression X (when present)
3696 and return it. */
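/* For example (hypothetical rtx): given *X == (plus (reg 60)
   (const_int 16)), we return 16 and rewrite *X to (reg 60); given a
   bare (const_int 16), we return 16 and *X becomes const0_rtx.  */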
3698 static HOST_WIDE_INT
3699 remove_constant_addition (x)
3700 rtx *x;
3702 HOST_WIDE_INT addval = 0;
3703 rtx exp = *x;
3705 /* Avoid clobbering a shared CONST expression. */
3706 if (GET_CODE (exp) == CONST)
3708 if (GET_CODE (XEXP (exp, 0)) == PLUS
3709 && GET_CODE (XEXP (XEXP (exp, 0), 0)) == SYMBOL_REF
3710 && GET_CODE (XEXP (XEXP (exp, 0), 1)) == CONST_INT)
3712 *x = XEXP (XEXP (exp, 0), 0);
3713 return INTVAL (XEXP (XEXP (exp, 0), 1));
3715 return 0;
3718 if (GET_CODE (exp) == CONST_INT)
3720 addval = INTVAL (exp);
3721 *x = const0_rtx;
3724   /* For a PLUS expression, recurse on both operands. */
3725 else if (GET_CODE (exp) == PLUS)
3727 addval += remove_constant_addition (&XEXP (exp, 0));
3728 addval += remove_constant_addition (&XEXP (exp, 1));
3730       /* If either operand turned out to be constant, remove the resulting
3731 	 zero from the expression. */
3732 if (XEXP (exp, 0) == const0_rtx)
3733 *x = XEXP (exp, 1);
3734 else if (XEXP (exp, 1) == const0_rtx)
3735 *x = XEXP (exp, 0);
3738 return addval;
3741 /* Attempt to identify accesses to arrays that are most likely to cause cache
3742 misses, and emit prefetch instructions a few prefetch blocks forward.
3744 To detect the arrays we use the GIV information that was collected by the
3745 strength reduction pass.
3747 The prefetch instructions are generated after the GIV information is done
3748 and before the strength reduction process. The new GIVs are injected into
3749 the strength reduction tables, so the prefetch addresses are optimized as
3750 well.
3752 GIVs are split into base address, stride, and constant addition values.
3753 GIVs with the same address, stride and close addition values are combined
3754    into a single prefetch.  Writes to GIVs are also detected, so that
3755    prefetch-for-write instructions can be used for the blocks we write to,
3756    on machines that support write prefetches.
3758 Several heuristics are used to determine when to prefetch. They are
3759 controlled by defined symbols that can be overridden for each target. */
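/* Schematically, each candidate access is modelled as

       address = base_address + iteration * stride + index

   so two GIVs with equal base and stride and nearby index values
   describe the same array walk and can share one prefetch stream.
   (An informal restatement of the decomposition described above.)  */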
3761 static void
3762 emit_prefetch_instructions (loop)
3763 struct loop *loop;
3765 int num_prefetches = 0;
3766 int num_real_prefetches = 0;
3767 int num_real_write_prefetches = 0;
3768 int ahead;
3769 int i;
3770 struct iv_class *bl;
3771 struct induction *iv;
3772 struct prefetch_info info[MAX_PREFETCHES];
3773 struct loop_ivs *ivs = LOOP_IVS (loop);
3775 if (!HAVE_prefetch)
3776 return;
3778   /* Consider only loops without calls.  When a call is made, the loop
3779      is probably slow enough that the memory latency is hidden anyway. */
3780 if (PREFETCH_NO_CALL && LOOP_INFO (loop)->has_call)
3782 if (loop_dump_stream)
3783 fprintf (loop_dump_stream, "Prefetch: ignoring loop - has call.\n");
3785 return;
3788 if (PREFETCH_NO_LOW_LOOPCNT
3789 && LOOP_INFO (loop)->n_iterations
3790 && LOOP_INFO (loop)->n_iterations <= PREFETCH_LOW_LOOPCNT)
3792 if (loop_dump_stream)
3793 fprintf (loop_dump_stream,
3794 "Prefetch: ignoring loop - not enought iterations.\n");
3795 return;
3798 /* Search all induction variables and pick those interesting for the prefetch
3799 machinery. */
3800 for (bl = ivs->list; bl; bl = bl->next)
3802 struct induction *biv = bl->biv, *biv1;
3803 int basestride = 0;
3805 biv1 = biv;
3807 /* Expect all BIVs to be executed in each iteration. This makes our
3808 analysis more conservative. */
3809 while (biv1)
3811 /* Discard non-constant additions that we can't handle well yet, and
3812 BIVs that are executed multiple times; such BIVs ought to be
3813 handled in the nested loop. We accept not_every_iteration BIVs,
3814 since these only result in larger strides and make our
3815 heuristics more conservative.
3816 ??? What does the last sentence mean? */
3817 if (GET_CODE (biv->add_val) != CONST_INT)
3819 if (loop_dump_stream)
3821 fprintf (loop_dump_stream,
3822 "Prefetch: biv %i ignored: non-constant addition at insn %i:",
3823 REGNO (biv->src_reg), INSN_UID (biv->insn));
3824 print_rtl (loop_dump_stream, biv->add_val);
3825 fprintf (loop_dump_stream, "\n");
3827 break;
3830 if (biv->maybe_multiple)
3832 if (loop_dump_stream)
3834 fprintf (loop_dump_stream,
3835 "Prefetch: biv %i ignored: maybe_multiple at insn %i:",
3836 REGNO (biv->src_reg), INSN_UID (biv->insn));
3837 print_rtl (loop_dump_stream, biv->add_val);
3838 fprintf (loop_dump_stream, "\n");
3840 break;
3843 basestride += INTVAL (biv1->add_val);
3844 biv1 = biv1->next_iv;
3847 if (biv1 || !basestride)
3848 continue;
3850 for (iv = bl->giv; iv; iv = iv->next_iv)
3852 rtx address;
3853 rtx temp;
3854 HOST_WIDE_INT index = 0;
3855 int add = 1;
3856 HOST_WIDE_INT stride;
3857 struct check_store_data d;
3858 int size = GET_MODE_SIZE (GET_MODE (iv));
3860 /* There are several reasons why an induction variable is not
3861 interesting to us. */
3862 if (iv->giv_type != DEST_ADDR
3863 /* We are interested only in constant stride memory references
3864 in order to be able to compute density easily. */
3865 || GET_CODE (iv->mult_val) != CONST_INT
3866 /* Don't handle reversed order prefetches, since they are usually
3867 ineffective. Later we may be able to reverse such BIVs. */
3868 || (PREFETCH_NO_REVERSE_ORDER
3869 && (stride = INTVAL (iv->mult_val) * basestride) < 0)
3870 /* Prefetching of accesses with such an extreme stride is probably
3871 not worthwhile, either. */
3872 || (PREFETCH_NO_EXTREME_STRIDE
3873 && stride > PREFETCH_EXTREME_STRIDE)
3874 /* Ignore GIVs with varying add values; we can't predict the
3875 value for the next iteration. */
3876 || !loop_invariant_p (loop, iv->add_val)
3877 /* Ignore GIVs in the nested loops; they ought to have been
3878 handled already. */
3879 || iv->maybe_multiple)
3881 if (loop_dump_stream)
3882 fprintf (loop_dump_stream, "Prefetch: Ignoring giv at %i\n",
3883 INSN_UID (iv->insn));
3884 continue;
3887 /* Determine the pointer to the basic array we are examining. It is
3888 the sum of the BIV's initial value and the GIV's add_val. */
3889 index = 0;
3891 address = copy_rtx (iv->add_val);
3892 temp = copy_rtx (bl->initial_value);
3894 address = simplify_gen_binary (PLUS, Pmode, temp, address);
3895 index = remove_constant_addition (&address);
3897 index += size;
3898 d.mem_write = 0;
3899 d.mem_address = *iv->location;
3901 /* When the GIV is not always executed, we might be better off by
3902 not dirtying the cache pages. */
3903 if (PREFETCH_NOT_ALWAYS || iv->always_executed)
3904 note_stores (PATTERN (iv->insn), check_store, &d);
3906 /* Attempt to find another prefetch to the same array and see if we
3907 can merge this one. */
3908 for (i = 0; i < num_prefetches; i++)
3909 if (rtx_equal_for_prefetch_p (address, info[i].base_address)
3910 && stride == info[i].stride)
3912 	    /* If both access the same array (the same location, differing
3913 	       only by a small constant index), merge the prefetches.  Keep
3914 	       just the later one; the earlier access will have been
3915 	       prefetched by the previous iteration.
3916 	       4096 is an artificial threshold.  It should not be too small,
3917 	       but also no bigger than the small portion of memory usually
3918 	       traversed by a single loop. */
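	    /* For example, accesses a[i] and a[i+2] within one iteration
	       share base and stride and differ only by a small constant
	       index, so a single prefetch ahead of the later one covers
	       both.  (Illustrative source-level example.)  */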
3919 if (index >= info[i].index && index - info[i].index < 4096)
3921 info[i].write |= d.mem_write;
3922 		info[i].bytes_accessed += size;
3923 info[i].index = index;
3924 info[i].giv = iv;
3925 info[i].class = bl;
3926 		info[i].base_address = address;
3927 add = 0;
3928 break;
3931 if (index < info[i].index && info[i].index - index < 4096)
3933 info[i].write |= d.mem_write;
3934 		info[i].bytes_accessed += size;
3935 add = 0;
3936 break;
3940 /* Merging failed. */
3941 if (add)
3943 info[num_prefetches].giv = iv;
3944 info[num_prefetches].class = bl;
3945 info[num_prefetches].index = index;
3946 info[num_prefetches].stride = stride;
3947 info[num_prefetches].base_address = address;
3948 info[num_prefetches].write = d.mem_write;
3949 	    info[num_prefetches].bytes_accessed = size;
3950 num_prefetches++;
3951 if (num_prefetches >= MAX_PREFETCHES)
3953 if (loop_dump_stream)
3954 fprintf (loop_dump_stream,
3955 "Maximal number of prefetches exceeded.\n");
3956 return;
3962 for (i = 0; i < num_prefetches; i++)
3964 /* Attempt to calculate the number of bytes fetched by the loop.
3965 Avoid overflow. */
3966 if (LOOP_INFO (loop)->n_iterations
3967 && ((unsigned HOST_WIDE_INT) (0xffffffff / info[i].stride)
3968 >= LOOP_INFO (loop)->n_iterations))
3969 info[i].total_bytes = info[i].stride * LOOP_INFO (loop)->n_iterations;
3970 else
3971 info[i].total_bytes = 0xffffffff;
3973 /* Prefetch is worthwhile only when the loads/stores are dense. */
3974 if (PREFETCH_ONLY_DENSE_MEM
3975 && info[i].bytes_accesed * 256 / info[i].stride > PREFETCH_DENSE_MEM
3976 && (info[i].total_bytes / PREFETCH_BLOCK
3977 >= PREFETCH_BLOCKS_BEFORE_LOOP_MIN))
3979 info[i].prefetch_before_loop = 1;
3980 info[i].prefetch_in_loop
3981 = (info[i].total_bytes / PREFETCH_BLOCK
3982 > PREFETCH_BLOCKS_BEFORE_LOOP_MAX);
3984 else
3985 info[i].prefetch_in_loop = 0, info[i].prefetch_before_loop = 0;
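      /* The density test above is scaled by 256: e.g. accessing 8 bytes
	 per iteration with a 32-byte stride scores 8 * 256 / 32 == 64,
	 i.e. one quarter of each prefetch block is actually used.  The
	 PREFETCH_DENSE_MEM threshold is target-overridable, so the
	 arithmetic here is only an illustration.  */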
3987 if (info[i].prefetch_in_loop)
3989 num_real_prefetches += ((info[i].stride + PREFETCH_BLOCK - 1)
3990 / PREFETCH_BLOCK);
3991 if (info[i].write)
3992 num_real_write_prefetches
3993 += (info[i].stride + PREFETCH_BLOCK - 1) / PREFETCH_BLOCK;
3997 if (loop_dump_stream)
3999 for (i = 0; i < num_prefetches; i++)
4001 fprintf (loop_dump_stream, "Prefetch insn %i address: ",
4002 INSN_UID (info[i].giv->insn));
4003 print_rtl (loop_dump_stream, info[i].base_address);
4004 fprintf (loop_dump_stream, " Index: ");
4005 fprintf (loop_dump_stream, HOST_WIDE_INT_PRINT_DEC, info[i].index);
4006 fprintf (loop_dump_stream, " stride: ");
4007 fprintf (loop_dump_stream, HOST_WIDE_INT_PRINT_DEC, info[i].stride);
4008 fprintf (loop_dump_stream,
4009 " density: %i%% total_bytes: %u%sin loop: %s before: %s\n",
4010 		   (int) (info[i].bytes_accessed * 100 / info[i].stride),
4011 info[i].total_bytes,
4012 info[i].write ? " read/write " : " read only ",
4013 info[i].prefetch_in_loop ? "yes" : "no",
4014 info[i].prefetch_before_loop ? "yes" : "no");
4017 fprintf (loop_dump_stream, "Real prefetches needed: %i (write: %i)\n",
4018 num_real_prefetches, num_real_write_prefetches);
4021 if (!num_real_prefetches)
4022 return;
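  /* Split the target's simultaneous-prefetch capacity among the streams:
     e.g. with SIMULTANEOUS_PREFETCHES == 3 and two real prefetch streams,
     each stream runs one block ahead.  With more streams than slots,
     AHEAD becomes zero and we give up rather than thrash the prefetch
     queue.  (Illustrative numbers.)  */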
4024 ahead = SIMULTANEOUS_PREFETCHES / num_real_prefetches;
4026 if (!ahead)
4027 return;
4029 for (i = 0; i < num_prefetches; i++)
4031 if (info[i].prefetch_in_loop)
4033 int y;
4035 for (y = 0; y < ((info[i].stride + PREFETCH_BLOCK - 1)
4036 / PREFETCH_BLOCK); y++)
4038 rtx loc = copy_rtx (*info[i].giv->location);
4039 rtx insn;
4040 int bytes_ahead = PREFETCH_BLOCK * (ahead + y);
4041 rtx before_insn = info[i].giv->insn;
4042 rtx prev_insn = PREV_INSN (info[i].giv->insn);
4044 /* We can save some effort by offsetting the address on
4045 architectures with offsettable memory references. */
4046 if (offsettable_address_p (0, VOIDmode, loc))
4047 loc = plus_constant (loc, bytes_ahead);
4048 else
4050 rtx reg = gen_reg_rtx (Pmode);
4051 loop_iv_add_mult_emit_before (loop, loc, const1_rtx,
4052 GEN_INT (bytes_ahead), reg,
4053 0, before_insn);
4054 loc = reg;
4057 /* Make sure the address operand is valid for prefetch. */
4058 if (! (*insn_data[(int)CODE_FOR_prefetch].operand[0].predicate)
4059 (loc,
4060 insn_data[(int)CODE_FOR_prefetch].operand[0].mode))
4061 loc = force_reg (Pmode, loc);
4062 emit_insn_before (gen_prefetch (loc, GEN_INT (info[i].write),
4063 GEN_INT (3)),
4064 before_insn);
4066 /* Check all insns emitted and record the new GIV
4067 information. */
4068 insn = NEXT_INSN (prev_insn);
4069 while (insn != before_insn)
4071 insn = check_insn_for_givs (loop, insn,
4072 info[i].giv->always_executed,
4073 info[i].giv->maybe_multiple);
4074 insn = NEXT_INSN (insn);
4079 if (info[i].prefetch_before_loop)
4081 int y;
4083 /* Emit INSNs before the loop to fetch the first cache lines. */
4084 for (y = 0;
4085 (!info[i].prefetch_in_loop || y < ahead)
4086 && y * PREFETCH_BLOCK < (int) info[i].total_bytes; y ++)
4088 rtx reg = gen_reg_rtx (Pmode);
4089 rtx loop_start = loop->start;
4090 rtx add_val = simplify_gen_binary (PLUS, Pmode,
4091 info[i].giv->add_val,
4092 GEN_INT (y * PREFETCH_BLOCK));
4094 loop_iv_add_mult_emit_before (loop, info[i].class->initial_value,
4095 info[i].giv->mult_val,
4096 add_val, reg, 0, loop_start);
4097 emit_insn_before (gen_prefetch (reg, GEN_INT (info[i].write),
4098 GEN_INT (3)),
4099 loop_start);
4104 return;
4107 /* A "basic induction variable" or biv is a pseudo reg that is set
4108 (within this loop) only by incrementing or decrementing it. */
4109 /* A "general induction variable" or giv is a pseudo reg whose
4110 value is a linear function of a biv. */
4112 /* Bivs are recognized by `basic_induction_var';
4113 Givs by `general_induction_var'. */
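/* For example, in

       for (i = 0; i < n; i++)
	 a[i] = 0;

   the register holding I is a biv, being incremented by a constant each
   iteration, while the address computation A + 4*I is a giv, being a
   linear function of that biv.  (Illustrative; assumes 4-byte array
   elements.)  */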
4115 /* Communication with routines called via `note_stores'. */
4117 static rtx note_insn;
4119 /* Dummy register to have non-zero DEST_REG for DEST_ADDR type givs. */
4121 static rtx addr_placeholder;
4123 /* ??? Unfinished optimizations, and possible future optimizations,
4124 for the strength reduction code. */
4126 /* ??? The interaction of biv elimination, and recognition of 'constant'
4127 bivs, may cause problems. */
4129 /* ??? Add heuristics so that DEST_ADDR strength reduction does not cause
4130 performance problems.
4132 Perhaps don't eliminate things that can be combined with an addressing
4133 mode. Find all givs that have the same biv, mult_val, and add_val;
4134 then for each giv, check to see if its only use dies in a following
4135 memory address. If so, generate a new memory address and check to see
4136 if it is valid. If it is valid, then store the modified memory address,
4137 otherwise, mark the giv as not done so that it will get its own iv. */
4139 /* ??? Could try to optimize branches when it is known that a biv is always
4140 positive. */
4142 /* ??? When replacing a biv in a compare insn, we should replace it with
4143    the closest giv so that an optimized branch can still be recognized
4144    by the combiner, e.g. the VAX acb insn. */
4146 /* ??? Many of the checks involving uid_luid could be simplified if regscan
4147 was rerun in loop_optimize whenever a register was added or moved.
4148 Also, some of the optimizations could be a little less conservative. */
4150 /* Scan the loop body and call FNCALL for each insn.  In addition to the
4151    LOOP and INSN parameters, pass MAYBE_MULTIPLE and NOT_EVERY_ITERATION
4152    to the callback.
4154    NOT_EVERY_ITERATION is 1 if the current insn is not executed at least
4155    once for every loop iteration except for the last one.
4157    MAYBE_MULTIPLE is 1 if the current insn may be executed more than once
4158    for every loop iteration. */
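/* A minimal callback sketch, assuming the loop_insn_callback type
   declared in loop.h (the callback returns the last insn it processed,
   as the real callbacks below do):

       static rtx
       my_callback (loop, insn, not_every_iteration, maybe_multiple)
	    struct loop *loop;
	    rtx insn;
	    int not_every_iteration;
	    int maybe_multiple;
       {
	 ...
	 return insn;
       }

       for_each_insn_in_loop (loop, my_callback);

   my_callback is hypothetical; check_insn_for_bivs below is a real
   instance.  */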
4160 void
4161 for_each_insn_in_loop (loop, fncall)
4162 struct loop *loop;
4163 loop_insn_callback fncall;
4165 /* This is 1 if current insn is not executed at least once for every loop
4166 iteration. */
4167 int not_every_iteration = 0;
4168 int maybe_multiple = 0;
4169 int past_loop_latch = 0;
4170 int loop_depth = 0;
4171 rtx p;
4173 /* If loop_scan_start points to the loop exit test, we have to be wary of
4174 subversive use of gotos inside expression statements. */
4175 if (prev_nonnote_insn (loop->scan_start) != prev_nonnote_insn (loop->start))
4176 maybe_multiple = back_branch_in_range_p (loop, loop->scan_start);
4178   /* Scan through the loop, invoking FNCALL on each insn. */
4180 for (p = next_insn_in_loop (loop, loop->scan_start);
4181 p != NULL_RTX;
4182 p = next_insn_in_loop (loop, p))
4184 p = fncall (loop, p, not_every_iteration, maybe_multiple);
4186 /* Past CODE_LABEL, we get to insns that may be executed multiple
4187 times. The only way we can be sure that they can't is if every
4188 jump insn between here and the end of the loop either
4189 returns, exits the loop, is a jump to a location that is still
4190 behind the label, or is a jump to the loop start. */
4192 if (GET_CODE (p) == CODE_LABEL)
4194 rtx insn = p;
4196 maybe_multiple = 0;
4198 while (1)
4200 insn = NEXT_INSN (insn);
4201 if (insn == loop->scan_start)
4202 break;
4203 if (insn == loop->end)
4205 if (loop->top != 0)
4206 insn = loop->top;
4207 else
4208 break;
4209 if (insn == loop->scan_start)
4210 break;
4213 if (GET_CODE (insn) == JUMP_INSN
4214 && GET_CODE (PATTERN (insn)) != RETURN
4215 && (!any_condjump_p (insn)
4216 || (JUMP_LABEL (insn) != 0
4217 && JUMP_LABEL (insn) != loop->scan_start
4218 && !loop_insn_first_p (p, JUMP_LABEL (insn)))))
4220 maybe_multiple = 1;
4221 break;
4226 /* Past a jump, we get to insns for which we can't count
4227 on whether they will be executed during each iteration. */
4228 /* This code appears twice in strength_reduce. There is also similar
4229 code in scan_loop. */
4230 if (GET_CODE (p) == JUMP_INSN
4231 /* If we enter the loop in the middle, and scan around to the
4232 beginning, don't set not_every_iteration for that.
4233 This can be any kind of jump, since we want to know if insns
4234 will be executed if the loop is executed. */
4235 && !(JUMP_LABEL (p) == loop->top
4236 && ((NEXT_INSN (NEXT_INSN (p)) == loop->end
4237 && any_uncondjump_p (p))
4238 || (NEXT_INSN (p) == loop->end && any_condjump_p (p)))))
4240 rtx label = 0;
4242 /* If this is a jump outside the loop, then it also doesn't
4243 matter. Check to see if the target of this branch is on the
4244 loop->exits_labels list. */
4246 for (label = loop->exit_labels; label; label = LABEL_NEXTREF (label))
4247 if (XEXP (label, 0) == JUMP_LABEL (p))
4248 break;
4250 if (!label)
4251 not_every_iteration = 1;
4254 else if (GET_CODE (p) == NOTE)
4256 /* At the virtual top of a converted loop, insns are again known to
4257 be executed each iteration: logically, the loop begins here
4258 even though the exit code has been duplicated.
4260 Insns are also again known to be executed each iteration at
4261 the LOOP_CONT note. */
4262 if ((NOTE_LINE_NUMBER (p) == NOTE_INSN_LOOP_VTOP
4263 || NOTE_LINE_NUMBER (p) == NOTE_INSN_LOOP_CONT)
4264 && loop_depth == 0)
4265 not_every_iteration = 0;
4266 else if (NOTE_LINE_NUMBER (p) == NOTE_INSN_LOOP_BEG)
4267 loop_depth++;
4268 else if (NOTE_LINE_NUMBER (p) == NOTE_INSN_LOOP_END)
4269 loop_depth--;
4272       /* Note if we pass a loop latch.  If we do, then we cannot clear
4273 NOT_EVERY_ITERATION below when we pass the last CODE_LABEL in
4274 a loop since a jump before the last CODE_LABEL may have started
4275 a new loop iteration.
4277 Note that LOOP_TOP is only set for rotated loops and we need
4278 this check for all loops, so compare against the CODE_LABEL
4279 which immediately follows LOOP_START. */
4280 if (GET_CODE (p) == JUMP_INSN
4281 && JUMP_LABEL (p) == NEXT_INSN (loop->start))
4282 past_loop_latch = 1;
4284 /* Unlike in the code motion pass where MAYBE_NEVER indicates that
4285 an insn may never be executed, NOT_EVERY_ITERATION indicates whether
4286 or not an insn is known to be executed each iteration of the
4287 loop, whether or not any iterations are known to occur.
4289 Therefore, if we have just passed a label and have no more labels
4290 between here and the test insn of the loop, and we have not passed
4291 a jump to the top of the loop, then we know these insns will be
4292 executed each iteration. */
4294 if (not_every_iteration
4295 && !past_loop_latch
4296 && GET_CODE (p) == CODE_LABEL
4297 && no_labels_between_p (p, loop->end)
4298 && loop_insn_first_p (p, loop->cont))
4299 not_every_iteration = 0;
4303 static void
4304 loop_bivs_find (loop)
4305 struct loop *loop;
4307 struct loop_regs *regs = LOOP_REGS (loop);
4308 struct loop_ivs *ivs = LOOP_IVS (loop);
4309 /* Temporary list pointers for traversing ivs->list. */
4310 struct iv_class *bl, **backbl;
4312 ivs->list = 0;
4314 for_each_insn_in_loop (loop, check_insn_for_bivs);
4316 /* Scan ivs->list to remove all regs that proved not to be bivs.
4317 Make a sanity check against regs->n_times_set. */
4318 for (backbl = &ivs->list, bl = *backbl; bl; bl = bl->next)
4320 if (REG_IV_TYPE (ivs, bl->regno) != BASIC_INDUCT
4321 /* Above happens if register modified by subreg, etc. */
4322 /* Make sure it is not recognized as a basic induction var: */
4323 || regs->array[bl->regno].n_times_set != bl->biv_count
4324 /* If never incremented, it is invariant that we decided not to
4325 move. So leave it alone. */
4326 || ! bl->incremented)
4328 if (loop_dump_stream)
4329 fprintf (loop_dump_stream, "Biv %d: discarded, %s\n",
4330 bl->regno,
4331 (REG_IV_TYPE (ivs, bl->regno) != BASIC_INDUCT
4332 ? "not induction variable"
4333 : (! bl->incremented ? "never incremented"
4334 : "count error")));
4336 REG_IV_TYPE (ivs, bl->regno) = NOT_BASIC_INDUCT;
4337 *backbl = bl->next;
4339 else
4341 backbl = &bl->next;
4343 if (loop_dump_stream)
4344 fprintf (loop_dump_stream, "Biv %d: verified\n", bl->regno);
4350 /* Determine how BIVs are initialized by looking through the
4351    pre-header's extended basic block. */
4352 static void
4353 loop_bivs_init_find (loop)
4354 struct loop *loop;
4356 struct loop_ivs *ivs = LOOP_IVS (loop);
4357 /* Temporary list pointers for traversing ivs->list. */
4358 struct iv_class *bl;
4359 int call_seen;
4360 rtx p;
4362 /* Find initial value for each biv by searching backwards from loop_start,
4363 halting at first label. Also record any test condition. */
4365 call_seen = 0;
4366 for (p = loop->start; p && GET_CODE (p) != CODE_LABEL; p = PREV_INSN (p))
4368 rtx test;
4370 note_insn = p;
4372 if (GET_CODE (p) == CALL_INSN)
4373 call_seen = 1;
4375 if (INSN_P (p))
4376 note_stores (PATTERN (p), record_initial, ivs);
4378 /* Record any test of a biv that branches around the loop if no store
4379 between it and the start of loop. We only care about tests with
4380 constants and registers and only certain of those. */
4381 if (GET_CODE (p) == JUMP_INSN
4382 && JUMP_LABEL (p) != 0
4383 && next_real_insn (JUMP_LABEL (p)) == next_real_insn (loop->end)
4384 && (test = get_condition_for_loop (loop, p)) != 0
4385 && GET_CODE (XEXP (test, 0)) == REG
4386 && REGNO (XEXP (test, 0)) < max_reg_before_loop
4387 && (bl = REG_IV_CLASS (ivs, REGNO (XEXP (test, 0)))) != 0
4388 && valid_initial_value_p (XEXP (test, 1), p, call_seen, loop->start)
4389 && bl->init_insn == 0)
4391 /* If an NE test, we have an initial value! */
4392 if (GET_CODE (test) == NE)
4394 bl->init_insn = p;
4395 bl->init_set = gen_rtx_SET (VOIDmode,
4396 XEXP (test, 0), XEXP (test, 1));
4398 else
4399 bl->initial_test = test;
4405 /* Look at each biv and see if we can say anything better about its
4406 initial value from any initializing insns set up above. (This is done
4407 in two passes to avoid missing SETs in a PARALLEL.) */
4408 static void
4409 loop_bivs_check (loop)
4410 struct loop *loop;
4412 struct loop_ivs *ivs = LOOP_IVS (loop);
4413 /* Temporary list pointers for traversing ivs->list. */
4414 struct iv_class *bl;
4415 struct iv_class **backbl;
4417 for (backbl = &ivs->list; (bl = *backbl); backbl = &bl->next)
4419 rtx src;
4420 rtx note;
4422 if (! bl->init_insn)
4423 continue;
4425 /* IF INIT_INSN has a REG_EQUAL or REG_EQUIV note and the value
4426 is a constant, use the value of that. */
4427 if (((note = find_reg_note (bl->init_insn, REG_EQUAL, 0)) != NULL
4428 && CONSTANT_P (XEXP (note, 0)))
4429 || ((note = find_reg_note (bl->init_insn, REG_EQUIV, 0)) != NULL
4430 && CONSTANT_P (XEXP (note, 0))))
4431 src = XEXP (note, 0);
4432 else
4433 src = SET_SRC (bl->init_set);
4435 if (loop_dump_stream)
4436 fprintf (loop_dump_stream,
4437 "Biv %d: initialized at insn %d: initial value ",
4438 bl->regno, INSN_UID (bl->init_insn));
4440 if ((GET_MODE (src) == GET_MODE (regno_reg_rtx[bl->regno])
4441 || GET_MODE (src) == VOIDmode)
4442 && valid_initial_value_p (src, bl->init_insn,
4443 LOOP_INFO (loop)->pre_header_has_call,
4444 loop->start))
4446 bl->initial_value = src;
4448 if (loop_dump_stream)
4450 print_simple_rtl (loop_dump_stream, src);
4451 fputc ('\n', loop_dump_stream);
4454 /* If we can't make it a giv,
4455 let biv keep initial value of "itself". */
4456 else if (loop_dump_stream)
4457 fprintf (loop_dump_stream, "is complex\n");
4462 /* Search the loop for general induction variables. */
4464 static void
4465 loop_givs_find (loop)
4466      struct loop *loop;
4468 for_each_insn_in_loop (loop, check_insn_for_givs);
4472 /* For each giv for which we still don't know whether or not it is
4473 replaceable, check to see if it is replaceable because its final value
4474 can be calculated. */
4476 static void
4477 loop_givs_check (loop)
4478 struct loop *loop;
4480 struct loop_ivs *ivs = LOOP_IVS (loop);
4481 struct iv_class *bl;
4483 for (bl = ivs->list; bl; bl = bl->next)
4485 struct induction *v;
4487 for (v = bl->giv; v; v = v->next_iv)
4488 if (! v->replaceable && ! v->not_replaceable)
4489 check_final_value (loop, v);
4494 /* Return non-zero if it is possible to eliminate the biv BL provided
4495 all givs are reduced. This is possible if either the reg is not
4496 used outside the loop, or we can compute what its final value will
4497 be. */
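/* For instance, if a loop's only remaining use of biv I is the exit
   test I < N, and a giv P == BASE + 4*I has been reduced, the test can
   be rewritten in terms of the giv as P < BASE + 4*N and the biv
   dropped entirely.  (Source-level illustration of the transformation
   attempted by maybe_eliminate_biv.)  */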
4499 static int
4500 loop_biv_eliminable_p (loop, bl, threshold, insn_count)
4501 struct loop *loop;
4502 struct iv_class *bl;
4503 int threshold;
4504 int insn_count;
4506 /* For architectures with a decrement_and_branch_until_zero insn,
4507 don't do this if we put a REG_NONNEG note on the endtest for this
4508 biv. */
4510 #ifdef HAVE_decrement_and_branch_until_zero
4511 if (bl->nonneg)
4513 if (loop_dump_stream)
4514 fprintf (loop_dump_stream,
4515 "Cannot eliminate nonneg biv %d.\n", bl->regno);
4516 return 0;
4518 #endif
4520 /* Check that biv is used outside loop or if it has a final value.
4521 Compare against bl->init_insn rather than loop->start. We aren't
4522 concerned with any uses of the biv between init_insn and
4523 loop->start since these won't be affected by the value of the biv
4524 elsewhere in the function, so long as init_insn doesn't use the
4525 biv itself. */
4527 if ((REGNO_LAST_LUID (bl->regno) < INSN_LUID (loop->end)
4528 && bl->init_insn
4529 && INSN_UID (bl->init_insn) < max_uid_for_loop
4530 && REGNO_FIRST_LUID (bl->regno) >= INSN_LUID (bl->init_insn)
4531 && ! reg_mentioned_p (bl->biv->dest_reg, SET_SRC (bl->init_set)))
4532 || (bl->final_value = final_biv_value (loop, bl)))
4533 return maybe_eliminate_biv (loop, bl, 0, threshold, insn_count);
4535 if (loop_dump_stream)
4537 fprintf (loop_dump_stream,
4538 "Cannot eliminate biv %d.\n",
4539 bl->regno);
4540 fprintf (loop_dump_stream,
4541 "First use: insn %d, last use: insn %d.\n",
4542 REGNO_FIRST_UID (bl->regno),
4543 REGNO_LAST_UID (bl->regno));
4545 return 0;
4549 /* Reduce each giv of BL that we have decided to reduce. */
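/* Reduction gives each such giv its own register that is stepped in
   place of recomputing the linear function: e.g. a giv BASE + 4*I gets
   a new register initialized to BASE before the loop (for I starting
   at 0) and incremented by 4 wherever the biv I is incremented by 1.
   (Illustrative strides.)  */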
4551 static void
4552 loop_givs_reduce (loop, bl)
4553 struct loop *loop;
4554 struct iv_class *bl;
4556 struct induction *v;
4558 for (v = bl->giv; v; v = v->next_iv)
4560 struct induction *tv;
4561 if (! v->ignore && v->same == 0)
4563 int auto_inc_opt = 0;
4565 /* If the code for derived givs immediately below has already
4566 allocated a new_reg, we must keep it. */
4567 if (! v->new_reg)
4568 v->new_reg = gen_reg_rtx (v->mode);
4570 #ifdef AUTO_INC_DEC
4571 /* If the target has auto-increment addressing modes, and
4572 this is an address giv, then try to put the increment
4573 immediately after its use, so that flow can create an
4574 auto-increment addressing mode. */
4575 if (v->giv_type == DEST_ADDR && bl->biv_count == 1
4576 && bl->biv->always_executed && ! bl->biv->maybe_multiple
4577 /* We don't handle reversed biv's because bl->biv->insn
4578 does not have a valid INSN_LUID. */
4579 && ! bl->reversed
4580 && v->always_executed && ! v->maybe_multiple
4581 && INSN_UID (v->insn) < max_uid_for_loop)
4583 /* If other giv's have been combined with this one, then
4584 this will work only if all uses of the other giv's occur
4585 before this giv's insn. This is difficult to check.
4587 We simplify this by looking for the common case where
4588 there is one DEST_REG giv, and this giv's insn is the
4589 last use of the dest_reg of that DEST_REG giv. If the
4590 increment occurs after the address giv, then we can
4591 perform the optimization. (Otherwise, the increment
4592 would have to go before other_giv, and we would not be
4593 able to combine it with the address giv to get an
4594 auto-inc address.) */
4595 if (v->combined_with)
4597 struct induction *other_giv = 0;
4599 for (tv = bl->giv; tv; tv = tv->next_iv)
4600 if (tv->same == v)
4602 if (other_giv)
4603 break;
4604 else
4605 other_giv = tv;
4607 if (! tv && other_giv
4608 && REGNO (other_giv->dest_reg) < max_reg_before_loop
4609 && (REGNO_LAST_UID (REGNO (other_giv->dest_reg))
4610 == INSN_UID (v->insn))
4611 && INSN_LUID (v->insn) < INSN_LUID (bl->biv->insn))
4612 auto_inc_opt = 1;
4614 /* Check for case where increment is before the address
4615 giv. Do this test in "loop order". */
4616 else if ((INSN_LUID (v->insn) > INSN_LUID (bl->biv->insn)
4617 && (INSN_LUID (v->insn) < INSN_LUID (loop->scan_start)
4618 || (INSN_LUID (bl->biv->insn)
4619 > INSN_LUID (loop->scan_start))))
4620 || (INSN_LUID (v->insn) < INSN_LUID (loop->scan_start)
4621 && (INSN_LUID (loop->scan_start)
4622 < INSN_LUID (bl->biv->insn))))
4623 auto_inc_opt = -1;
4624 else
4625 auto_inc_opt = 1;
4627 #ifdef HAVE_cc0
4629 rtx prev;
4631 /* We can't put an insn immediately after one setting
4632 cc0, or immediately before one using cc0. */
4633 if ((auto_inc_opt == 1 && sets_cc0_p (PATTERN (v->insn)))
4634 || (auto_inc_opt == -1
4635 && (prev = prev_nonnote_insn (v->insn)) != 0
4636 && INSN_P (prev)
4637 && sets_cc0_p (PATTERN (prev))))
4638 auto_inc_opt = 0;
4640 #endif
4642 if (auto_inc_opt)
4643 v->auto_inc_opt = 1;
4645 #endif
4647 /* For each place where the biv is incremented, add an insn
4648 to increment the new, reduced reg for the giv. */
4649 for (tv = bl->biv; tv; tv = tv->next_iv)
4651 rtx insert_before;
4653 if (! auto_inc_opt)
4654 insert_before = tv->insn;
4655 else if (auto_inc_opt == 1)
4656 insert_before = NEXT_INSN (v->insn);
4657 else
4658 insert_before = v->insn;
4660 if (tv->mult_val == const1_rtx)
4661 loop_iv_add_mult_emit_before (loop, tv->add_val, v->mult_val,
4662 v->new_reg, v->new_reg,
4663 0, insert_before);
4664 else /* tv->mult_val == const0_rtx */
4665 /* A multiply is acceptable here
4666 since this is presumed to be seldom executed. */
4667 loop_iv_add_mult_emit_before (loop, tv->add_val, v->mult_val,
4668 v->add_val, v->new_reg,
4669 0, insert_before);
4672 /* Add code at loop start to initialize giv's reduced reg. */
4674 loop_iv_add_mult_hoist (loop,
4675 extend_value_for_giv (v, bl->initial_value),
4676 v->mult_val, v->add_val, v->new_reg);
4682 /* Check for givs whose first use is their definition and whose
4683 last use is the definition of another giv. If so, it is likely
4684 dead and should not be used to derive another giv nor to
4685 eliminate a biv. */
4687 static void
4688 loop_givs_dead_check (loop, bl)
4689 struct loop *loop ATTRIBUTE_UNUSED;
4690 struct iv_class *bl;
4692 struct induction *v;
4694 for (v = bl->giv; v; v = v->next_iv)
4696 if (v->ignore
4697 || (v->same && v->same->ignore))
4698 continue;
4700 if (v->giv_type == DEST_REG
4701 && REGNO_FIRST_UID (REGNO (v->dest_reg)) == INSN_UID (v->insn))
4703 struct induction *v1;
4705 for (v1 = bl->giv; v1; v1 = v1->next_iv)
4706 if (REGNO_LAST_UID (REGNO (v->dest_reg)) == INSN_UID (v1->insn))
4707 v->maybe_dead = 1;
4713 static void
4714 loop_givs_rescan (loop, bl, reg_map)
4715 struct loop *loop;
4716 struct iv_class *bl;
4717 rtx *reg_map;
4719 struct induction *v;
4721 for (v = bl->giv; v; v = v->next_iv)
4723 if (v->same && v->same->ignore)
4724 v->ignore = 1;
4726 if (v->ignore)
4727 continue;
4729 /* Update expression if this was combined, in case other giv was
4730 replaced. */
4731 if (v->same)
4732 v->new_reg = replace_rtx (v->new_reg,
4733 v->same->dest_reg, v->same->new_reg);
4735 /* See if this register is known to be a pointer to something. If
4736 so, see if we can find the alignment. First see if there is a
4737 destination register that is a pointer. If so, this shares the
4738 alignment too. Next see if we can deduce anything from the
4739 computational information. If not, and this is a DEST_ADDR
4740 giv, at least we know that it's a pointer, though we don't know
4741 the alignment. */
4742 if (GET_CODE (v->new_reg) == REG
4743 && v->giv_type == DEST_REG
4744 && REG_POINTER (v->dest_reg))
4745 mark_reg_pointer (v->new_reg,
4746 REGNO_POINTER_ALIGN (REGNO (v->dest_reg)));
4747 else if (GET_CODE (v->new_reg) == REG
4748 && REG_POINTER (v->src_reg))
4750 unsigned int align = REGNO_POINTER_ALIGN (REGNO (v->src_reg));
4752 if (align == 0
4753 || GET_CODE (v->add_val) != CONST_INT
4754 || INTVAL (v->add_val) % (align / BITS_PER_UNIT) != 0)
4755 align = 0;
4757 mark_reg_pointer (v->new_reg, align);
4759 else if (GET_CODE (v->new_reg) == REG
4760 && GET_CODE (v->add_val) == REG
4761 && REG_POINTER (v->add_val))
4763 unsigned int align = REGNO_POINTER_ALIGN (REGNO (v->add_val));
4765 if (align == 0 || GET_CODE (v->mult_val) != CONST_INT
4766 || INTVAL (v->mult_val) % (align / BITS_PER_UNIT) != 0)
4767 align = 0;
4769 mark_reg_pointer (v->new_reg, align);
4771 else if (GET_CODE (v->new_reg) == REG && v->giv_type == DEST_ADDR)
4772 mark_reg_pointer (v->new_reg, 0);
4774 if (v->giv_type == DEST_ADDR)
4775 /* Store reduced reg as the address in the memref where we found
4776 this giv. */
4777 validate_change (v->insn, v->location, v->new_reg, 0);
4778 else if (v->replaceable)
4780 reg_map[REGNO (v->dest_reg)] = v->new_reg;
4782 else
4784 /* Not replaceable; emit an insn to set the original giv reg from
4785 the reduced giv, same as above. */
4786 loop_insn_emit_after (loop, 0, v->insn,
4787 gen_move_insn (v->dest_reg, v->new_reg));
4790 /* When a loop is reversed, givs which depend on the reversed
4791 biv, and which are live outside the loop, must be set to their
4792 correct final value. This insn is only needed if the giv is
4793 not replaceable. The correct final value is the same as the
4794 value that the giv starts the reversed loop with. */
4795 if (bl->reversed && ! v->replaceable)
4796 loop_iv_add_mult_sink (loop,
4797 extend_value_for_giv (v, bl->initial_value),
4798 v->mult_val, v->add_val, v->dest_reg);
4799 else if (v->final_value)
4800 loop_insn_sink_or_swim (loop,
4801 gen_move_insn (v->dest_reg, v->final_value));
4803 if (loop_dump_stream)
4805 fprintf (loop_dump_stream, "giv at %d reduced to ",
4806 INSN_UID (v->insn));
4807 print_simple_rtl (loop_dump_stream, v->new_reg);
4808 fprintf (loop_dump_stream, "\n");
4814 static int
4815 loop_giv_reduce_benefit (loop, bl, v, test_reg)
4816 struct loop *loop ATTRIBUTE_UNUSED;
4817 struct iv_class *bl;
4818 struct induction *v;
4819 rtx test_reg;
4821 int add_cost;
4822 int benefit;
4824 benefit = v->benefit;
4825 PUT_MODE (test_reg, v->mode);
4826 add_cost = iv_add_mult_cost (bl->biv->add_val, v->mult_val,
4827 test_reg, test_reg);
4829 /* Reduce benefit if not replaceable, since we will insert a
4830 move-insn to replace the insn that calculates this giv. Don't do
4831 this unless the giv is a user variable, since it will often be
4832 marked non-replaceable because of the duplication of the exit
4833 code outside the loop. In such a case, the copies we insert are
4834 dead and will be deleted. So they don't have a cost. Similar
4835 situations exist. */
4836 /* ??? The new final_[bg]iv_value code does a much better job of
4837 finding replaceable giv's, and hence this code may no longer be
4838 necessary. */
4839 if (! v->replaceable && ! bl->eliminable
4840 && REG_USERVAR_P (v->dest_reg))
4841 benefit -= copy_cost;
4843 /* Decrease the benefit to count the add-insns that we will insert
4844 to increment the reduced reg for the giv. ??? This can
4845 overestimate the run-time cost of the additional insns, e.g. if
4846 there are multiple basic blocks that increment the biv, but only
4847 one of these blocks is executed during each iteration. There is
4848 no good way to detect cases like this with the current structure
4849 of the loop optimizer. This code is more accurate for
4850 determining code size than run-time benefits. */
4851 benefit -= add_cost * bl->biv_count;
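  /* E.g. a biv incremented at two sites (biv_count == 2) with an
     add-insn cost of 4 lowers the estimated benefit by 8.
     (Illustrative costs.)  */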
4853 /* Decide whether to strength-reduce this giv or to leave the code
4854 unchanged (recompute it from the biv each time it is used). This
4855 decision can be made independently for each giv. */
4857 #ifdef AUTO_INC_DEC
4858 /* Attempt to guess whether autoincrement will handle some of the
4859 new add insns; if so, increase BENEFIT (undo the subtraction of
4860 add_cost that was done above). */
4861 if (v->giv_type == DEST_ADDR
4862 /* Increasing the benefit is risky, since this is only a guess.
4863 Avoid increasing register pressure in cases where there would
4864 be no other benefit from reducing this giv. */
4865 && benefit > 0
4866 && GET_CODE (v->mult_val) == CONST_INT)
4868 int size = GET_MODE_SIZE (GET_MODE (v->mem));
4870 if (HAVE_POST_INCREMENT
4871 && INTVAL (v->mult_val) == size)
4872 benefit += add_cost * bl->biv_count;
4873 else if (HAVE_PRE_INCREMENT
4874 && INTVAL (v->mult_val) == size)
4875 benefit += add_cost * bl->biv_count;
4876 else if (HAVE_POST_DECREMENT
4877 && -INTVAL (v->mult_val) == size)
4878 benefit += add_cost * bl->biv_count;
4879 else if (HAVE_PRE_DECREMENT
4880 && -INTVAL (v->mult_val) == size)
4881 benefit += add_cost * bl->biv_count;
4883 #endif
4885 return benefit;
4889 /* Free IV structures for LOOP. */
4891 static void
4892 loop_ivs_free (loop)
4893 struct loop *loop;
4895 struct loop_ivs *ivs = LOOP_IVS (loop);
4896 struct iv_class *iv = ivs->list;
4898 free (ivs->regs);
4900 while (iv)
4902 struct iv_class *next = iv->next;
4903 struct induction *induction;
4904 struct induction *next_induction;
4906 for (induction = iv->biv; induction; induction = next_induction)
4908 next_induction = induction->next_iv;
4909 free (induction);
4911 for (induction = iv->giv; induction; induction = next_induction)
4913 next_induction = induction->next_iv;
4914 free (induction);
4917 free (iv);
4918 iv = next;
4923 /* Perform strength reduction and induction variable elimination.
4925 Pseudo registers created during this function will be beyond the
4926 last valid index in several tables including
4927 REGS->ARRAY[I].N_TIMES_SET and REGNO_LAST_UID. This does not cause a
4928 problem here, because the added registers cannot be givs outside of
4929 their loop, and hence will never be reconsidered. But scan_loop
4930 must check regnos to make sure they are in bounds. */
4932 static void
4933 strength_reduce (loop, flags)
4934 struct loop *loop;
4935 int flags;
4937 struct loop_info *loop_info = LOOP_INFO (loop);
4938 struct loop_regs *regs = LOOP_REGS (loop);
4939 struct loop_ivs *ivs = LOOP_IVS (loop);
4940 rtx p;
4941 /* Temporary list pointer for traversing ivs->list. */
4942 struct iv_class *bl;
4943 /* Ratio of extra register life span we can justify
4944 for saving an instruction. More if loop doesn't call subroutines
4945 since in that case saving an insn makes more difference
4946 and more registers are available. */
4947 /* ??? could set this to last value of threshold in move_movables */
4948 int threshold = (loop_info->has_call ? 1 : 2) * (3 + n_non_fixed_regs);
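  /* E.g. with 28 allocatable registers and no call in the loop this
     yields 2 * (3 + 28) == 62; n_non_fixed_regs is target-dependent,
     so the number is only illustrative.  */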
4949 /* Map of pseudo-register replacements. */
4950 rtx *reg_map = NULL;
4951 int reg_map_size;
4952 int unrolled_insn_copies = 0;
4953 rtx test_reg = gen_rtx_REG (word_mode, LAST_VIRTUAL_REGISTER + 1);
4954 int insn_count = count_insns_in_loop (loop);
4956 addr_placeholder = gen_reg_rtx (Pmode);
4958 ivs->n_regs = max_reg_before_loop;
4959 ivs->regs = (struct iv *) xcalloc (ivs->n_regs, sizeof (struct iv));
4961 /* Find all BIVs in loop. */
4962 loop_bivs_find (loop);
4964 /* Exit if there are no bivs. */
4965 if (! ivs->list)
4967       /* We can still unroll the loop anyway, but indicate that there is no
4968 strength reduction info available. */
4969 if (flags & LOOP_UNROLL)
4970 unroll_loop (loop, insn_count, 0);
4972 loop_ivs_free (loop);
4973 return;
4976   /* Determine how BIVs are initialized by looking through the
4977      pre-header's extended basic block. */
4978 loop_bivs_init_find (loop);
4980   /* Look at each biv and see if we can say anything better about its
4981 initial value from any initializing insns set up above. */
4982 loop_bivs_check (loop);
4984 /* Search the loop for general induction variables. */
4985 loop_givs_find (loop);
4987 /* Try to calculate and save the number of loop iterations. This is
4988      set to zero if the actual number cannot be calculated.  This must
4989 be called after all giv's have been identified, since otherwise it may
4990 fail if the iteration variable is a giv. */
4991 loop_iterations (loop);
4993 #ifdef HAVE_prefetch
4994 if (flags & LOOP_PREFETCH)
4995 emit_prefetch_instructions (loop);
4996 #endif
4998 /* Now for each giv for which we still don't know whether or not it is
4999 replaceable, check to see if it is replaceable because its final value
5000 can be calculated. This must be done after loop_iterations is called,
5001 so that final_giv_value will work correctly. */
5002 loop_givs_check (loop);
5004 /* Try to prove that the loop counter variable (if any) is always
5005 nonnegative; if so, record that fact with a REG_NONNEG note
5006 so that "decrement and branch until zero" insn can be used. */
5007 check_dbra_loop (loop, insn_count);
5009 /* Create reg_map to hold substitutions for replaceable giv regs.
5010 Some givs might have been made from biv increments, so look at
5011 ivs->reg_iv_type for a suitable size. */
5012 reg_map_size = ivs->n_regs;
5013 reg_map = (rtx *) xcalloc (reg_map_size, sizeof (rtx));
5015 /* Examine each iv class for feasibility of strength reduction/induction
5016 variable elimination. */
5018 for (bl = ivs->list; bl; bl = bl->next)
5020 struct induction *v;
5021 int benefit;
5023 /* Test whether it will be possible to eliminate this biv
5024 provided all givs are reduced. */
5025 bl->eliminable = loop_biv_eliminable_p (loop, bl, threshold, insn_count);
5027 /* This will be true at the end, if all givs which depend on this
5028 biv have been strength reduced.
5029 We can't (currently) eliminate the biv unless this is so. */
5030 bl->all_reduced = 1;
5032 /* Check each extension dependent giv in this class to see if its
5033 root biv is safe from wrapping in the interior mode. */
5034 check_ext_dependent_givs (bl, loop_info);
5036 /* Combine all giv's for this iv_class. */
5037 combine_givs (regs, bl);
5039 for (v = bl->giv; v; v = v->next_iv)
5041 struct induction *tv;
5043 if (v->ignore || v->same)
5044 continue;
5046 benefit = loop_giv_reduce_benefit (loop, bl, v, test_reg);
5048 /* If an insn is not to be strength reduced, then set its ignore
5049 flag, and clear bl->all_reduced. */
5051 /* A giv that depends on a reversed biv must be reduced if it is
5052 used after the loop exit, otherwise, it would have the wrong
5053 value after the loop exit. To make it simple, just reduce all
5054 of such giv's whether or not we know they are used after the loop
5055 exit. */
5057 if (! flag_reduce_all_givs
5058 && v->lifetime * threshold * benefit < insn_count
5059 && ! bl->reversed)
5061 if (loop_dump_stream)
5062 fprintf (loop_dump_stream,
5063 "giv of insn %d not worth while, %d vs %d.\n",
5064 INSN_UID (v->insn),
5065 v->lifetime * threshold * benefit, insn_count);
5066 v->ignore = 1;
5067 bl->all_reduced = 0;
5069 else
5071 /* Check that we can increment the reduced giv without a
5072 multiply insn. If not, reject it. */
5074 for (tv = bl->biv; tv; tv = tv->next_iv)
5075 if (tv->mult_val == const1_rtx
5076 && ! product_cheap_p (tv->add_val, v->mult_val))
5078 if (loop_dump_stream)
5079 fprintf (loop_dump_stream,
5080 "giv of insn %d: would need a multiply.\n",
5081 INSN_UID (v->insn));
5082 v->ignore = 1;
5083 bl->all_reduced = 0;
5084 break;
5089 /* Check for givs whose first use is their definition and whose
5090 last use is the definition of another giv. If so, it is likely
5091 dead and should not be used to derive another giv nor to
5092 eliminate a biv. */
5093 loop_givs_dead_check (loop, bl);
5095 /* Reduce each giv that we decided to reduce. */
5096 loop_givs_reduce (loop, bl);
5098 /* Rescan all givs. If a giv is the same as a giv not reduced, mark it
5099 as not reduced.
5101 For each giv register that can be reduced now: if replaceable,
5102 substitute reduced reg wherever the old giv occurs;
5103 else add new move insn "giv_reg = reduced_reg". */
5104 loop_givs_rescan (loop, bl, reg_map);
5106 /* All the givs based on the biv bl have been reduced if they
5107 merit it. */
5109 /* For each giv not marked as maybe dead that has been combined with a
5110 second giv, clear any "maybe dead" mark on that second giv.
5111 v->new_reg will either be or refer to the register of the giv it
5112 combined with.
5114 Doing this clearing avoids problems in biv elimination where
5115 a giv's new_reg is a complex value that can't be put in the
5116 insn but the giv combined with (with a reg as new_reg) is
5117 marked maybe_dead. Since the register will be used in either
5118 case, we'd prefer it be used from the simpler giv. */
5120 for (v = bl->giv; v; v = v->next_iv)
5121 if (! v->maybe_dead && v->same)
5122 v->same->maybe_dead = 0;
5124 /* Try to eliminate the biv, if it is a candidate.
5125 This won't work if ! bl->all_reduced,
5126 since the givs we planned to use might not have been reduced.
5128 We have to be careful that we didn't initially think we could
5129 eliminate this biv because of a giv that we now think may be
5130 dead and shouldn't be used as a biv replacement.
5132 Also, there is the possibility that we may have a giv that looks
5133 like it can be used to eliminate a biv, but the resulting insn
5134 isn't valid. This can happen, for example, on the 88k, where a
5135 JUMP_INSN can compare a register only with zero. Attempts to
5136 replace it with a compare with a constant will fail.
5138 Note that in cases where this call fails, we may have replaced some
5139 of the occurrences of the biv with a giv, but no harm was done in
5140 doing so in the rare cases where it can occur. */
5142 if (bl->all_reduced == 1 && bl->eliminable
5143 && maybe_eliminate_biv (loop, bl, 1, threshold, insn_count))
5145 /* ?? If we created a new test to bypass the loop entirely,
5146 or otherwise drop straight in, based on this test, then
5147 we might want to rewrite it also. This way some later
5148 pass has more hope of removing the initialization of this
5149 biv entirely. */
5151 /* If final_value != 0, then the biv may be used after loop end
5152 and we must emit an insn to set it just in case.
5154 Reversed bivs already have an insn after the loop setting their
5155 value, so we don't need another one. We can't calculate the
5156 	 proper final value for such a biv here anyway. */
5157 if (bl->final_value && ! bl->reversed)
5158 loop_insn_sink_or_swim (loop, gen_move_insn
5159 (bl->biv->dest_reg, bl->final_value));
5161 if (loop_dump_stream)
5162 fprintf (loop_dump_stream, "Reg %d: biv eliminated\n",
5163 bl->regno);
5165 /* See above note wrt final_value. But since we couldn't eliminate
5166 the biv, we must set the value after the loop instead of before. */
5167 else if (bl->final_value && ! bl->reversed)
5168 loop_insn_sink (loop, gen_move_insn (bl->biv->dest_reg,
5169 bl->final_value));
5172 /* Go through all the instructions in the loop, making all the
5173 register substitutions scheduled in REG_MAP. */
5175 for (p = loop->start; p != loop->end; p = NEXT_INSN (p))
5176 if (GET_CODE (p) == INSN || GET_CODE (p) == JUMP_INSN
5177 || GET_CODE (p) == CALL_INSN)
5179 replace_regs (PATTERN (p), reg_map, reg_map_size, 0);
5180 replace_regs (REG_NOTES (p), reg_map, reg_map_size, 0);
5181 INSN_CODE (p) = -1;
5184 if (loop_info->n_iterations > 0)
5186 /* When we completely unroll a loop we will likely not need the increment
5187 of the loop BIV and we will not need the conditional branch at the
5188 end of the loop. */
5189 unrolled_insn_copies = insn_count - 2;
5191 #ifdef HAVE_cc0
5192 /* When we completely unroll a loop on a HAVE_cc0 machine we will not
5193 need the comparison before the conditional branch at the end of the
5194 loop. */
5195 unrolled_insn_copies -= 1;
5196 #endif
5198 /* We'll need one copy for each loop iteration. */
5199 unrolled_insn_copies *= loop_info->n_iterations;
5201 /* A little slop to account for the ability to remove initialization
5202 code, better CSE, and other secondary benefits of completely
5203 unrolling some loops. */
5204 unrolled_insn_copies -= 1;
5206 /* Clamp the value. */
5207 if (unrolled_insn_copies < 0)
5208 unrolled_insn_copies = 0;
5211 /* Unroll loops from within strength reduction so that we can use the
5212 induction variable information that strength_reduce has already
5213 collected. Always unroll loops that would be as small or smaller
5214 unrolled than when rolled. */
5215 if ((flags & LOOP_UNROLL)
5216 || (loop_info->n_iterations > 0
5217 && unrolled_insn_copies <= insn_count))
5218 unroll_loop (loop, insn_count, 1);
5220 #ifdef HAVE_doloop_end
5221 if (HAVE_doloop_end && (flags & LOOP_BCT) && flag_branch_on_count_reg)
5222 doloop_optimize (loop);
5223 #endif /* HAVE_doloop_end */
5225 /* In case number of iterations is known, drop branch prediction note
5226 in the branch. Do that only in second loop pass, as loop unrolling
5227 may change the number of iterations performed. */
5228 if (flags & LOOP_BCT)
5230 unsigned HOST_WIDE_INT n
5231 = loop_info->n_iterations / loop_info->unroll_number;
5232 if (n > 1)
5233 predict_insn (PREV_INSN (loop->end), PRED_LOOP_ITERATIONS,
5234 REG_BR_PROB_BASE - REG_BR_PROB_BASE / n);
5237 if (loop_dump_stream)
5238 fprintf (loop_dump_stream, "\n");
5240 loop_ivs_free (loop);
5241 if (reg_map)
5242 free (reg_map);
5245 /* Record all basic induction variables calculated in the insn. */
5246 static rtx
5247 check_insn_for_bivs (loop, p, not_every_iteration, maybe_multiple)
5248 struct loop *loop;
5249 rtx p;
5250 int not_every_iteration;
5251 int maybe_multiple;
5253 struct loop_ivs *ivs = LOOP_IVS (loop);
5254 rtx set;
5255 rtx dest_reg;
5256 rtx inc_val;
5257 rtx mult_val;
5258 rtx *location;
5260 if (GET_CODE (p) == INSN
5261 && (set = single_set (p))
5262 && GET_CODE (SET_DEST (set)) == REG)
5264 dest_reg = SET_DEST (set);
5265 if (REGNO (dest_reg) < max_reg_before_loop
5266 && REGNO (dest_reg) >= FIRST_PSEUDO_REGISTER
5267 && REG_IV_TYPE (ivs, REGNO (dest_reg)) != NOT_BASIC_INDUCT)
5269 if (basic_induction_var (loop, SET_SRC (set),
5270 GET_MODE (SET_SRC (set)),
5271 dest_reg, p, &inc_val, &mult_val,
5272 &location))
5274 /* It is a possible basic induction variable.
5275 Create and initialize an induction structure for it. */
5277 struct induction *v
5278 = (struct induction *) xmalloc (sizeof (struct induction));
5280 record_biv (loop, v, p, dest_reg, inc_val, mult_val, location,
5281 not_every_iteration, maybe_multiple);
5282 REG_IV_TYPE (ivs, REGNO (dest_reg)) = BASIC_INDUCT;
5284 else if (REGNO (dest_reg) < ivs->n_regs)
5285 REG_IV_TYPE (ivs, REGNO (dest_reg)) = NOT_BASIC_INDUCT;
5288 return p;
5291 /* Record all givs calculated in the insn.
5292 A register is a giv if: it is only set once, it is a function of a
5293 biv and a constant (or invariant), and it is not a biv. */
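/* That is, a giv has the form

       giv = biv * mult_val + add_val

   with MULT_VAL and ADD_VAL loop-invariant; e.g. an insn
   (set (reg 105) (plus (mult (reg 100) (const_int 4)) (reg 101)))
   where (reg 100) is a biv and (reg 101) is loop-invariant.
   (Illustrative RTL; the register numbers are made up.)  */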
5294 static rtx
5295 check_insn_for_givs (loop, p, not_every_iteration, maybe_multiple)
5296 struct loop *loop;
5297 rtx p;
5298 int not_every_iteration;
5299 int maybe_multiple;
5301 struct loop_regs *regs = LOOP_REGS (loop);
5303 rtx set;
5304 /* Look for a general induction variable in a register. */
5305 if (GET_CODE (p) == INSN
5306 && (set = single_set (p))
5307 && GET_CODE (SET_DEST (set)) == REG
5308 && ! regs->array[REGNO (SET_DEST (set))].may_not_optimize)
5310 rtx src_reg;
5311 rtx dest_reg;
5312 rtx add_val;
5313 rtx mult_val;
5314 rtx ext_val;
5315 int benefit;
5316 rtx regnote = 0;
5317 rtx last_consec_insn;
5319 dest_reg = SET_DEST (set);
5320 if (REGNO (dest_reg) < FIRST_PSEUDO_REGISTER)
5321 return p;
5323 if (/* SET_SRC is a giv. */
5324 (general_induction_var (loop, SET_SRC (set), &src_reg, &add_val,
5325 &mult_val, &ext_val, 0, &benefit, VOIDmode)
5326 /* Equivalent expression is a giv. */
5327 || ((regnote = find_reg_note (p, REG_EQUAL, NULL_RTX))
5328 && general_induction_var (loop, XEXP (regnote, 0), &src_reg,
5329 &add_val, &mult_val, &ext_val, 0,
5330 &benefit, VOIDmode)))
5331 /* Don't try to handle any regs made by loop optimization.
5332 We have nothing on them in regno_first_uid, etc. */
5333 && REGNO (dest_reg) < max_reg_before_loop
5334 /* Don't recognize a BASIC_INDUCT_VAR here. */
5335 && dest_reg != src_reg
5336 /* This must be the only place where the register is set. */
5337 && (regs->array[REGNO (dest_reg)].n_times_set == 1
5338 /* or all sets must be consecutive and make a giv. */
5339 || (benefit = consec_sets_giv (loop, benefit, p,
5340 src_reg, dest_reg,
5341 &add_val, &mult_val, &ext_val,
5342 &last_consec_insn))))
5344 struct induction *v
5345 = (struct induction *) xmalloc (sizeof (struct induction));
5347 /* If this is a library call, increase benefit. */
5348 if (find_reg_note (p, REG_RETVAL, NULL_RTX))
5349 benefit += libcall_benefit (p);
5351 /* Skip the consecutive insns, if there are any. */
5352 if (regs->array[REGNO (dest_reg)].n_times_set != 1)
5353 p = last_consec_insn;
5355 record_giv (loop, v, p, src_reg, dest_reg, mult_val, add_val,
5356 ext_val, benefit, DEST_REG, not_every_iteration,
5357 maybe_multiple, (rtx*) 0);
5362 #ifndef DONT_REDUCE_ADDR
5363 /* Look for givs which are memory addresses. */
5364 /* This resulted in worse code on a VAX 8600. I wonder if it
5365 still does. */
5366 if (GET_CODE (p) == INSN)
5367 find_mem_givs (loop, PATTERN (p), p, not_every_iteration,
5368 maybe_multiple);
5369 #endif
5371 /* Update the status of whether giv can derive other givs. This can
5372 change when we pass a label or an insn that updates a biv. */
5373 if (GET_CODE (p) == INSN || GET_CODE (p) == JUMP_INSN
5374 || GET_CODE (p) == CODE_LABEL)
5375 update_giv_derive (loop, p);
5376 return p;
5379 /* Return 1 if X is a valid source for an initial value (or as value being
5380 compared against in an initial test).
5382 X must be either a register or constant and must not be clobbered between
5383 the current insn and the start of the loop.
5385 INSN is the insn containing X. */
5387 static int
5388 valid_initial_value_p (x, insn, call_seen, loop_start)
5389 rtx x;
5390 rtx insn;
5391 int call_seen;
5392 rtx loop_start;
5394 if (CONSTANT_P (x))
5395 return 1;
5397 /* Only consider pseudos we know about initialized in insns whose luids
5398 we know. */
5399 if (GET_CODE (x) != REG
5400 || REGNO (x) >= max_reg_before_loop)
5401 return 0;
5403   /* Don't use a call-clobbered register across a call which clobbers it.
5404      On some machines, don't use any hard registers at all. */
5405 if (REGNO (x) < FIRST_PSEUDO_REGISTER
5406 && (SMALL_REGISTER_CLASSES
5407 || (call_used_regs[REGNO (x)] && call_seen)))
5408 return 0;
5410 /* Don't use registers that have been clobbered before the start of the
5411 loop. */
5412 if (reg_set_between_p (x, insn, loop_start))
5413 return 0;
5415 return 1;
5418 /* Scan X for memory refs and check each memory address
5419 as a possible giv. INSN is the insn whose pattern X comes from.
5420 NOT_EVERY_ITERATION is 1 if the insn might not be executed during
5421 every loop iteration. MAYBE_MULTIPLE is 1 if the insn might be executed
5422    more than once in each loop iteration. */
5424 static void
5425 find_mem_givs (loop, x, insn, not_every_iteration, maybe_multiple)
5426 const struct loop *loop;
5427 rtx x;
5428 rtx insn;
5429 int not_every_iteration, maybe_multiple;
5431 int i, j;
5432 enum rtx_code code;
5433 const char *fmt;
5435 if (x == 0)
5436 return;
5438 code = GET_CODE (x);
5439 switch (code)
5441 case REG:
5442 case CONST_INT:
5443 case CONST:
5444 case CONST_DOUBLE:
5445 case SYMBOL_REF:
5446 case LABEL_REF:
5447 case PC:
5448 case CC0:
5449 case ADDR_VEC:
5450 case ADDR_DIFF_VEC:
5451 case USE:
5452 case CLOBBER:
5453 return;
5455 case MEM:
5457 rtx src_reg;
5458 rtx add_val;
5459 rtx mult_val;
5460 rtx ext_val;
5461 int benefit;
5463 /* This code used to disable creating GIVs with mult_val == 1 and
5464 add_val == 0. However, this leads to lost optimizations when
5465 it comes time to combine a set of related DEST_ADDR GIVs, since
5466 this one would not be seen. */
5468 if (general_induction_var (loop, XEXP (x, 0), &src_reg, &add_val,
5469 &mult_val, &ext_val, 1, &benefit,
5470 GET_MODE (x)))
5472 /* Found one; record it. */
5473 struct induction *v
5474 = (struct induction *) xmalloc (sizeof (struct induction));
5476 record_giv (loop, v, insn, src_reg, addr_placeholder, mult_val,
5477 add_val, ext_val, benefit, DEST_ADDR,
5478 not_every_iteration, maybe_multiple, &XEXP (x, 0));
5480 v->mem = x;
5483 return;
5485 default:
5486 break;
5489 /* Recursively scan the subexpressions for other mem refs. */
5491 fmt = GET_RTX_FORMAT (code);
5492 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
5493 if (fmt[i] == 'e')
5494 find_mem_givs (loop, XEXP (x, i), insn, not_every_iteration,
5495 maybe_multiple);
5496 else if (fmt[i] == 'E')
5497 for (j = 0; j < XVECLEN (x, i); j++)
5498 find_mem_givs (loop, XVECEXP (x, i, j), insn, not_every_iteration,
5499 maybe_multiple);
5502 /* Fill in the data about one biv update.
5503 V is the `struct induction' in which we record the biv. (It is
5504 allocated by the caller, with alloca.)
5505 INSN is the insn that sets it.
5506 DEST_REG is the biv's reg.
5508 MULT_VAL is const1_rtx if the biv is being incremented here, in which case
5509 INC_VAL is the increment. Otherwise, MULT_VAL is const0_rtx and the biv is
5510 being set to INC_VAL.
5512 NOT_EVERY_ITERATION is nonzero if this biv update is not known to be
5513 executed every iteration; MAYBE_MULTIPLE is nonzero if this biv update
5514 can be executed more than once per iteration. If MAYBE_MULTIPLE
5515 and NOT_EVERY_ITERATION are both zero, we know that the biv update is
5516 executed exactly once per iteration. */
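/* An illustrative sketch (not from the sources): for a biv i,

       i = i + 4   is recorded with MULT_VAL == const1_rtx, INC_VAL == 4;
       i = 17      is recorded with MULT_VAL == const0_rtx, INC_VAL == 17.

   The MULT_VAL convention thus distinguishes a true increment from a
   plain assignment.  */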
5518 static void
5519 record_biv (loop, v, insn, dest_reg, inc_val, mult_val, location,
5520 not_every_iteration, maybe_multiple)
5521 struct loop *loop;
5522 struct induction *v;
5523 rtx insn;
5524 rtx dest_reg;
5525 rtx inc_val;
5526 rtx mult_val;
5527 rtx *location;
5528 int not_every_iteration;
5529 int maybe_multiple;
5531 struct loop_ivs *ivs = LOOP_IVS (loop);
5532 struct iv_class *bl;
5534 v->insn = insn;
5535 v->src_reg = dest_reg;
5536 v->dest_reg = dest_reg;
5537 v->mult_val = mult_val;
5538 v->add_val = inc_val;
5539 v->ext_dependent = NULL_RTX;
5540 v->location = location;
5541 v->mode = GET_MODE (dest_reg);
5542 v->always_computable = ! not_every_iteration;
5543 v->always_executed = ! not_every_iteration;
5544 v->maybe_multiple = maybe_multiple;
5546 /* Add this to the reg's iv_class, creating a class
5547 if this is the first incrementation of the reg. */
5549 bl = REG_IV_CLASS (ivs, REGNO (dest_reg));
5550 if (bl == 0)
5552 /* Create and initialize new iv_class. */
5554 bl = (struct iv_class *) xmalloc (sizeof (struct iv_class));
5556 bl->regno = REGNO (dest_reg);
5557 bl->biv = 0;
5558 bl->giv = 0;
5559 bl->biv_count = 0;
5560 bl->giv_count = 0;
5562 /* Set initial value to the reg itself. */
5563 bl->initial_value = dest_reg;
5564 bl->final_value = 0;
5565 /* We haven't seen the initializing insn yet */
5566 bl->init_insn = 0;
5567 bl->init_set = 0;
5568 bl->initial_test = 0;
5569 bl->incremented = 0;
5570 bl->eliminable = 0;
5571 bl->nonneg = 0;
5572 bl->reversed = 0;
5573 bl->total_benefit = 0;
5575 /* Add this class to ivs->list. */
5576 bl->next = ivs->list;
5577 ivs->list = bl;
5579 /* Put it in the array of biv register classes. */
5580 REG_IV_CLASS (ivs, REGNO (dest_reg)) = bl;
5583 /* Update IV_CLASS entry for this biv. */
5584 v->next_iv = bl->biv;
5585 bl->biv = v;
5586 bl->biv_count++;
5587 if (mult_val == const1_rtx)
5588 bl->incremented = 1;
5590 if (loop_dump_stream)
5591 loop_biv_dump (v, loop_dump_stream, 0);
5594 /* Fill in the data about one giv.
5595 V is the `struct induction' in which we record the giv. (It is
5596 allocated by the caller, with alloca.)
5597 INSN is the insn that sets it.
5598 BENEFIT estimates the savings from deleting this insn.
5599 TYPE is DEST_REG or DEST_ADDR; it says whether the giv is computed
5600 into a register or is used as a memory address.
5602 SRC_REG is the biv reg which the giv is computed from.
5603 DEST_REG is the giv's reg (if the giv is stored in a reg).
5604 MULT_VAL and ADD_VAL are the coefficients used to compute the giv.
5605 LOCATION points to the place where this giv's value appears in INSN. */
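/* A hypothetical example: for the biv i and the insn

       j = i * 4 + 8

   SRC_REG is i, DEST_REG is j, MULT_VAL is (const_int 4), ADD_VAL is
   (const_int 8), and TYPE is DEST_REG.  Had the same expression been
   found inside a MEM address, TYPE would be DEST_ADDR instead.  */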
5607 static void
5608 record_giv (loop, v, insn, src_reg, dest_reg, mult_val, add_val, ext_val,
5609 benefit, type, not_every_iteration, maybe_multiple, location)
5610 const struct loop *loop;
5611 struct induction *v;
5612 rtx insn;
5613 rtx src_reg;
5614 rtx dest_reg;
5615 rtx mult_val, add_val, ext_val;
5616 int benefit;
5617 enum g_types type;
5618 int not_every_iteration, maybe_multiple;
5619 rtx *location;
5621 struct loop_ivs *ivs = LOOP_IVS (loop);
5622 struct induction *b;
5623 struct iv_class *bl;
5624 rtx set = single_set (insn);
5625 rtx temp;
5627 /* Attempt to prove constantness of the values. Don't let simplify_rtx
5628 undo the MULT canonicalization that we performed earlier. */
5629 temp = simplify_rtx (add_val);
5630 if (temp
5631 && ! (GET_CODE (add_val) == MULT
5632 && GET_CODE (temp) == ASHIFT))
5633 add_val = temp;
5635 v->insn = insn;
5636 v->src_reg = src_reg;
5637 v->giv_type = type;
5638 v->dest_reg = dest_reg;
5639 v->mult_val = mult_val;
5640 v->add_val = add_val;
5641 v->ext_dependent = ext_val;
5642 v->benefit = benefit;
5643 v->location = location;
5644 v->cant_derive = 0;
5645 v->combined_with = 0;
5646 v->maybe_multiple = maybe_multiple;
5647 v->maybe_dead = 0;
5648 v->derive_adjustment = 0;
5649 v->same = 0;
5650 v->ignore = 0;
5651 v->new_reg = 0;
5652 v->final_value = 0;
5653 v->same_insn = 0;
5654 v->auto_inc_opt = 0;
5655 v->unrolled = 0;
5656 v->shared = 0;
5658 /* The v->always_computable field is used in update_giv_derive, to
5659 determine whether a giv can be used to derive another giv. For a
5660 DEST_REG giv, INSN computes a new value for the giv, so its value
5661 isn't computable if INSN isn't executed every iteration.
5662 However, for a DEST_ADDR giv, INSN merely uses the value of the giv;
5663 it does not compute a new value. Hence the value is always computable
5664 regardless of whether INSN is executed each iteration. */
5666 if (type == DEST_ADDR)
5667 v->always_computable = 1;
5668 else
5669 v->always_computable = ! not_every_iteration;
5671 v->always_executed = ! not_every_iteration;
5673 if (type == DEST_ADDR)
5675 v->mode = GET_MODE (*location);
5676 v->lifetime = 1;
5678 else /* type == DEST_REG */
5680 v->mode = GET_MODE (SET_DEST (set));
5682 v->lifetime = LOOP_REG_LIFETIME (loop, REGNO (dest_reg));
5684 /* If the lifetime is zero, it means that this register is
5685 really a dead store. So mark this as a giv that can be
5686 ignored. This will not prevent the biv from being eliminated. */
5687 if (v->lifetime == 0)
5688 v->ignore = 1;
5690 REG_IV_TYPE (ivs, REGNO (dest_reg)) = GENERAL_INDUCT;
5691 REG_IV_INFO (ivs, REGNO (dest_reg)) = v;
5694 /* Add the giv to the class of givs computed from one biv. */
5696 bl = REG_IV_CLASS (ivs, REGNO (src_reg));
5697 if (bl)
5699 v->next_iv = bl->giv;
5700 bl->giv = v;
5701 /* Don't count DEST_ADDR. This is supposed to count the number of
5702 insns that calculate givs. */
5703 if (type == DEST_REG)
5704 bl->giv_count++;
5705 bl->total_benefit += benefit;
5707 else
5708 /* Fatal error, biv missing for this giv? */
5709 abort ();
5711 if (type == DEST_ADDR)
5712 v->replaceable = 1;
5713 else
5715 /* The giv can be replaced outright by the reduced register only if all
5716 of the following conditions are true:
5717 - the insn that sets the giv is always executed on any iteration
5718 on which the giv is used at all
5719 (there are two ways to deduce this:
5720 either the insn is executed on every iteration,
5721 or all uses follow that insn in the same basic block),
5722 - the giv is not used outside the loop
5723 - no assignments to the biv occur during the giv's lifetime. */
5725 if (REGNO_FIRST_UID (REGNO (dest_reg)) == INSN_UID (insn)
5726 /* Previous line always fails if INSN was moved by loop opt. */
5727 && REGNO_LAST_LUID (REGNO (dest_reg))
5728 < INSN_LUID (loop->end)
5729 && (! not_every_iteration
5730 || last_use_this_basic_block (dest_reg, insn)))
5732 /* Now check that there are no assignments to the biv within the
5733 giv's lifetime. This requires two separate checks. */
5735 /* Check each biv update, and fail if any are between the first
5736 and last use of the giv.
5738 If this loop contains an inner loop that was unrolled, then
5739 the insn modifying the biv may have been emitted by the loop
5740 unrolling code, and hence does not have a valid luid. Just
5741 mark the biv as not replaceable in this case. It is not very
5742 useful as a biv, because it is used in two different loops.
5743 It is very unlikely that we would be able to optimize the giv
5744 using this biv anyways. */
5746 v->replaceable = 1;
5747 for (b = bl->biv; b; b = b->next_iv)
5749 if (INSN_UID (b->insn) >= max_uid_for_loop
5750 || ((INSN_LUID (b->insn)
5751 >= REGNO_FIRST_LUID (REGNO (dest_reg)))
5752 && (INSN_LUID (b->insn)
5753 <= REGNO_LAST_LUID (REGNO (dest_reg)))))
5755 v->replaceable = 0;
5756 v->not_replaceable = 1;
5757 break;
5761 /* If there are any backwards branches that go from after the
5762 biv update to before it, then this giv is not replaceable. */
5763 if (v->replaceable)
5764 for (b = bl->biv; b; b = b->next_iv)
5765 if (back_branch_in_range_p (loop, b->insn))
5767 v->replaceable = 0;
5768 v->not_replaceable = 1;
5769 break;
5772 else
5774 /* May still be replaceable, we don't have enough info here to
5775 decide. */
5776 v->replaceable = 0;
5777 v->not_replaceable = 0;
5781 /* Record whether the add_val contains a const_int, for later use by
5782 combine_givs. */
5784 rtx tem = add_val;
5786 v->no_const_addval = 1;
5787 if (tem == const0_rtx)
5789 else if (CONSTANT_P (add_val))
5790 v->no_const_addval = 0;
5791 if (GET_CODE (tem) == PLUS)
5793 while (1)
5795 if (GET_CODE (XEXP (tem, 0)) == PLUS)
5796 tem = XEXP (tem, 0);
5797 else if (GET_CODE (XEXP (tem, 1)) == PLUS)
5798 tem = XEXP (tem, 1);
5799 else
5800 break;
5802 if (CONSTANT_P (XEXP (tem, 1)))
5803 v->no_const_addval = 0;
5807 if (loop_dump_stream)
5808 loop_giv_dump (v, loop_dump_stream, 0);
5811 /* All this does is determine whether a giv can be made replaceable because
5812 its final value can be calculated. This code can not be part of record_giv
5813 above, because final_giv_value requires that the number of loop iterations
5814 be known, and that can not be accurately calculated until after all givs
5815 have been identified. */
5817 static void
5818 check_final_value (loop, v)
5819 const struct loop *loop;
5820 struct induction *v;
5822 struct loop_ivs *ivs = LOOP_IVS (loop);
5823 struct iv_class *bl;
5824 rtx final_value = 0;
5826 bl = REG_IV_CLASS (ivs, REGNO (v->src_reg));
5828 /* DEST_ADDR givs will never reach here, because they are always marked
5829 replaceable above in record_giv. */
5831 /* The giv can be replaced outright by the reduced register only if all
5832 of the following conditions are true:
5833 - the insn that sets the giv is always executed on any iteration
5834 on which the giv is used at all
5835 (there are two ways to deduce this:
5836 either the insn is executed on every iteration,
5837 or all uses follow that insn in the same basic block),
5838 - its final value can be calculated (this condition is different
5839 than the one above in record_giv)
5840 - it's not used before it's set
5841 - no assignments to the biv occur during the giv's lifetime. */
5843 #if 0
5844 /* This is only called now when replaceable is known to be false. */
5845 /* Clear replaceable, so that it won't confuse final_giv_value. */
5846 v->replaceable = 0;
5847 #endif
5849 if ((final_value = final_giv_value (loop, v))
5850 && (v->always_computable || last_use_this_basic_block (v->dest_reg, v->insn)))
5852 int biv_increment_seen = 0, before_giv_insn = 0;
5853 rtx p = v->insn;
5854 rtx last_giv_use;
5856 v->replaceable = 1;
5858 /* When trying to determine whether or not a biv increment occurs
5859 during the lifetime of the giv, we can ignore uses of the variable
5860 outside the loop because final_value is true. Hence we can not
5861 use regno_last_uid and regno_first_uid as above in record_giv. */
5863 /* Search the loop to determine whether any assignments to the
5864 biv occur during the giv's lifetime. Start with the insn
5865 that sets the giv, and search around the loop until we come
5866 back to that insn again.
5868 Also fail if there is a jump within the giv's lifetime that jumps
5869 to somewhere outside the lifetime but still within the loop. This
5870 catches spaghetti code where the execution order is not linear, and
5871 hence the above test fails. Here we assume that the giv lifetime
5872 does not extend from one iteration of the loop to the next, so as
5873 to make the test easier. Since the lifetime isn't known yet,
5874 this requires two loops. See also record_giv above. */
5876 last_giv_use = v->insn;
5878 while (1)
5880 p = NEXT_INSN (p);
5881 if (p == loop->end)
5883 before_giv_insn = 1;
5884 p = NEXT_INSN (loop->start);
5886 if (p == v->insn)
5887 break;
5889 if (GET_CODE (p) == INSN || GET_CODE (p) == JUMP_INSN
5890 || GET_CODE (p) == CALL_INSN)
5892 /* It is possible for the BIV increment to use the GIV if we
5893 have a cycle. Thus we must be sure to check each insn for
5894 both BIV and GIV uses, and we must check for BIV uses
5895 first. */
5897 if (! biv_increment_seen
5898 && reg_set_p (v->src_reg, PATTERN (p)))
5899 biv_increment_seen = 1;
5901 if (reg_mentioned_p (v->dest_reg, PATTERN (p)))
5903 if (biv_increment_seen || before_giv_insn)
5905 v->replaceable = 0;
5906 v->not_replaceable = 1;
5907 break;
5909 last_giv_use = p;
5914 /* Now that the lifetime of the giv is known, check for branches
5915 from within the lifetime to outside the lifetime if it is still
5916 replaceable. */
5918 if (v->replaceable)
5920 p = v->insn;
5921 while (1)
5923 p = NEXT_INSN (p);
5924 if (p == loop->end)
5925 p = NEXT_INSN (loop->start);
5926 if (p == last_giv_use)
5927 break;
5929 if (GET_CODE (p) == JUMP_INSN && JUMP_LABEL (p)
5930 && LABEL_NAME (JUMP_LABEL (p))
5931 && ((loop_insn_first_p (JUMP_LABEL (p), v->insn)
5932 && loop_insn_first_p (loop->start, JUMP_LABEL (p)))
5933 || (loop_insn_first_p (last_giv_use, JUMP_LABEL (p))
5934 && loop_insn_first_p (JUMP_LABEL (p), loop->end))))
5936 v->replaceable = 0;
5937 v->not_replaceable = 1;
5939 if (loop_dump_stream)
5940 fprintf (loop_dump_stream,
5941 "Found branch outside giv lifetime.\n");
5943 break;
5948 /* If it is replaceable, then save the final value. */
5949 if (v->replaceable)
5950 v->final_value = final_value;
5953 if (loop_dump_stream && v->replaceable)
5954 fprintf (loop_dump_stream, "Insn %d: giv reg %d final_value replaceable\n",
5955 INSN_UID (v->insn), REGNO (v->dest_reg));
5958 /* Update the status of whether a giv can derive other givs.
5960 We need to do something special if there is or may be an update to the biv
5961 between the time the giv is defined and the time it is used to derive
5962 another giv.
5964 In addition, a giv that is only conditionally set is not allowed to
5965 derive another giv once a label has been passed.
5967 The cases we look at are when a label or an update to a biv is passed. */
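/* For illustration only: if the giv g = b * 3 is computed, the biv
   update b = b + 2 executes, and only then is g used to derive another
   giv, the derived giv must be adjusted by 2 * 3 == 6; that product is
   the derive_adjustment recorded below.  */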
5969 static void
5970 update_giv_derive (loop, p)
5971 const struct loop *loop;
5972 rtx p;
5974 struct loop_ivs *ivs = LOOP_IVS (loop);
5975 struct iv_class *bl;
5976 struct induction *biv, *giv;
5977 rtx tem;
5978 int dummy;
5980 /* Search all IV classes, then all bivs, and finally all givs.
5982 There are three cases we are concerned with. First we have the situation
5983 of a giv that is only updated conditionally. In that case, it may not
5984 derive any givs after a label is passed.
5986 The second case is when a biv update occurs, or may occur, after the
5987 definition of a giv. For certain biv updates (see below) that are
5988 known to occur between the giv definition and use, we can adjust the
5989 giv definition. For others, or when the biv update is conditional,
5990 we must prevent the giv from deriving any other givs. There are two
5991 sub-cases within this case.
5993 If this is a label, we are concerned with any biv update that is done
5994 conditionally, since it may be done after the giv is defined followed by
5995 a branch here (actually, we need to pass both a jump and a label, but
5996 this extra tracking doesn't seem worth it).
5998 If this is a jump, we are concerned about any biv update that may be
5999 executed multiple times. We are actually only concerned about
6000 backward jumps, but it is probably not worth performing the test
6001 on the jump again here.
6003 If this is a biv update, we must adjust the giv status to show that a
6004 subsequent biv update was performed. If this adjustment cannot be done,
6005 the giv cannot derive further givs. */
6007 for (bl = ivs->list; bl; bl = bl->next)
6008 for (biv = bl->biv; biv; biv = biv->next_iv)
6009 if (GET_CODE (p) == CODE_LABEL || GET_CODE (p) == JUMP_INSN
6010 || biv->insn == p)
6012 for (giv = bl->giv; giv; giv = giv->next_iv)
6014 /* If cant_derive is already true, there is no point in
6015 checking all of these conditions again. */
6016 if (giv->cant_derive)
6017 continue;
6019 /* If this giv is conditionally set and we have passed a label,
6020 it cannot derive anything. */
6021 if (GET_CODE (p) == CODE_LABEL && ! giv->always_computable)
6022 giv->cant_derive = 1;
6024 /* Skip givs that have mult_val == 0, since
6025 they are really invariants. Also skip those that are
6026 replaceable, since we know their lifetime doesn't contain
6027 any biv update. */
6028 else if (giv->mult_val == const0_rtx || giv->replaceable)
6029 continue;
6031 /* The only way we can allow this giv to derive another
6032 is if this is a biv increment and we can form the product
6033 of biv->add_val and giv->mult_val. In this case, we will
6034 be able to compute a compensation. */
6035 else if (biv->insn == p)
6037 rtx ext_val_dummy;
6039 tem = 0;
6040 if (biv->mult_val == const1_rtx)
6041 tem = simplify_giv_expr (loop,
6042 gen_rtx_MULT (giv->mode,
6043 biv->add_val,
6044 giv->mult_val),
6045 &ext_val_dummy, &dummy);
6047 if (tem && giv->derive_adjustment)
6048 tem = simplify_giv_expr
6049 (loop,
6050 gen_rtx_PLUS (giv->mode, tem, giv->derive_adjustment),
6051 &ext_val_dummy, &dummy);
6053 if (tem)
6054 giv->derive_adjustment = tem;
6055 else
6056 giv->cant_derive = 1;
6058 else if ((GET_CODE (p) == CODE_LABEL && ! biv->always_computable)
6059 || (GET_CODE (p) == JUMP_INSN && biv->maybe_multiple))
6060 giv->cant_derive = 1;
6065 /* Check whether an insn is an increment legitimate for a basic induction var.
6066 X is the source of insn P, or a part of it.
6067 MODE is the mode in which X should be interpreted.
6069 DEST_REG is the putative biv, also the destination of the insn.
6070 We accept patterns of these forms:
6071 REG = REG + INVARIANT (includes REG = REG - CONSTANT)
6072 REG = INVARIANT + REG
6074 If X is suitable, we return 1, set *MULT_VAL to CONST1_RTX,
6075 store the additive term into *INC_VAL, and store the place where
6076 we found the additive term into *LOCATION.
6078 If X is an assignment of an invariant into DEST_REG, we set
6079 *MULT_VAL to CONST0_RTX, and store the invariant into *INC_VAL.
6081 We also want to detect a BIV when it corresponds to a variable
6082 whose mode was promoted via PROMOTED_MODE. In that case, an increment
6083 of the variable may be a PLUS that adds a SUBREG of that variable to
6084 an invariant and then sign- or zero-extends the result of the PLUS
6085 into the variable.
6087 Most GIVs in such cases will be in the promoted mode, since that is
6088 probably the natural computation mode (and almost certainly the mode
6089 used for addresses) on the machine. So we view the pseudo-reg containing
6090 the variable as the BIV, as if it were simply incremented.
6092 Note that treating the entire pseudo as a BIV will result in making
6093 simple increments to any GIVs based on it. However, if the variable
6094 overflows in its declared mode but not its promoted mode, the result will
6095 be incorrect. This is acceptable if the variable is signed, since
6096 overflows in such cases are undefined, but not if it is unsigned, since
6097 those overflows are defined. So we only check for SIGN_EXTEND and
6098 not ZERO_EXTEND.
6100 If we cannot find a biv, we return 0. */
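/* Purely illustrative instances of the accepted patterns, taking
   DEST_REG to be (reg 100):

       (plus:SI (reg 100) (const_int 4))  yields *MULT_VAL == const1_rtx
                                          and *INC_VAL == (const_int 4);
       (const_int 0)                      yields *MULT_VAL == const0_rtx
                                          and *INC_VAL == (const_int 0).  */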
6102 static int
6103 basic_induction_var (loop, x, mode, dest_reg, p, inc_val, mult_val, location)
6104 const struct loop *loop;
6105 rtx x;
6106 enum machine_mode mode;
6107 rtx dest_reg;
6108 rtx p;
6109 rtx *inc_val;
6110 rtx *mult_val;
6111 rtx **location;
6113 enum rtx_code code;
6114 rtx *argp, arg;
6115 rtx insn, set = 0;
6117 code = GET_CODE (x);
6118 *location = NULL;
6119 switch (code)
6121 case PLUS:
6122 if (rtx_equal_p (XEXP (x, 0), dest_reg)
6123 || (GET_CODE (XEXP (x, 0)) == SUBREG
6124 && SUBREG_PROMOTED_VAR_P (XEXP (x, 0))
6125 && SUBREG_REG (XEXP (x, 0)) == dest_reg))
6127 argp = &XEXP (x, 1);
6129 else if (rtx_equal_p (XEXP (x, 1), dest_reg)
6130 || (GET_CODE (XEXP (x, 1)) == SUBREG
6131 && SUBREG_PROMOTED_VAR_P (XEXP (x, 1))
6132 && SUBREG_REG (XEXP (x, 1)) == dest_reg))
6134 argp = &XEXP (x, 0);
6136 else
6137 return 0;
6139 arg = *argp;
6140 if (loop_invariant_p (loop, arg) != 1)
6141 return 0;
6143 *inc_val = convert_modes (GET_MODE (dest_reg), GET_MODE (x), arg, 0);
6144 *mult_val = const1_rtx;
6145 *location = argp;
6146 return 1;
6148 case SUBREG:
6149 /* If what's inside the SUBREG is a BIV, then so is the SUBREG. This will
6150 handle addition of promoted variables.
6151 ??? The comment at the start of this function is wrong: promoted
6152 variable increments don't look like it says they do. */
6153 return basic_induction_var (loop, SUBREG_REG (x),
6154 GET_MODE (SUBREG_REG (x)),
6155 dest_reg, p, inc_val, mult_val, location);
6157 case REG:
6158 /* If this register is assigned in a previous insn, look at its
6159 source, but don't go outside the loop or past a label. */
6161 /* If this sets a register to itself, we would repeat any previous
6162 biv increment if we applied this strategy blindly. */
6163 if (rtx_equal_p (dest_reg, x))
6164 return 0;
6166 insn = p;
6167 while (1)
6169 rtx dest;
6171 do
6172 insn = PREV_INSN (insn);
6174 while (insn && GET_CODE (insn) == NOTE
6175 && NOTE_LINE_NUMBER (insn) != NOTE_INSN_LOOP_BEG);
6177 if (!insn)
6178 break;
6179 set = single_set (insn);
6180 if (set == 0)
6181 break;
6182 dest = SET_DEST (set);
6183 if (dest == x
6184 || (GET_CODE (dest) == SUBREG
6185 && (GET_MODE_SIZE (GET_MODE (dest)) <= UNITS_PER_WORD)
6186 && (GET_MODE_CLASS (GET_MODE (dest)) == MODE_INT)
6187 && SUBREG_REG (dest) == x))
6188 return basic_induction_var (loop, SET_SRC (set),
6189 (GET_MODE (SET_SRC (set)) == VOIDmode
6190 ? GET_MODE (x)
6191 : GET_MODE (SET_SRC (set))),
6192 dest_reg, insn,
6193 inc_val, mult_val, location);
6195 while (GET_CODE (dest) == SIGN_EXTRACT
6196 || GET_CODE (dest) == ZERO_EXTRACT
6197 || GET_CODE (dest) == SUBREG
6198 || GET_CODE (dest) == STRICT_LOW_PART)
6199 dest = XEXP (dest, 0);
6200 if (dest == x)
6201 break;
6203 /* Fall through. */
6205 /* Can accept constant setting of biv only when inside innermost loop.
6206 Otherwise, a biv of an inner loop may be incorrectly recognized
6207 as a biv of the outer loop,
6208 causing code to be moved INTO the inner loop. */
6209 case MEM:
6210 if (loop_invariant_p (loop, x) != 1)
6211 return 0;
6212 case CONST_INT:
6213 case SYMBOL_REF:
6214 case CONST:
6215 /* convert_modes aborts if we try to convert to or from CCmode, so just
6216 exclude that case. It is very unlikely that a condition code value
6217 would be a useful iterator anyways. */
6218 if (loop->level == 1
6219 && GET_MODE_CLASS (mode) != MODE_CC
6220 && GET_MODE_CLASS (GET_MODE (dest_reg)) != MODE_CC)
6222 /* Possible bug here? Perhaps we don't know the mode of X. */
6223 *inc_val = convert_modes (GET_MODE (dest_reg), mode, x, 0);
6224 *mult_val = const0_rtx;
6225 return 1;
6227 else
6228 return 0;
6230 case SIGN_EXTEND:
6231 return basic_induction_var (loop, XEXP (x, 0), GET_MODE (XEXP (x, 0)),
6232 dest_reg, p, inc_val, mult_val, location);
6234 case ASHIFTRT:
6235 /* Similar, since this can be a sign extension. */
6236 for (insn = PREV_INSN (p);
6237 (insn && GET_CODE (insn) == NOTE
6238 && NOTE_LINE_NUMBER (insn) != NOTE_INSN_LOOP_BEG);
6239 insn = PREV_INSN (insn))
6240 ;
6242 if (insn)
6243 set = single_set (insn);
6245 if (! rtx_equal_p (dest_reg, XEXP (x, 0))
6246 && set && SET_DEST (set) == XEXP (x, 0)
6247 && GET_CODE (XEXP (x, 1)) == CONST_INT
6248 && INTVAL (XEXP (x, 1)) >= 0
6249 && GET_CODE (SET_SRC (set)) == ASHIFT
6250 && XEXP (x, 1) == XEXP (SET_SRC (set), 1))
6251 return basic_induction_var (loop, XEXP (SET_SRC (set), 0),
6252 GET_MODE (XEXP (x, 0)),
6253 dest_reg, insn, inc_val, mult_val,
6254 location);
6255 return 0;
6257 default:
6258 return 0;
6262 /* A general induction variable (giv) is any quantity that is a linear
6263 function of a basic induction variable,
6264 i.e. giv = biv * mult_val + add_val.
6265 The coefficients can be any loop invariant quantity.
6266 A giv need not be computed directly from the biv;
6267 it can be computed by way of other givs. */
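/* For example (hypothetical): if i is a biv, then

       j = 3 * i + 2   is a giv with mult_val == 3 and add_val == 2, and
       k = 2 * j       is also a giv, since substitution gives
                       k = 6 * i + 4.  */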
6269 /* Determine whether X computes a giv.
6270 If it does, return a nonzero value
6271 which is the benefit from eliminating the computation of X;
6272 set *SRC_REG to the register of the biv that it is computed from;
6273 set *ADD_VAL and *MULT_VAL to the coefficients,
6274 such that the value of X is biv * mult + add; */
6276 static int
6277 general_induction_var (loop, x, src_reg, add_val, mult_val, ext_val,
6278 is_addr, pbenefit, addr_mode)
6279 const struct loop *loop;
6280 rtx x;
6281 rtx *src_reg;
6282 rtx *add_val;
6283 rtx *mult_val;
6284 rtx *ext_val;
6285 int is_addr;
6286 int *pbenefit;
6287 enum machine_mode addr_mode;
6289 struct loop_ivs *ivs = LOOP_IVS (loop);
6290 rtx orig_x = x;
6292 /* If this is an invariant, forget it, it isn't a giv. */
6293 if (loop_invariant_p (loop, x) == 1)
6294 return 0;
6296 *pbenefit = 0;
6297 *ext_val = NULL_RTX;
6298 x = simplify_giv_expr (loop, x, ext_val, pbenefit);
6299 if (x == 0)
6300 return 0;
6302 switch (GET_CODE (x))
6304 case USE:
6305 case CONST_INT:
6306 /* Since this is now an invariant and wasn't before, it must be a giv
6307 with MULT_VAL == 0. It doesn't matter which BIV we associate this
6308 with. */
6309 *src_reg = ivs->list->biv->dest_reg;
6310 *mult_val = const0_rtx;
6311 *add_val = x;
6312 break;
6314 case REG:
6315 /* This is equivalent to a BIV. */
6316 *src_reg = x;
6317 *mult_val = const1_rtx;
6318 *add_val = const0_rtx;
6319 break;
6321 case PLUS:
6322 /* Either (plus (biv) (invar)) or
6323 (plus (mult (biv) (invar_1)) (invar_2)). */
6324 if (GET_CODE (XEXP (x, 0)) == MULT)
6326 *src_reg = XEXP (XEXP (x, 0), 0);
6327 *mult_val = XEXP (XEXP (x, 0), 1);
6329 else
6331 *src_reg = XEXP (x, 0);
6332 *mult_val = const1_rtx;
6334 *add_val = XEXP (x, 1);
6335 break;
6337 case MULT:
6338 /* ADD_VAL is zero. */
6339 *src_reg = XEXP (x, 0);
6340 *mult_val = XEXP (x, 1);
6341 *add_val = const0_rtx;
6342 break;
6344 default:
6345 abort ();
6348 /* Remove any enclosing USE from ADD_VAL and MULT_VAL (there will be one
6349 unless they are CONST_INTs). */
6350 if (GET_CODE (*add_val) == USE)
6351 *add_val = XEXP (*add_val, 0);
6352 if (GET_CODE (*mult_val) == USE)
6353 *mult_val = XEXP (*mult_val, 0);
6355 if (is_addr)
6356 *pbenefit += address_cost (orig_x, addr_mode) - reg_address_cost;
6357 else
6358 *pbenefit += rtx_cost (orig_x, SET);
6360 /* Always return true if this is a giv so it will be detected as such,
6361 even if the benefit is zero or negative. This allows elimination
6362 of bivs that might otherwise not be eliminated. */
6363 return 1;
6366 /* Given an expression, X, try to form it as a linear function of a biv.
6367 We will canonicalize it to be of the form
6368 (plus (mult (BIV) (invar_1))
6369 (invar_2))
6370 with possible degeneracies.
6372 The invariant expressions must each be of a form that can be used as a
6373 machine operand. We surround them with a USE rtx (a hack, but localized
6374 and certainly unambiguous!) if not a CONST_INT for simplicity in this
6375 routine; it is the caller's responsibility to strip them.
6377 If no such canonicalization is possible (i.e., two biv's are used or an
6378 expression that is neither invariant nor a biv or giv), this routine
6379 returns 0.
6381 For a non-zero return, the result will have a code of CONST_INT, USE,
6382 REG (for a BIV), PLUS, or MULT. No other codes will occur.
6384 *BENEFIT will be incremented by the benefit of any sub-giv encountered. */
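/* An illustrative canonicalization (not from the sources): with biv b
   and loop invariant w,

       (b + w) * 3  ==>  (plus (mult b 3) (use (mult w 3)))

   i.e. invar_1 is 3 and invar_2 is w * 3, the latter wrapped in a USE
   because it is not a CONST_INT.  */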
6386 static rtx sge_plus PARAMS ((enum machine_mode, rtx, rtx));
6387 static rtx sge_plus_constant PARAMS ((rtx, rtx));
6389 static rtx
6390 simplify_giv_expr (loop, x, ext_val, benefit)
6391 const struct loop *loop;
6392 rtx x;
6393 rtx *ext_val;
6394 int *benefit;
6396 struct loop_ivs *ivs = LOOP_IVS (loop);
6397 struct loop_regs *regs = LOOP_REGS (loop);
6398 enum machine_mode mode = GET_MODE (x);
6399 rtx arg0, arg1;
6400 rtx tem;
6402 /* If this is not an integer mode, or if we cannot do arithmetic in this
6403 mode, this can't be a giv. */
6404 if (mode != VOIDmode
6405 && (GET_MODE_CLASS (mode) != MODE_INT
6406 || GET_MODE_BITSIZE (mode) > HOST_BITS_PER_WIDE_INT))
6407 return NULL_RTX;
6409 switch (GET_CODE (x))
6411 case PLUS:
6412 arg0 = simplify_giv_expr (loop, XEXP (x, 0), ext_val, benefit);
6413 arg1 = simplify_giv_expr (loop, XEXP (x, 1), ext_val, benefit);
6414 if (arg0 == 0 || arg1 == 0)
6415 return NULL_RTX;
6417 /* Put constant last, CONST_INT last if both constant. */
6418 if ((GET_CODE (arg0) == USE
6419 || GET_CODE (arg0) == CONST_INT)
6420 && ! ((GET_CODE (arg0) == USE
6421 && GET_CODE (arg1) == USE)
6422 || GET_CODE (arg1) == CONST_INT))
6423 tem = arg0, arg0 = arg1, arg1 = tem;
6425 /* Handle addition of zero, then addition of an invariant. */
6426 if (arg1 == const0_rtx)
6427 return arg0;
6428 else if (GET_CODE (arg1) == CONST_INT || GET_CODE (arg1) == USE)
6429 switch (GET_CODE (arg0))
6431 case CONST_INT:
6432 case USE:
6433 /* Adding two invariants must result in an invariant, so enclose the
6434 addition operation inside a USE and return it. */
6435 if (GET_CODE (arg0) == USE)
6436 arg0 = XEXP (arg0, 0);
6437 if (GET_CODE (arg1) == USE)
6438 arg1 = XEXP (arg1, 0);
6440 if (GET_CODE (arg0) == CONST_INT)
6441 tem = arg0, arg0 = arg1, arg1 = tem;
6442 if (GET_CODE (arg1) == CONST_INT)
6443 tem = sge_plus_constant (arg0, arg1);
6444 else
6445 tem = sge_plus (mode, arg0, arg1);
6447 if (GET_CODE (tem) != CONST_INT)
6448 tem = gen_rtx_USE (mode, tem);
6449 return tem;
6451 case REG:
6452 case MULT:
6453 /* biv + invar or mult + invar. Return sum. */
6454 return gen_rtx_PLUS (mode, arg0, arg1);
6456 case PLUS:
6457 /* (a + invar_1) + invar_2. Associate. */
6458 return
6459 simplify_giv_expr (loop,
6460 gen_rtx_PLUS (mode,
6461 XEXP (arg0, 0),
6462 gen_rtx_PLUS (mode,
6463 XEXP (arg0, 1),
6464 arg1)),
6465 ext_val, benefit);
6467 default:
6468 abort ();
6471 /* Each argument must be either REG, PLUS, or MULT. Convert REG to
6472 MULT to reduce cases. */
6473 if (GET_CODE (arg0) == REG)
6474 arg0 = gen_rtx_MULT (mode, arg0, const1_rtx);
6475 if (GET_CODE (arg1) == REG)
6476 arg1 = gen_rtx_MULT (mode, arg1, const1_rtx);
6478 /* Now have PLUS + PLUS, PLUS + MULT, MULT + PLUS, or MULT + MULT.
6479 Put a MULT first, leaving PLUS + PLUS, MULT + PLUS, or MULT + MULT.
6480 Recurse to associate the second PLUS. */
6481 if (GET_CODE (arg1) == MULT)
6482 tem = arg0, arg0 = arg1, arg1 = tem;
6484 if (GET_CODE (arg1) == PLUS)
6485 return
6486 simplify_giv_expr (loop,
6487 gen_rtx_PLUS (mode,
6488 gen_rtx_PLUS (mode, arg0,
6489 XEXP (arg1, 0)),
6490 XEXP (arg1, 1)),
6491 ext_val, benefit);
6493 /* Now must have MULT + MULT. Distribute if same biv, else not giv. */
6494 if (GET_CODE (arg0) != MULT || GET_CODE (arg1) != MULT)
6495 return NULL_RTX;
6497 if (!rtx_equal_p (arg0, arg1))
6498 return NULL_RTX;
6500 return simplify_giv_expr (loop,
6501 gen_rtx_MULT (mode,
6502 XEXP (arg0, 0),
6503 gen_rtx_PLUS (mode,
6504 XEXP (arg0, 1),
6505 XEXP (arg1, 1))),
6506 ext_val, benefit);
6508 case MINUS:
6509 /* Handle "a - b" as "a + b * (-1)". */
6510 return simplify_giv_expr (loop,
6511 gen_rtx_PLUS (mode,
6512 XEXP (x, 0),
6513 gen_rtx_MULT (mode,
6514 XEXP (x, 1),
6515 constm1_rtx)),
6516 ext_val, benefit);
6518 case MULT:
6519 arg0 = simplify_giv_expr (loop, XEXP (x, 0), ext_val, benefit);
6520 arg1 = simplify_giv_expr (loop, XEXP (x, 1), ext_val, benefit);
6521 if (arg0 == 0 || arg1 == 0)
6522 return NULL_RTX;
6524 /* Put constant last, CONST_INT last if both constant. */
6525 if ((GET_CODE (arg0) == USE || GET_CODE (arg0) == CONST_INT)
6526 && GET_CODE (arg1) != CONST_INT)
6527 tem = arg0, arg0 = arg1, arg1 = tem;
6529 /* If second argument is not now constant, not giv. */
6530 if (GET_CODE (arg1) != USE && GET_CODE (arg1) != CONST_INT)
6531 return NULL_RTX;
6533 /* Handle multiply by 0 or 1. */
6534 if (arg1 == const0_rtx)
6535 return const0_rtx;
6537 else if (arg1 == const1_rtx)
6538 return arg0;
6540 switch (GET_CODE (arg0))
6542 case REG:
6543 /* biv * invar. Done. */
6544 return gen_rtx_MULT (mode, arg0, arg1);
6546 case CONST_INT:
6547 /* Product of two constants. */
6548 return GEN_INT (INTVAL (arg0) * INTVAL (arg1));
6550 case USE:
6551 /* invar * invar is a giv, but attempt to simplify it somehow. */
6552 if (GET_CODE (arg1) != CONST_INT)
6553 return NULL_RTX;
6555 arg0 = XEXP (arg0, 0);
6556 if (GET_CODE (arg0) == MULT)
6558 /* (invar_0 * invar_1) * invar_2. Associate. */
6559 return simplify_giv_expr (loop,
6560 gen_rtx_MULT (mode,
6561 XEXP (arg0, 0),
6562 gen_rtx_MULT (mode,
6563 XEXP (arg0, 1),
6565 arg1)),
6566 ext_val, benefit);
6568 /* Propagate the MULT expressions to the innermost nodes. */
6569 else if (GET_CODE (arg0) == PLUS)
6571 /* (invar_0 + invar_1) * invar_2. Distribute. */
6572 return simplify_giv_expr (loop,
6573 gen_rtx_PLUS (mode,
6574 gen_rtx_MULT (mode,
6575 XEXP (arg0, 0),
6577 arg1),
6578 gen_rtx_MULT (mode,
6579 XEXP (arg0, 1),
6581 arg1)),
6582 ext_val, benefit);
6584 return gen_rtx_USE (mode, gen_rtx_MULT (mode, arg0, arg1));
6586 case MULT:
6587 /* (a * invar_1) * invar_2. Associate. */
6588 return simplify_giv_expr (loop,
6589 gen_rtx_MULT (mode,
6590 XEXP (arg0, 0),
6591 gen_rtx_MULT (mode,
6592 XEXP (arg0, 1),
6593 arg1)),
6594 ext_val, benefit);
6596 case PLUS:
6597 /* (a + invar_1) * invar_2. Distribute. */
6598 return simplify_giv_expr (loop,
6599 gen_rtx_PLUS (mode,
6600 gen_rtx_MULT (mode,
6601 XEXP (arg0, 0),
6602 arg1),
6603 gen_rtx_MULT (mode,
6604 XEXP (arg0, 1),
6605 arg1)),
6606 ext_val, benefit);
6608 default:
6609 abort ();
6612 case ASHIFT:
6613 /* Shift by constant is multiply by power of two. */
6614 if (GET_CODE (XEXP (x, 1)) != CONST_INT)
6615 return 0;
6617 return
6618 simplify_giv_expr (loop,
6619 gen_rtx_MULT (mode,
6620 XEXP (x, 0),
6621 GEN_INT ((HOST_WIDE_INT) 1
6622 << INTVAL (XEXP (x, 1)))),
6623 ext_val, benefit);
6625 case NEG:
6626 /* "-a" is "a * (-1)" */
6627 return simplify_giv_expr (loop,
6628 gen_rtx_MULT (mode, XEXP (x, 0), constm1_rtx),
6629 ext_val, benefit);
6631 case NOT:
6632 /* "~a" is "-a - 1". Silly, but easy. */
6633 return simplify_giv_expr (loop,
6634 gen_rtx_MINUS (mode,
6635 gen_rtx_NEG (mode, XEXP (x, 0)),
6636 const1_rtx),
6637 ext_val, benefit);
6639 case USE:
6640 /* Already in proper form for invariant. */
6641 return x;
6643 case SIGN_EXTEND:
6644 case ZERO_EXTEND:
6645 case TRUNCATE:
6646 /* Conditionally recognize extensions of simple IVs. After we've
6647 computed loop traversal counts and verified the range of the
6648 source IV, we'll reevaluate this as a GIV. */
6649 if (*ext_val == NULL_RTX)
6651 arg0 = simplify_giv_expr (loop, XEXP (x, 0), ext_val, benefit);
6652 if (arg0 && *ext_val == NULL_RTX && GET_CODE (arg0) == REG)
6654 *ext_val = gen_rtx_fmt_e (GET_CODE (x), mode, arg0);
6655 return arg0;
6658 goto do_default;
6660 case REG:
6661 /* If this is a new register, we can't deal with it. */
6662 if (REGNO (x) >= max_reg_before_loop)
6663 return 0;
6665 /* Check for biv or giv. */
6666 switch (REG_IV_TYPE (ivs, REGNO (x)))
6668 case BASIC_INDUCT:
6669 return x;
6670 case GENERAL_INDUCT:
6672 struct induction *v = REG_IV_INFO (ivs, REGNO (x));
6674 /* Form expression from giv and add benefit. Ensure this giv
6675 can derive another and subtract any needed adjustment if so. */
6677 /* Increasing the benefit here is risky. The only case in which it
6678 is arguably correct is if this is the only use of V. In other
6679 cases, this will artificially inflate the benefit of the current
6680 giv, and lead to suboptimal code. Thus, it is disabled, since
6681 potentially not reducing an only marginally beneficial giv is
6682 less harmful than reducing many givs that are not really
6683 beneficial. */
6685 rtx single_use = regs->array[REGNO (x)].single_usage;
6686 if (single_use && single_use != const0_rtx)
6687 *benefit += v->benefit;
6690 if (v->cant_derive)
6691 return 0;
6693 tem = gen_rtx_PLUS (mode, gen_rtx_MULT (mode,
6694 v->src_reg, v->mult_val),
6695 v->add_val);
6697 if (v->derive_adjustment)
6698 tem = gen_rtx_MINUS (mode, tem, v->derive_adjustment);
6699 arg0 = simplify_giv_expr (loop, tem, ext_val, benefit);
6700 if (*ext_val)
6702 if (!v->ext_dependent)
6703 return arg0;
6705 else
6707 *ext_val = v->ext_dependent;
6708 return arg0;
6710 return 0;
6713 default:
6714 do_default:
6715 /* If it isn't an induction variable, and it is invariant, we
6716 may be able to simplify things further by looking through
6717 the bits we just moved outside the loop. */
6718 if (loop_invariant_p (loop, x) == 1)
6720 struct movable *m;
6721 struct loop_movables *movables = LOOP_MOVABLES (loop);
6723 for (m = movables->head; m; m = m->next)
6724 if (rtx_equal_p (x, m->set_dest))
6726 /* Ok, we found a match. Substitute and simplify. */
6728 /* If we match another movable, we must use that, as
6729 this one is going away. */
6730 if (m->match)
6731 return simplify_giv_expr (loop, m->match->set_dest,
6732 ext_val, benefit);
6734 /* If consec is non-zero, this is a member of a group of
6735 instructions that were moved together. We handle this
6736 case only to the point of seeking to the last insn and
6737 looking for a REG_EQUAL. Fail if we don't find one. */
6738 if (m->consec != 0)
6740 int i = m->consec;
6741 tem = m->insn;
6743 do
6744 tem = NEXT_INSN (tem);
6746 while (--i > 0);
6748 tem = find_reg_note (tem, REG_EQUAL, NULL_RTX);
6749 if (tem)
6750 tem = XEXP (tem, 0);
6752 else
6754 tem = single_set (m->insn);
6755 if (tem)
6756 tem = SET_SRC (tem);
6759 if (tem)
6761 /* What we are most interested in is pointer
6762 arithmetic on invariants -- only take
6763 patterns we may be able to do something with. */
6764 if (GET_CODE (tem) == PLUS
6765 || GET_CODE (tem) == MULT
6766 || GET_CODE (tem) == ASHIFT
6767 || GET_CODE (tem) == CONST_INT
6768 || GET_CODE (tem) == SYMBOL_REF)
6770 tem = simplify_giv_expr (loop, tem, ext_val,
6771 benefit);
6772 if (tem)
6773 return tem;
6775 else if (GET_CODE (tem) == CONST
6776 && GET_CODE (XEXP (tem, 0)) == PLUS
6777 && GET_CODE (XEXP (XEXP (tem, 0), 0)) == SYMBOL_REF
6778 && GET_CODE (XEXP (XEXP (tem, 0), 1)) == CONST_INT)
6780 tem = simplify_giv_expr (loop, XEXP (tem, 0),
6781 ext_val, benefit);
6782 if (tem)
6783 return tem;
6786 break;
6789 break;
6792 /* Fall through to general case. */
6793 default:
6794 /* If invariant, return as USE (unless CONST_INT).
6795 Otherwise, not giv. */
6796 if (GET_CODE (x) == USE)
6797 x = XEXP (x, 0);
6799 if (loop_invariant_p (loop, x) == 1)
6801 if (GET_CODE (x) == CONST_INT)
6802 return x;
6803 if (GET_CODE (x) == CONST
6804 && GET_CODE (XEXP (x, 0)) == PLUS
6805 && GET_CODE (XEXP (XEXP (x, 0), 0)) == SYMBOL_REF
6806 && GET_CODE (XEXP (XEXP (x, 0), 1)) == CONST_INT)
6807 x = XEXP (x, 0);
6808 return gen_rtx_USE (mode, x);
6810 else
6811 return 0;
6815 /* This routine folds invariants such that there is only ever one
6816 CONST_INT in the summation. It is only used by simplify_giv_expr. */
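/* E.g. (illustration only):

       sge_plus_constant ((plus sym (const_int 4)), (const_int 3))
         ==> (plus sym (const_int 7))

   so at most one CONST_INT survives in the summation.  */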
6818 static rtx
6819 sge_plus_constant (x, c)
6820 rtx x, c;
6822 if (GET_CODE (x) == CONST_INT)
6823 return GEN_INT (INTVAL (x) + INTVAL (c));
6824 else if (GET_CODE (x) != PLUS)
6825 return gen_rtx_PLUS (GET_MODE (x), x, c);
6826 else if (GET_CODE (XEXP (x, 1)) == CONST_INT)
6828 return gen_rtx_PLUS (GET_MODE (x), XEXP (x, 0),
6829 GEN_INT (INTVAL (XEXP (x, 1)) + INTVAL (c)));
6831 else if (GET_CODE (XEXP (x, 0)) == PLUS
6832 || GET_CODE (XEXP (x, 1)) != PLUS)
6834 return gen_rtx_PLUS (GET_MODE (x),
6835 sge_plus_constant (XEXP (x, 0), c), XEXP (x, 1));
6837 else
6839 return gen_rtx_PLUS (GET_MODE (x),
6840 sge_plus_constant (XEXP (x, 1), c), XEXP (x, 0));
6844 static rtx
6845 sge_plus (mode, x, y)
6846 enum machine_mode mode;
6847 rtx x, y;
6849 while (GET_CODE (y) == PLUS)
6851 rtx a = XEXP (y, 0);
6852 if (GET_CODE (a) == CONST_INT)
6853 x = sge_plus_constant (x, a);
6854 else
6855 x = gen_rtx_PLUS (mode, x, a);
6856 y = XEXP (y, 1);
6858 if (GET_CODE (y) == CONST_INT)
6859 x = sge_plus_constant (x, y);
6860 else
6861 x = gen_rtx_PLUS (mode, x, y);
6862 return x;
6865 /* Help detect a giv that is calculated by several consecutive insns;
6866 for example,
6867 giv = biv * M
6868 giv = giv + A
6869 The caller has already identified the first insn P as having a giv as dest;
6870 we check that all other insns that set the same register follow
6871 immediately after P, that they alter nothing else,
6872 and that the result of the last is still a giv.
6874 The value is 0 if the reg set in P is not really a giv.
6875 Otherwise, the value is the amount gained by eliminating
6876 all the consecutive insns that compute the value.
6878 FIRST_BENEFIT is the amount gained by eliminating the first insn, P.
6879 SRC_REG is the reg of the biv; DEST_REG is the reg of the giv.
6881 The coefficients of the ultimate giv value are stored in
6882 *MULT_VAL and *ADD_VAL. */
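/* A hypothetical instance of the pattern handled here:

       giv = biv * 3      <- P, already identified by the caller
       giv = giv + 4      <- must follow immediately

   The ultimate coefficients are *MULT_VAL == 3 and *ADD_VAL == 4, and
   the returned benefit covers both insns.  */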
6884 static int
6885 consec_sets_giv (loop, first_benefit, p, src_reg, dest_reg,
6886 add_val, mult_val, ext_val, last_consec_insn)
6887 const struct loop *loop;
6888 int first_benefit;
6889 rtx p;
6890 rtx src_reg;
6891 rtx dest_reg;
6892 rtx *add_val;
6893 rtx *mult_val;
6894 rtx *ext_val;
6895 rtx *last_consec_insn;
6897 struct loop_ivs *ivs = LOOP_IVS (loop);
6898 struct loop_regs *regs = LOOP_REGS (loop);
6899 int count;
6900 enum rtx_code code;
6901 int benefit;
6902 rtx temp;
6903 rtx set;
6905 /* Indicate that this is a giv so that we can update the value produced in
6906 each insn of the multi-insn sequence.
6908 This induction structure will be used only by the call to
6909 general_induction_var below, so we can allocate it on our stack.
6910 If this is a giv, our caller will replace the induct var entry with
6911 a new induction structure. */
6912 struct induction *v;
6914 if (REG_IV_TYPE (ivs, REGNO (dest_reg)) != UNKNOWN_INDUCT)
6915 return 0;
6917 v = (struct induction *) alloca (sizeof (struct induction));
6918 v->src_reg = src_reg;
6919 v->mult_val = *mult_val;
6920 v->add_val = *add_val;
6921 v->benefit = first_benefit;
6922 v->cant_derive = 0;
6923 v->derive_adjustment = 0;
6924 v->ext_dependent = NULL_RTX;
6926 REG_IV_TYPE (ivs, REGNO (dest_reg)) = GENERAL_INDUCT;
6927 REG_IV_INFO (ivs, REGNO (dest_reg)) = v;
6929 count = regs->array[REGNO (dest_reg)].n_times_set - 1;
6931 while (count > 0)
6933 p = NEXT_INSN (p);
6934 code = GET_CODE (p);
6936 /* If libcall, skip to end of call sequence. */
6937 if (code == INSN && (temp = find_reg_note (p, REG_LIBCALL, NULL_RTX)))
6938 p = XEXP (temp, 0);
6940 if (code == INSN
6941 && (set = single_set (p))
6942 && GET_CODE (SET_DEST (set)) == REG
6943 && SET_DEST (set) == dest_reg
6944 && (general_induction_var (loop, SET_SRC (set), &src_reg,
6945 add_val, mult_val, ext_val, 0,
6946 &benefit, VOIDmode)
6947 /* Giv created by equivalent expression. */
6948 || ((temp = find_reg_note (p, REG_EQUAL, NULL_RTX))
6949 && general_induction_var (loop, XEXP (temp, 0), &src_reg,
6950 add_val, mult_val, ext_val, 0,
6951 &benefit, VOIDmode)))
6952 && src_reg == v->src_reg)
6954 if (find_reg_note (p, REG_RETVAL, NULL_RTX))
6955 benefit += libcall_benefit (p);
6957 count--;
6958 v->mult_val = *mult_val;
6959 v->add_val = *add_val;
6960 v->benefit += benefit;
6962 else if (code != NOTE)
6964 /* Allow insns that set something other than this giv to a
6965 constant. Such insns are needed on machines which cannot
6966 include long constants and should not disqualify a giv. */
6967 if (code == INSN
6968 && (set = single_set (p))
6969 && SET_DEST (set) != dest_reg
6970 && CONSTANT_P (SET_SRC (set)))
6971 continue;
6973 REG_IV_TYPE (ivs, REGNO (dest_reg)) = UNKNOWN_INDUCT;
6974 return 0;
6978 REG_IV_TYPE (ivs, REGNO (dest_reg)) = UNKNOWN_INDUCT;
6979 *last_consec_insn = p;
6980 return v->benefit;
6983 /* Return an rtx, if any, that expresses giv G2 as a function of the register
6984 represented by G1. If no such expression can be found, or it is clear that
6985 it cannot possibly be a valid address, 0 is returned.
6987 To perform the computation, we note that
6988 G1 = x * v + a and
6989 G2 = y * v + b
6990 where `v' is the biv.
6992 So G2 = (y/x) * G1 + (b - a*y/x).
6994 Note that MULT = y/x.
6996 Update: A and B are now allowed to be additive expressions such that
6997 B contains all variables in A. That is, computing B-A will not require
6998 subtracting variables. */
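/* A worked (made-up) instance: with G1 = 2 * v + 3 and G2 = 6 * v + 10,
   MULT = 6/2 = 3 and G2 = 3 * G1 + (10 - 3 * 3) = 3 * G1 + 1.  */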
7000 static rtx
7001 express_from_1 (a, b, mult)
7002 rtx a, b, mult;
7004 /* If MULT is zero, then A*MULT is zero, and our expression is B. */
7006 if (mult == const0_rtx)
7007 return b;
7009 /* If MULT is not 1, we cannot handle A with non-constants, since we
7010 would then be required to subtract multiples of the registers in A.
7011 This is theoretically possible, and may even apply to some Fortran
7012 constructs, but it is a lot of work and we do not attempt it here. */
7014 if (mult != const1_rtx && GET_CODE (a) != CONST_INT)
7015 return NULL_RTX;
7017 /* In general these structures are sorted top to bottom (down the PLUS
7018 chain), but not left to right across the PLUS. If B is a higher
7019 order giv than A, we can strip one level and recurse. If A is higher
7020 order, we'll eventually bail out, but won't know that until the end.
7021 If they are the same, we'll strip one level around this loop. */
7023 while (GET_CODE (a) == PLUS && GET_CODE (b) == PLUS)
7025 rtx ra, rb, oa, ob, tmp;
7027 ra = XEXP (a, 0), oa = XEXP (a, 1);
7028 if (GET_CODE (ra) == PLUS)
7029 tmp = ra, ra = oa, oa = tmp;
7031 rb = XEXP (b, 0), ob = XEXP (b, 1);
7032 if (GET_CODE (rb) == PLUS)
7033 tmp = rb, rb = ob, ob = tmp;
7035 if (rtx_equal_p (ra, rb))
7036 /* We matched: remove one reg completely. */
7037 a = oa, b = ob;
7038 else if (GET_CODE (ob) != PLUS && rtx_equal_p (ra, ob))
7039 /* An alternate match. */
7040 a = oa, b = rb;
7041 else if (GET_CODE (oa) != PLUS && rtx_equal_p (oa, rb))
7042 /* An alternate match. */
7043 a = ra, b = ob;
7044 else
7046 /* Indicates an extra register in B. Strip one level from B and
7047 recurse, hoping B was the higher order expression. */
7048 ob = express_from_1 (a, ob, mult);
7049 if (ob == NULL_RTX)
7050 return NULL_RTX;
7051 return gen_rtx_PLUS (GET_MODE (b), rb, ob);
7055 /* Here we are at the last level of A, go through the cases hoping to
7056 get rid of everything but a constant. */
7058 if (GET_CODE (a) == PLUS)
7060 rtx ra, oa;
7062 ra = XEXP (a, 0), oa = XEXP (a, 1);
7063 if (rtx_equal_p (oa, b))
7064 oa = ra;
7065 else if (!rtx_equal_p (ra, b))
7066 return NULL_RTX;
7068 if (GET_CODE (oa) != CONST_INT)
7069 return NULL_RTX;
7071 return GEN_INT (-INTVAL (oa) * INTVAL (mult));
7073 else if (GET_CODE (a) == CONST_INT)
7075 return plus_constant (b, -INTVAL (a) * INTVAL (mult));
7077 else if (CONSTANT_P (a))
7079 enum machine_mode mode_a = GET_MODE (a);
7080 enum machine_mode mode_b = GET_MODE (b);
7081 enum machine_mode mode = mode_b == VOIDmode ? mode_a : mode_b;
7082 return simplify_gen_binary (MINUS, mode, b, a);
7084 else if (GET_CODE (b) == PLUS)
7086 if (rtx_equal_p (a, XEXP (b, 0)))
7087 return XEXP (b, 1);
7088 else if (rtx_equal_p (a, XEXP (b, 1)))
7089 return XEXP (b, 0);
7090 else
7091 return NULL_RTX;
7093 else if (rtx_equal_p (a, b))
7094 return const0_rtx;
7096 return NULL_RTX;
7099 rtx
7100 express_from (g1, g2)
7101 struct induction *g1, *g2;
7103 rtx mult, add;
7105 /* The value that G1 will be multiplied by must be a constant integer. Also,
7106 the only chance we have of getting a valid address is if y/x (see above
7107 for notation) is also an integer. */
7108 if (GET_CODE (g1->mult_val) == CONST_INT
7109 && GET_CODE (g2->mult_val) == CONST_INT)
7111 if (g1->mult_val == const0_rtx
7112 || INTVAL (g2->mult_val) % INTVAL (g1->mult_val) != 0)
7113 return NULL_RTX;
7114 mult = GEN_INT (INTVAL (g2->mult_val) / INTVAL (g1->mult_val));
7116 else if (rtx_equal_p (g1->mult_val, g2->mult_val))
7117 mult = const1_rtx;
7118 else
7120 /* ??? Find out if one is a multiple of the other? */
7121 return NULL_RTX;
7124 add = express_from_1 (g1->add_val, g2->add_val, mult);
7125 if (add == NULL_RTX)
7127 /* Failed. If we've got a multiplication factor between G1 and G2,
7128 scale G1's addend and try again. */
7129 if (INTVAL (mult) > 1)
7131 rtx g1_add_val = g1->add_val;
7132 if (GET_CODE (g1_add_val) == MULT
7133 && GET_CODE (XEXP (g1_add_val, 1)) == CONST_INT)
7135 HOST_WIDE_INT m;
7136 m = INTVAL (mult) * INTVAL (XEXP (g1_add_val, 1));
7137 g1_add_val = gen_rtx_MULT (GET_MODE (g1_add_val),
7138 XEXP (g1_add_val, 0), GEN_INT (m));
7140 else
7142 g1_add_val = gen_rtx_MULT (GET_MODE (g1_add_val), g1_add_val,
7143 mult);
7146 add = express_from_1 (g1_add_val, g2->add_val, const1_rtx);
7149 if (add == NULL_RTX)
7150 return NULL_RTX;
7152 /* Form simplified final result. */
7153 if (mult == const0_rtx)
7154 return add;
7155 else if (mult == const1_rtx)
7156 mult = g1->dest_reg;
7157 else
7158 mult = gen_rtx_MULT (g2->mode, g1->dest_reg, mult);
7160 if (add == const0_rtx)
7161 return mult;
7162 else
7164 if (GET_CODE (add) == PLUS
7165 && CONSTANT_P (XEXP (add, 1)))
7167 rtx tem = XEXP (add, 1);
7168 mult = gen_rtx_PLUS (g2->mode, mult, XEXP (add, 0));
7169 add = tem;
7172 return gen_rtx_PLUS (g2->mode, mult, add);
7176 /* Return an rtx, if any, that expresses giv G2 as a function of the register
7177 represented by G1. This indicates that G2 should be combined with G1 and
7178 that G2 can use (either directly or via an address expression) a register
7179 used to represent G1. */
7181 static rtx
7182 combine_givs_p (g1, g2)
7183 struct induction *g1, *g2;
7185 rtx comb, ret;
7187 /* With the introduction of ext dependent givs, we must be careful about modes.
7188 G2 must not use a wider mode than G1. */
7189 if (GET_MODE_SIZE (g1->mode) < GET_MODE_SIZE (g2->mode))
7190 return NULL_RTX;
7192 ret = comb = express_from (g1, g2);
7193 if (comb == NULL_RTX)
7194 return NULL_RTX;
7195 if (g1->mode != g2->mode)
7196 ret = gen_lowpart (g2->mode, comb);
7198 /* If these givs are identical, they can be combined. We use the results
7199 of express_from because the addends are not in a canonical form, so
7200 rtx_equal_p is a weaker test. */
7201 /* But don't combine a DEST_REG giv with a DEST_ADDR giv; we want the
7202 combination to be the other way round. */
7203 if (comb == g1->dest_reg
7204 && (g1->giv_type == DEST_REG || g2->giv_type == DEST_ADDR))
7206 return ret;
7209 /* If G2 can be expressed as a function of G1 and that function is valid
7210 as an address and no more expensive than using a register for G2,
7211 the expression of G2 in terms of G1 can be used. */
7212 if (ret != NULL_RTX
7213 && g2->giv_type == DEST_ADDR
7214 && memory_address_p (GET_MODE (g2->mem), ret)
7215 /* ??? Loses, especially with -fforce-addr, where *g2->location
7216 will always be a register, and so anything more complicated
7217 gets discarded. */
7218 #if 0
7219 #ifdef ADDRESS_COST
7220 && ADDRESS_COST (tem) <= ADDRESS_COST (*g2->location)
7221 #else
7222 && rtx_cost (tem, MEM) <= rtx_cost (*g2->location, MEM)
7223 #endif
7224 #endif
7227 return ret;
7230 return NULL_RTX;
7233 /* Check each extension dependent giv in this class to see if its
7234 root biv is safe from wrapping in the interior mode, which would
7235 make the giv illegal. */
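/* An illustrative failure (not from the sources): a QImode biv running
   from 0 up through 300 wraps in the interior mode, so a giv built on
   (zero_extend:SI (reg:QI b)) would observe the wraparound and must be
   invalidated.  */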
7237 static void
7238 check_ext_dependent_givs (bl, loop_info)
7239 struct iv_class *bl;
7240 struct loop_info *loop_info;
7242 int ze_ok = 0, se_ok = 0, info_ok = 0;
7243 enum machine_mode biv_mode = GET_MODE (bl->biv->src_reg);
7244 HOST_WIDE_INT start_val;
7245 unsigned HOST_WIDE_INT u_end_val = 0;
7246 unsigned HOST_WIDE_INT u_start_val = 0;
7247 rtx incr = pc_rtx;
7248 struct induction *v;
7250 /* Make sure the iteration data is available. We must have
7251 constants in order to be certain of no overflow. */
7252 /* ??? An unknown iteration count with an increment of +-1
7253 combined with friendly exit tests against an invariant
7254 value is also amenable to optimization. Not implemented. */
7255 if (loop_info->n_iterations > 0
7256 && bl->initial_value
7257 && GET_CODE (bl->initial_value) == CONST_INT
7258 && (incr = biv_total_increment (bl))
7259 && GET_CODE (incr) == CONST_INT
7260 /* Make sure the host can represent the arithmetic. */
7261 && HOST_BITS_PER_WIDE_INT >= GET_MODE_BITSIZE (biv_mode))
7263 unsigned HOST_WIDE_INT abs_incr, total_incr;
7264 HOST_WIDE_INT s_end_val;
7265 int neg_incr;
7267 info_ok = 1;
7268 start_val = INTVAL (bl->initial_value);
7269 u_start_val = start_val;
7271 neg_incr = 0, abs_incr = INTVAL (incr);
7272 if (INTVAL (incr) < 0)
7273 neg_incr = 1, abs_incr = -abs_incr;
7274 total_incr = abs_incr * loop_info->n_iterations;
7276 /* Check for host arithmetic overflow. */
7277 if (total_incr / loop_info->n_iterations == abs_incr)
7279 unsigned HOST_WIDE_INT u_max;
7280 HOST_WIDE_INT s_max;
7282 u_end_val = start_val + (neg_incr ? -total_incr : total_incr);
7283 s_end_val = u_end_val;
7284 u_max = GET_MODE_MASK (biv_mode);
7285 s_max = u_max >> 1;
7287 /* Check zero extension of biv ok. */
7288 if (start_val >= 0
7289 /* Check for host arithmetic overflow. */
7290 && (neg_incr
7291 ? u_end_val < u_start_val
7292 : u_end_val > u_start_val)
7293 /* Check for target arithmetic overflow. */
7294 && (neg_incr
7295 ? 1 /* taken care of with host overflow */
7296 : u_end_val <= u_max))
7298 ze_ok = 1;
7301 /* Check sign extension of biv ok. */
7302 /* ??? While it is true that overflow with signed and pointer
7303 arithmetic is undefined, I fear too many programmers don't
7304 keep this fact in mind -- myself included on occasion.
7305 So we are conservative with the signed overflow optimizations. */
7306 if (start_val >= -s_max - 1
7307 /* Check for host arithmetic overflow. */
7308 && (neg_incr
7309 ? s_end_val < start_val
7310 : s_end_val > start_val)
7311 /* Check for target arithmetic overflow. */
7312 && (neg_incr
7313 ? s_end_val >= -s_max - 1
7314 : s_end_val <= s_max))
7316 se_ok = 1;
7321 /* Invalidate givs that fail the tests. */
7322 for (v = bl->giv; v; v = v->next_iv)
7323 if (v->ext_dependent)
7325 enum rtx_code code = GET_CODE (v->ext_dependent);
7326 int ok = 0;
7328 switch (code)
7330 case SIGN_EXTEND:
7331 ok = se_ok;
7332 break;
7333 case ZERO_EXTEND:
7334 ok = ze_ok;
7335 break;
7337 case TRUNCATE:
7338 /* We don't know whether this value is being used as either
7339 signed or unsigned, so to safely truncate we must satisfy
7340 both. The initial check here verifies the BIV itself;
7341 once that is successful we may check its range wrt the
7342 derived GIV. */
7343 if (se_ok && ze_ok)
7345 enum machine_mode outer_mode = GET_MODE (v->ext_dependent);
7346 unsigned HOST_WIDE_INT max = GET_MODE_MASK (outer_mode) >> 1;
7348 /* We know from the above that both endpoints are nonnegative,
7349 and that there is no wrapping. Verify that both endpoints
7350 are within the (signed) range of the outer mode. */
7351 if (u_start_val <= max && u_end_val <= max)
7352 ok = 1;
7354 break;
7356 default:
7357 abort ();
7360 if (ok)
7362 if (loop_dump_stream)
7364 fprintf (loop_dump_stream,
7365 "Verified ext dependent giv at %d of reg %d\n",
7366 INSN_UID (v->insn), bl->regno);
7369 else
7371 if (loop_dump_stream)
7373 const char *why;
7375 if (info_ok)
7376 why = "biv iteration values overflowed";
7377 else
7379 if (incr == pc_rtx)
7380 incr = biv_total_increment (bl);
7381 if (incr == const1_rtx)
7382 why = "biv iteration info incomplete; incr by 1";
7383 else
7384 why = "biv iteration info incomplete";
7387 fprintf (loop_dump_stream,
7388 "Failed ext dependent giv at %d, %s\n",
7389 INSN_UID (v->insn), why);
7391 v->ignore = 1;
7392 bl->all_reduced = 0;
7397 /* Generate a version of VALUE in a mode appropriate for initializing V. */
7399 rtx
7400 extend_value_for_giv (v, value)
7401 struct induction *v;
7402 rtx value;
7404 rtx ext_dep = v->ext_dependent;
7406 if (! ext_dep)
7407 return value;
7409 /* Recall that check_ext_dependent_givs verified that the known bounds
7410 of a biv did not overflow or wrap with respect to the extension for
7411 the giv. Therefore, constants need no additional adjustment. */
7412 if (CONSTANT_P (value) && GET_MODE (value) == VOIDmode)
7413 return value;
7415 /* Otherwise, we must adjust the value to compensate for the
7416 differing modes of the biv and the giv. */
7417 return gen_rtx_fmt_e (GET_CODE (ext_dep), GET_MODE (ext_dep), value);
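/* For example (sketch; the giv and register are hypothetical): if
   v->ext_dependent is (sign_extend:DI (reg:SI 60)), a CONST_INT
   initializer is returned unchanged, while a SImode register R comes
   back wrapped as (sign_extend:DI R), matching the mode in which the
   giv is actually used.  */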
7420 struct combine_givs_stats
7422 int giv_number;
7423 int total_benefit;
7426 static int
7427 cmp_combine_givs_stats (xp, yp)
7428 const PTR xp;
7429 const PTR yp;
7431 const struct combine_givs_stats * const x =
7432 (const struct combine_givs_stats *) xp;
7433 const struct combine_givs_stats * const y =
7434 (const struct combine_givs_stats *) yp;
7435 int d;
7436 d = y->total_benefit - x->total_benefit;
7437 /* Stabilize the sort. */
7438 if (!d)
7439 d = x->giv_number - y->giv_number;
7440 return d;
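/* E.g. (hypothetical stats) {giv 2, benefit 10}, {giv 0, benefit 10}
   and {giv 1, benefit 7} sort as giv 0, giv 2, giv 1: descending by
   benefit, with the giv number breaking ties so that qsort, which is
   not a stable sort, still yields a deterministic order.  */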
7443 /* Check all pairs of givs for iv_class BL and see if any can be combined with
7444 any other. If so, point SAME to the giv combined with and set NEW_REG to
7445 be an expression (in terms of the other giv's DEST_REG) equivalent to the
7446 giv. Also, update BENEFIT and related fields for cost/benefit analysis. */
7448 static void
7449 combine_givs (regs, bl)
7450 struct loop_regs *regs;
7451 struct iv_class *bl;
7453 /* Additional benefit to add for being combined multiple times. */
7454 const int extra_benefit = 3;
7456 struct induction *g1, *g2, **giv_array;
7457 int i, j, k, giv_count;
7458 struct combine_givs_stats *stats;
7459 rtx *can_combine;
7461 /* Count givs, because bl->giv_count is incorrect here. */
7462 giv_count = 0;
7463 for (g1 = bl->giv; g1; g1 = g1->next_iv)
7464 if (!g1->ignore)
7465 giv_count++;
7467 giv_array
7468 = (struct induction **) alloca (giv_count * sizeof (struct induction *));
7469 i = 0;
7470 for (g1 = bl->giv; g1; g1 = g1->next_iv)
7471 if (!g1->ignore)
7472 giv_array[i++] = g1;
7474 stats = (struct combine_givs_stats *) xcalloc (giv_count, sizeof (*stats));
7475 can_combine = (rtx *) xcalloc (giv_count, giv_count * sizeof (rtx));
7477 for (i = 0; i < giv_count; i++)
7479 int this_benefit;
7480 rtx single_use;
7482 g1 = giv_array[i];
7483 stats[i].giv_number = i;
7485 /* If a DEST_REG GIV is used only once, do not allow it to combine
7486 with anything, for in doing so we will gain nothing that cannot
7487 be had by simply letting the GIV with which we would have combined
7488 be reduced on its own. The loss shows up in particular with
7489 DEST_ADDR targets on hosts with reg+reg addressing, though it can
7490 be seen elsewhere as well. */
7491 if (g1->giv_type == DEST_REG
7492 && (single_use = regs->array[REGNO (g1->dest_reg)].single_usage)
7493 && single_use != const0_rtx)
7494 continue;
7496 this_benefit = g1->benefit;
7497 /* Add an additional weight for zero addends. */
7498 if (g1->no_const_addval)
7499 this_benefit += 1;
7501 for (j = 0; j < giv_count; j++)
7503 rtx this_combine;
7505 g2 = giv_array[j];
7506 if (g1 != g2
7507 && (this_combine = combine_givs_p (g1, g2)) != NULL_RTX)
7509 can_combine[i * giv_count + j] = this_combine;
7510 this_benefit += g2->benefit + extra_benefit;
7513 stats[i].total_benefit = this_benefit;
7516 /* Iterate, combining until we can't. */
7517 restart:
7518 qsort (stats, giv_count, sizeof (*stats), cmp_combine_givs_stats);
7520 if (loop_dump_stream)
7522 fprintf (loop_dump_stream, "Sorted combine statistics:\n");
7523 for (k = 0; k < giv_count; k++)
7525 g1 = giv_array[stats[k].giv_number];
7526 if (!g1->combined_with && !g1->same)
7527 fprintf (loop_dump_stream, " {%d, %d}",
7528 INSN_UID (giv_array[stats[k].giv_number]->insn),
7529 stats[k].total_benefit);
7531 putc ('\n', loop_dump_stream);
7534 for (k = 0; k < giv_count; k++)
7536 int g1_add_benefit = 0;
7538 i = stats[k].giv_number;
7539 g1 = giv_array[i];
7541 /* If it has already been combined, skip. */
7542 if (g1->combined_with || g1->same)
7543 continue;
7545 for (j = 0; j < giv_count; j++)
7547 g2 = giv_array[j];
7548 if (g1 != g2 && can_combine[i * giv_count + j]
7549 /* If it has already been combined, skip. */
7550 && ! g2->same && ! g2->combined_with)
7552 int l;
7554 g2->new_reg = can_combine[i * giv_count + j];
7555 g2->same = g1;
7556 /* For destination, we now may replace by mem expression instead
7557 of register. This changes the costs considerably, so add the
7558 compensation. */
7559 if (g2->giv_type == DEST_ADDR)
7560 g2->benefit = (g2->benefit + reg_address_cost
7561 - address_cost (g2->new_reg,
7562 GET_MODE (g2->mem)));
7563 g1->combined_with++;
7564 g1->lifetime += g2->lifetime;
7566 g1_add_benefit += g2->benefit;
7568 /* ??? The new final_[bg]iv_value code does a much better job
7569 of finding replaceable giv's, and hence this code may no
7570 longer be necessary. */
7571 if (! g2->replaceable && REG_USERVAR_P (g2->dest_reg))
7572 g1_add_benefit -= copy_cost;
7574 /* To help optimize the next set of combinations, remove
7575 this giv from the benefits of other potential mates. */
7576 for (l = 0; l < giv_count; ++l)
7578 int m = stats[l].giv_number;
7579 if (can_combine[m * giv_count + j])
7580 stats[l].total_benefit -= g2->benefit + extra_benefit;
7583 if (loop_dump_stream)
7584 fprintf (loop_dump_stream,
7585 "giv at %d combined with giv at %d; new benefit %d + %d, lifetime %d\n",
7586 INSN_UID (g2->insn), INSN_UID (g1->insn),
7587 g1->benefit, g1_add_benefit, g1->lifetime);
7591 /* To help optimize the next set of combinations, remove
7592 this giv from the benefits of other potential mates. */
7593 if (g1->combined_with)
7595 for (j = 0; j < giv_count; ++j)
7597 int m = stats[j].giv_number;
7598 if (can_combine[m * giv_count + i])
7599 stats[j].total_benefit -= g1->benefit + extra_benefit;
7602 g1->benefit += g1_add_benefit;
7604 /* We've finished with this giv, and everything it touched.
7605 Restart the combination so that proper weights for the
7606 rest of the givs are properly taken into account. */
7607 /* ??? Ideally we would compact the arrays at this point, so
7608 as to not cover old ground. But sanely compacting
7609 can_combine is tricky. */
7610 goto restart;
7614 /* Clean up. */
7615 free (stats);
7616 free (can_combine);
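/* A sketch of the intended effect (givs hypothetical): with
   g1 = 4*i and g2 = 4*i + 4 in the same loop, combine_givs_p can
   express g2 as (plus g1 4); g2->same is then set to g1, only g1 is
   reduced to a new register, and g2's uses become reg+4 addresses --
   one induction register where there would have been two.  */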
7619 /* Generate sequence for REG = B * M + A. */
7621 static rtx
7622 gen_add_mult (b, m, a, reg)
7623 rtx b; /* initial value of basic induction variable */
7624 rtx m; /* multiplicative constant */
7625 rtx a; /* additive constant */
7626 rtx reg; /* destination register */
7628 rtx seq;
7629 rtx result;
7631 start_sequence ();
7632 /* Use unsigned arithmetic. */
7633 result = expand_mult_add (b, reg, m, a, GET_MODE (reg), 1);
7634 if (reg != result)
7635 emit_move_insn (reg, result);
7636 seq = gen_sequence ();
7637 end_sequence ();
7639 return seq;
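/* For instance (illustrative; register numbers hypothetical and the
   exact insns depend on the target's rtx costs): with b = (reg:SI 60),
   m = (const_int 4), a = (const_int 8) and reg = (reg:SI 61),
   expand_mult_add would typically produce a shift/add sequence such as

       (set (reg:SI 61) (ashift (reg:SI 60) (const_int 2)))
       (set (reg:SI 61) (plus (reg:SI 61) (const_int 8)))

   rather than an actual multiply.  */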
7643 /* Update registers created in insn sequence SEQ. */
7645 static void
7646 loop_regs_update (loop, seq)
7647 const struct loop *loop ATTRIBUTE_UNUSED;
7648 rtx seq;
7650 /* Update register info for alias analysis. */
7652 if (GET_CODE (seq) == SEQUENCE)
7654 int i;
7655 for (i = 0; i < XVECLEN (seq, 0); ++i)
7657 rtx set = single_set (XVECEXP (seq, 0, i));
7658 if (set && GET_CODE (SET_DEST (set)) == REG)
7659 record_base_value (REGNO (SET_DEST (set)), SET_SRC (set), 0);
7662 else
7664 if (GET_CODE (seq) == SET
7665 && GET_CODE (SET_DEST (seq)) == REG)
7666 record_base_value (REGNO (SET_DEST (seq)), SET_SRC (seq), 0);
7671 /* EMIT code before BEFORE_BB/BEFORE_INSN to set REG = B * M + A. */
7673 void
7674 loop_iv_add_mult_emit_before (loop, b, m, a, reg, before_bb, before_insn)
7675 const struct loop *loop;
7676 rtx b; /* initial value of basic induction variable */
7677 rtx m; /* multiplicative constant */
7678 rtx a; /* additive constant */
7679 rtx reg; /* destination register */
7680 basic_block before_bb;
7681 rtx before_insn;
7683 rtx seq;
7685 if (! before_insn)
7687 loop_iv_add_mult_hoist (loop, b, m, a, reg);
7688 return;
7691 /* Use copy_rtx to prevent unexpected sharing of these rtx. */
7692 seq = gen_add_mult (copy_rtx (b), copy_rtx (m), copy_rtx (a), reg);
7694 /* Increase the lifetime of any invariants moved further in code. */
7695 update_reg_last_use (a, before_insn);
7696 update_reg_last_use (b, before_insn);
7697 update_reg_last_use (m, before_insn);
7699 loop_insn_emit_before (loop, before_bb, before_insn, seq);
7701 /* It is possible that the expansion created lots of new registers.
7702 Iterate over the sequence we just created and record them all. */
7703 loop_regs_update (loop, seq);
7707 /* Emit insns after the loop to set REG = B * M + A. */
7709 void
7710 loop_iv_add_mult_sink (loop, b, m, a, reg)
7711 const struct loop *loop;
7712 rtx b; /* initial value of basic induction variable */
7713 rtx m; /* multiplicative constant */
7714 rtx a; /* additive constant */
7715 rtx reg; /* destination register */
7717 rtx seq;
7719 /* Use copy_rtx to prevent unexpected sharing of these rtx. */
7720 seq = gen_add_mult (copy_rtx (b), copy_rtx (m), copy_rtx (a), reg);
7722 /* Increase the lifetime of any invariants moved further in code.
7723 ???? Is this really necessary? */
7724 update_reg_last_use (a, loop->sink);
7725 update_reg_last_use (b, loop->sink);
7726 update_reg_last_use (m, loop->sink);
7728 loop_insn_sink (loop, seq);
7730 /* It is possible that the expansion created lots of new registers.
7731 Iterate over the sequence we just created and record them all. */
7732 loop_regs_update (loop, seq);
7736 /* Emit insns in the loop pre-header to set REG = B * M + A. */
7738 void
7739 loop_iv_add_mult_hoist (loop, b, m, a, reg)
7740 const struct loop *loop;
7741 rtx b; /* initial value of basic induction variable */
7742 rtx m; /* multiplicative constant */
7743 rtx a; /* additive constant */
7744 rtx reg; /* destination register */
7746 rtx seq;
7748 /* Use copy_rtx to prevent unexpected sharing of these rtx. */
7749 seq = gen_add_mult (copy_rtx (b), copy_rtx (m), copy_rtx (a), reg);
7751 loop_insn_hoist (loop, seq);
7753 /* It is possible that the expansion created lots of new registers.
7754 Iterate over the sequence we just created and record them all. */
7755 loop_regs_update (loop, seq);
7760 /* Similar to gen_add_mult, but compute cost rather than generating
7761 sequence. */
7763 static int
7764 iv_add_mult_cost (b, m, a, reg)
7765 rtx b; /* initial value of basic induction variable */
7766 rtx m; /* multiplicative constant */
7767 rtx a; /* additive constant */
7768 rtx reg; /* destination register */
7770 int cost = 0;
7771 rtx last, result;
7773 start_sequence ();
7774 result = expand_mult_add (b, reg, m, a, GET_MODE (reg), 1);
7775 if (reg != result)
7776 emit_move_insn (reg, result);
7777 last = get_last_insn ();
7778 while (last)
7780 rtx t = single_set (last);
7781 if (t)
7782 cost += rtx_cost (SET_SRC (t), SET);
7783 last = PREV_INSN (last);
7785 end_sequence ();
7786 return cost;
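/* The sequence is generated only to be measured and is discarded by
   end_sequence: e.g. if the expansion above would emit a shift and an
   add, the returned cost is the sum of rtx_cost over those two
   SET_SRCs, so a caller can weigh the add-mult form against
   alternatives without emitting anything.  */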
7789 /* Test whether A * B can be computed without
7790 an actual multiply insn. Value is 1 if so. */
7792 static int
7793 product_cheap_p (a, b)
7794 rtx a;
7795 rtx b;
7797 int i;
7798 rtx tmp;
7799 int win = 1;
7801 /* If only one is constant, make it B. */
7802 if (GET_CODE (a) == CONST_INT)
7803 tmp = a, a = b, b = tmp;
7805 /* If the first is constant, both are constant, so we don't need a multiply. */
7806 if (GET_CODE (a) == CONST_INT)
7807 return 1;
7809 /* If the second is not constant, neither is, so we would need a multiply. */
7810 if (GET_CODE (b) != CONST_INT)
7811 return 0;
7813 /* One operand is constant, so we might not need a multiply insn.
7814 Generate the code for the multiply and see whether a call, a multiply
7815 insn, or a long sequence of insns is generated. */
7817 start_sequence ();
7818 expand_mult (GET_MODE (a), a, b, NULL_RTX, 1);
7819 tmp = gen_sequence ();
7820 end_sequence ();
7822 if (GET_CODE (tmp) == SEQUENCE)
7824 if (XVEC (tmp, 0) == 0)
7825 win = 1;
7826 else if (XVECLEN (tmp, 0) > 3)
7827 win = 0;
7828 else
7829 for (i = 0; i < XVECLEN (tmp, 0); i++)
7831 rtx insn = XVECEXP (tmp, 0, i);
7833 if (GET_CODE (insn) != INSN
7834 || (GET_CODE (PATTERN (insn)) == SET
7835 && GET_CODE (SET_SRC (PATTERN (insn))) == MULT)
7836 || (GET_CODE (PATTERN (insn)) == PARALLEL
7837 && GET_CODE (XVECEXP (PATTERN (insn), 0, 0)) == SET
7838 && GET_CODE (SET_SRC (XVECEXP (PATTERN (insn), 0, 0))) == MULT))
7840 win = 0;
7841 break;
7845 else if (GET_CODE (tmp) == SET
7846 && GET_CODE (SET_SRC (tmp)) == MULT)
7847 win = 0;
7848 else if (GET_CODE (tmp) == PARALLEL
7849 && GET_CODE (XVECEXP (tmp, 0, 0)) == SET
7850 && GET_CODE (SET_SRC (XVECEXP (tmp, 0, 0))) == MULT)
7851 win = 0;
7853 return win;
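/* For example, multiplying by (const_int 5) usually expands to a
   shift and an add -- two cheap insns and no MULT, so the product is
   "cheap" -- whereas a constant with no short shift/add decomposition
   (or a target without cheap shifts) yields a real MULT or a libcall,
   and 0 is returned.  The XVECLEN > 3 test is the "long sequence"
   cutoff.  */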
7856 /* Check to see if loop can be terminated by a "decrement and branch until
7857 zero" instruction. If so, add a REG_NONNEG note to the branch insn.
7858 Also try reversing an increment loop to a decrement loop
7859 to see if the optimization can be performed.
7860 Value is nonzero if optimization was performed. */
7862 /* This is useful even if the architecture doesn't have such an insn,
7863 because it might change a loop which increments from 0 to n into one
7864 which decrements from n to 0. A loop that decrements to zero is usually
7865 faster than one that increments from zero. */
7867 /* ??? This could be rewritten to use some of the loop unrolling procedures,
7868 such as approx_final_value, biv_total_increment, loop_iterations, and
7869 final_[bg]iv_value. */
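/* A source-level sketch of the transformation (illustrative only;
   the pass of course works on RTL):

       for (i = 0; i < n; i++)            i = n;
         body_not_using_i;        ==>     do { body_not_using_i; }
                                          while (--i != 0);

   The compare against N becomes a compare against zero, so a single
   decrement-and-branch instruction can implement the loop tail.  */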
7871 static int
7872 check_dbra_loop (loop, insn_count)
7873 struct loop *loop;
7874 int insn_count;
7876 struct loop_info *loop_info = LOOP_INFO (loop);
7877 struct loop_regs *regs = LOOP_REGS (loop);
7878 struct loop_ivs *ivs = LOOP_IVS (loop);
7879 struct iv_class *bl;
7880 rtx reg;
7881 rtx jump_label;
7882 rtx final_value;
7883 rtx start_value;
7884 rtx new_add_val;
7885 rtx comparison;
7886 rtx before_comparison;
7887 rtx p;
7888 rtx jump;
7889 rtx first_compare;
7890 int compare_and_branch;
7891 rtx loop_start = loop->start;
7892 rtx loop_end = loop->end;
7894 /* If last insn is a conditional branch, and the insn before tests a
7895 register value, try to optimize it. Otherwise, we can't do anything. */
7897 jump = PREV_INSN (loop_end);
7898 comparison = get_condition_for_loop (loop, jump);
7899 if (comparison == 0)
7900 return 0;
7901 if (!onlyjump_p (jump))
7902 return 0;
7904 /* Try to compute whether the compare/branch at the loop end is one or
7905 two instructions. */
7906 get_condition (jump, &first_compare);
7907 if (first_compare == jump)
7908 compare_and_branch = 1;
7909 else if (first_compare == prev_nonnote_insn (jump))
7910 compare_and_branch = 2;
7911 else
7912 return 0;
7915 /* If more than one condition is present to control the loop, then
7916 do not proceed, as this function does not know how to rewrite
7917 loop tests with more than one condition.
7919 Look backwards from the first insn in the last comparison
7920 sequence and see if we've got another comparison sequence. */
7922 rtx jump1;
7923 if ((jump1 = prev_nonnote_insn (first_compare)) != loop->cont)
7924 if (GET_CODE (jump1) == JUMP_INSN)
7925 return 0;
7928 /* Check all of the bivs to see if the compare uses one of them.
7929 Skip biv's set more than once because we can't guarantee that
7930 it will be zero on the last iteration. Also skip if the biv is
7931 used between its update and the test insn. */
7933 for (bl = ivs->list; bl; bl = bl->next)
7935 if (bl->biv_count == 1
7936 && ! bl->biv->maybe_multiple
7937 && bl->biv->dest_reg == XEXP (comparison, 0)
7938 && ! reg_used_between_p (regno_reg_rtx[bl->regno], bl->biv->insn,
7939 first_compare))
7940 break;
7943 if (! bl)
7944 return 0;
7946 /* Look for the case where the basic induction variable is always
7947 nonnegative, and equals zero on the last iteration.
7948 In this case, add a reg_note REG_NONNEG, which allows the
7949 m68k DBRA instruction to be used. */
7951 if (((GET_CODE (comparison) == GT
7952 && GET_CODE (XEXP (comparison, 1)) == CONST_INT
7953 && INTVAL (XEXP (comparison, 1)) == -1)
7954 || (GET_CODE (comparison) == NE && XEXP (comparison, 1) == const0_rtx))
7955 && GET_CODE (bl->biv->add_val) == CONST_INT
7956 && INTVAL (bl->biv->add_val) < 0)
7958 /* Initial value must be greater than 0, and
7959 init_val % -dec_value == 0, to ensure that the biv equals zero
7960 on the last iteration. */
7962 if (GET_CODE (bl->initial_value) == CONST_INT
7963 && INTVAL (bl->initial_value) > 0
7964 && (INTVAL (bl->initial_value)
7965 % (-INTVAL (bl->biv->add_val))) == 0)
7967 /* The register is always nonnegative; add a REG_NONNEG note to the branch. */
7968 if (! find_reg_note (jump, REG_NONNEG, NULL_RTX))
7969 REG_NOTES (jump)
7970 = gen_rtx_EXPR_LIST (REG_NONNEG, bl->biv->dest_reg,
7971 REG_NOTES (jump));
7972 bl->nonneg = 1;
7974 return 1;
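/* E.g. (hypothetical biv): starting at 12 and stepping by -3, the
   register passes through 12, 9, 6, 3, 0 -- since 12 % 3 == 0 it is
   nonnegative throughout and exactly zero when the test finally
   fails, which is what REG_NONNEG asserts.  Starting at 11 it would
   step past zero to -1 instead, so the initial-value test above is
   essential.  */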
7977 /* If the decrement is 1 and the value was tested as >= 0 before
7978 the loop, then we can safely optimize. */
7979 for (p = loop_start; p; p = PREV_INSN (p))
7981 if (GET_CODE (p) == CODE_LABEL)
7982 break;
7983 if (GET_CODE (p) != JUMP_INSN)
7984 continue;
7986 before_comparison = get_condition_for_loop (loop, p);
7987 if (before_comparison
7988 && XEXP (before_comparison, 0) == bl->biv->dest_reg
7989 && GET_CODE (before_comparison) == LT
7990 && XEXP (before_comparison, 1) == const0_rtx
7991 && ! reg_set_between_p (bl->biv->dest_reg, p, loop_start)
7992 && INTVAL (bl->biv->add_val) == -1)
7994 if (! find_reg_note (jump, REG_NONNEG, NULL_RTX))
7995 REG_NOTES (jump)
7996 = gen_rtx_EXPR_LIST (REG_NONNEG, bl->biv->dest_reg,
7997 REG_NOTES (jump));
7998 bl->nonneg = 1;
8000 return 1;
8004 else if (GET_CODE (bl->biv->add_val) == CONST_INT
8005 && INTVAL (bl->biv->add_val) > 0)
8007 /* Try to change the increment to a decrement, so we can apply the above optimization. */
8008 /* Can do this if:
8009 all registers modified are induction variables or invariant,
8010 all memory references have non-overlapping addresses
8011 (obviously true if only one write)
8012 allow 2 insns for the compare/jump at the end of the loop. */
8013 /* Also, we must avoid any instructions which use both the reversed
8014 biv and another biv. Such instructions will fail if the loop is
8015 reversed. We meet this condition by requiring that either
8016 no_use_except_counting is true, or else that there is only
8017 one biv. */
8018 int num_nonfixed_reads = 0;
8019 /* 1 if the iteration var is used only to count iterations. */
8020 int no_use_except_counting = 0;
8021 /* 1 if the loop has no memory store, or it has a single memory store
8022 which is reversible. */
8023 int reversible_mem_store = 1;
8025 if (bl->giv_count == 0
8026 && !loop->exit_count
8027 && !loop_info->has_multiple_exit_targets)
8029 rtx bivreg = regno_reg_rtx[bl->regno];
8030 struct iv_class *blt;
8032 /* If there are no givs for this biv, and the only exit is the
8033 fall through at the end of the loop, then
8034 see if perhaps there are no uses except to count. */
8035 no_use_except_counting = 1;
8036 for (p = loop_start; p != loop_end; p = NEXT_INSN (p))
8037 if (INSN_P (p))
8039 rtx set = single_set (p);
8041 if (set && GET_CODE (SET_DEST (set)) == REG
8042 && REGNO (SET_DEST (set)) == bl->regno)
8043 /* An insn that sets the biv is okay. */
8045 else if ((p == prev_nonnote_insn (prev_nonnote_insn (loop_end))
8046 || p == prev_nonnote_insn (loop_end))
8047 && reg_mentioned_p (bivreg, PATTERN (p)))
8049 /* If either of these insns uses the biv and sets a pseudo
8050 that has more than one usage, then the biv has uses
8051 other than counting since it's used to derive a value
8052 that is used more than one time. */
8053 note_stores (PATTERN (p), note_set_pseudo_multiple_uses,
8054 regs);
8055 if (regs->multiple_uses)
8057 no_use_except_counting = 0;
8058 break;
8061 else if (reg_mentioned_p (bivreg, PATTERN (p)))
8063 no_use_except_counting = 0;
8064 break;
8068 /* A biv has uses besides counting if it is used to set
8069 another biv. */
8070 for (blt = ivs->list; blt; blt = blt->next)
8071 if (blt->init_set
8072 && reg_mentioned_p (bivreg, SET_SRC (blt->init_set)))
8074 no_use_except_counting = 0;
8075 break;
8079 if (no_use_except_counting)
8080 /* No need to worry about MEMs. */
8082 else if (loop_info->num_mem_sets <= 1)
8084 for (p = loop_start; p != loop_end; p = NEXT_INSN (p))
8085 if (INSN_P (p))
8086 num_nonfixed_reads += count_nonfixed_reads (loop, PATTERN (p));
8088 /* If the loop has a single store, and the destination address is
8089 invariant, then we can't reverse the loop, because this address
8090 might then have the wrong value at loop exit.
8091 This would work if the source was invariant also, however, in that
8092 case, the insn should have been moved out of the loop. */
8094 if (loop_info->num_mem_sets == 1)
8096 struct induction *v;
8098 /* If we could prove that each of the memory locations
8099 written to was different, then we could reverse the
8100 store -- but we don't presently have any way of
8101 knowing that. */
8102 reversible_mem_store = 0;
8104 /* If the store depends on a register that is set after the
8105 store, it depends on the initial value, and is thus not
8106 reversible. */
8107 for (v = bl->giv; reversible_mem_store && v; v = v->next_iv)
8109 if (v->giv_type == DEST_REG
8110 && reg_mentioned_p (v->dest_reg,
8111 PATTERN (loop_info->first_loop_store_insn))
8112 && loop_insn_first_p (loop_info->first_loop_store_insn,
8113 v->insn))
8114 reversible_mem_store = 0;
8118 else
8119 return 0;
8121 /* This code only acts for innermost loops. Also it simplifies
8122 the memory address check by only reversing loops with
8123 zero or one memory access.
8124 Two memory accesses could involve parts of the same array,
8125 and that can't be reversed.
8126 If the biv is used only for counting, then we don't need to worry
8127 about all these things. */
8129 if ((num_nonfixed_reads <= 1
8130 && ! loop_info->has_nonconst_call
8131 && ! loop_info->has_volatile
8132 && reversible_mem_store
8133 && (bl->giv_count + bl->biv_count + loop_info->num_mem_sets
8134 + num_unmoved_movables (loop) + compare_and_branch == insn_count)
8135 && (bl == ivs->list && bl->next == 0))
8136 || no_use_except_counting)
8138 rtx tem;
8140 /* Loop can be reversed. */
8141 if (loop_dump_stream)
8142 fprintf (loop_dump_stream, "Can reverse loop\n");
8144 /* Now check other conditions:
8146 The increment must be a constant, as must the initial value,
8147 and the comparison code must be LT.
8149 This test can probably be improved since +/- 1 in the constant
8150 can be obtained by changing LT to LE and vice versa; this is
8151 confusing. */
8153 if (comparison
8154 /* for constants, LE gets turned into LT */
8155 && (GET_CODE (comparison) == LT
8156 || (GET_CODE (comparison) == LE
8157 && no_use_except_counting)))
8159 HOST_WIDE_INT add_val, add_adjust, comparison_val = 0;
8160 rtx initial_value, comparison_value;
8161 int nonneg = 0;
8162 enum rtx_code cmp_code;
8163 int comparison_const_width;
8164 unsigned HOST_WIDE_INT comparison_sign_mask;
8166 add_val = INTVAL (bl->biv->add_val);
8167 comparison_value = XEXP (comparison, 1);
8168 if (GET_MODE (comparison_value) == VOIDmode)
8169 comparison_const_width
8170 = GET_MODE_BITSIZE (GET_MODE (XEXP (comparison, 0)));
8171 else
8172 comparison_const_width
8173 = GET_MODE_BITSIZE (GET_MODE (comparison_value));
8174 if (comparison_const_width > HOST_BITS_PER_WIDE_INT)
8175 comparison_const_width = HOST_BITS_PER_WIDE_INT;
8176 comparison_sign_mask
8177 = (unsigned HOST_WIDE_INT) 1 << (comparison_const_width - 1);
8179 /* If the comparison value is not a loop invariant, then we
8180 cannot reverse this loop.
8182 ??? If the insns which initialize the comparison value as
8183 a whole compute an invariant result, then we could move
8184 them out of the loop and proceed with loop reversal. */
8185 if (! loop_invariant_p (loop, comparison_value))
8186 return 0;
8188 if (GET_CODE (comparison_value) == CONST_INT)
8189 comparison_val = INTVAL (comparison_value);
8190 initial_value = bl->initial_value;
8192 /* Normalize the initial value if it is an integer and
8193 has no other use except as a counter. This will allow
8194 a few more loops to be reversed. */
8195 if (no_use_except_counting
8196 && GET_CODE (comparison_value) == CONST_INT
8197 && GET_CODE (initial_value) == CONST_INT)
8199 comparison_val = comparison_val - INTVAL (bl->initial_value);
8200 /* The code below requires comparison_val to be a multiple
8201 of add_val in order to do the loop reversal, so
8202 round up comparison_val to a multiple of add_val.
8203 Since comparison_value is constant, we know that the
8204 current comparison code is LT. */
8205 comparison_val = comparison_val + add_val - 1;
8206 comparison_val
8207 -= (unsigned HOST_WIDE_INT) comparison_val % add_val;
8208 /* We postpone overflow checks for COMPARISON_VAL here;
8209 even if there is an overflow, we might still be able to
8210 reverse the loop, if converting the loop exit test to
8211 NE is possible. */
8212 initial_value = const0_rtx;
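/* Worked example of the normalization (numbers hypothetical): for
   i = 2; i < 10; i += 3, comparison_val becomes 10 - 2 = 8, which
   rounds up to 9, the next multiple of add_val; the loop is then
   treated as i' = 0; i' < 9; i' += 3 -- the same three iterations,
   but now starting at zero, which is what the vanilla reversal code
   below requires.  */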
8215 /* First check if we can do a vanilla loop reversal. */
8216 if (initial_value == const0_rtx
8217 /* If we have a decrement_and_branch_on_count,
8218 prefer the NE test, since this will allow that
8219 instruction to be generated. Note that we must
8220 use a vanilla loop reversal if the biv is used to
8221 calculate a giv or has a non-counting use. */
8222 #if ! defined (HAVE_decrement_and_branch_until_zero) \
8223 && defined (HAVE_decrement_and_branch_on_count)
8224 && (! (add_val == 1 && loop->vtop
8225 && (bl->biv_count == 0
8226 || no_use_except_counting)))
8227 #endif
8228 && GET_CODE (comparison_value) == CONST_INT
8229 /* Now do postponed overflow checks on COMPARISON_VAL. */
8230 && ! (((comparison_val - add_val) ^ INTVAL (comparison_value))
8231 & comparison_sign_mask))
8233 /* Register will always be nonnegative, with value
8234 0 on last iteration */
8235 add_adjust = add_val;
8236 nonneg = 1;
8237 cmp_code = GE;
8239 else if (add_val == 1 && loop->vtop
8240 && (bl->biv_count == 0
8241 || no_use_except_counting))
8243 add_adjust = 0;
8244 cmp_code = NE;
8246 else
8247 return 0;
8249 if (GET_CODE (comparison) == LE)
8250 add_adjust -= add_val;
8252 /* If the initial value is not zero, or if the comparison
8253 value is not an exact multiple of the increment, then we
8254 cannot reverse this loop. */
8255 if (initial_value == const0_rtx
8256 && GET_CODE (comparison_value) == CONST_INT)
8258 if (((unsigned HOST_WIDE_INT) comparison_val % add_val) != 0)
8259 return 0;
8261 else
8263 if (! no_use_except_counting || add_val != 1)
8264 return 0;
8267 final_value = comparison_value;
8269 /* Reset these in case we normalized the initial value
8270 and comparison value above. */
8271 if (GET_CODE (comparison_value) == CONST_INT
8272 && GET_CODE (initial_value) == CONST_INT)
8274 comparison_value = GEN_INT (comparison_val);
8275 final_value
8276 = GEN_INT (comparison_val + INTVAL (bl->initial_value));
8278 bl->initial_value = initial_value;
8280 /* Save some info needed to produce the new insns. */
8281 reg = bl->biv->dest_reg;
8282 jump_label = condjump_label (PREV_INSN (loop_end));
8283 new_add_val = GEN_INT (-INTVAL (bl->biv->add_val));
8285 /* Set start_value; if this is not a CONST_INT, we need
8286 to generate a SUB.
8287 Initialize biv to start_value before loop start.
8288 The old initializing insn will be deleted as a
8289 dead store by flow.c. */
8290 if (initial_value == const0_rtx
8291 && GET_CODE (comparison_value) == CONST_INT)
8293 start_value = GEN_INT (comparison_val - add_adjust);
8294 loop_insn_hoist (loop, gen_move_insn (reg, start_value));
8296 else if (GET_CODE (initial_value) == CONST_INT)
8298 enum machine_mode mode = GET_MODE (reg);
8299 rtx offset = GEN_INT (-INTVAL (initial_value) - add_adjust);
8300 rtx add_insn = gen_add3_insn (reg, comparison_value, offset);
8302 if (add_insn == 0)
8303 return 0;
8305 start_value
8306 = gen_rtx_PLUS (mode, comparison_value, offset);
8307 loop_insn_hoist (loop, add_insn);
8308 if (GET_CODE (comparison) == LE)
8309 final_value = gen_rtx_PLUS (mode, comparison_value,
8310 GEN_INT (add_val));
8312 else if (! add_adjust)
8314 enum machine_mode mode = GET_MODE (reg);
8315 rtx sub_insn = gen_sub3_insn (reg, comparison_value,
8316 initial_value);
8318 if (sub_insn == 0)
8319 return 0;
8320 start_value
8321 = gen_rtx_MINUS (mode, comparison_value, initial_value);
8322 loop_insn_hoist (loop, sub_insn);
8324 else
8325 /* We could handle the other cases too, but it'll be
8326 better to have a testcase first. */
8327 return 0;
8329 /* We may not have a single insn which can increment a reg, so
8330 create a sequence to hold all the insns from expand_inc. */
8331 start_sequence ();
8332 expand_inc (reg, new_add_val);
8333 tem = gen_sequence ();
8334 end_sequence ();
8336 p = loop_insn_emit_before (loop, 0, bl->biv->insn, tem);
8337 delete_insn (bl->biv->insn);
8339 /* Update biv info to reflect its new status. */
8340 bl->biv->insn = p;
8341 bl->initial_value = start_value;
8342 bl->biv->add_val = new_add_val;
8344 /* Update loop info. */
8345 loop_info->initial_value = reg;
8346 loop_info->initial_equiv_value = reg;
8347 loop_info->final_value = const0_rtx;
8348 loop_info->final_equiv_value = const0_rtx;
8349 loop_info->comparison_value = const0_rtx;
8350 loop_info->comparison_code = cmp_code;
8351 loop_info->increment = new_add_val;
8353 /* Inc LABEL_NUSES so that delete_insn will
8354 not delete the label. */
8355 LABEL_NUSES (XEXP (jump_label, 0))++;
8357 /* Emit an insn after the end of the loop to set the biv's
8358 proper exit value if it is used anywhere outside the loop. */
8359 if ((REGNO_LAST_UID (bl->regno) != INSN_UID (first_compare))
8360 || ! bl->init_insn
8361 || REGNO_FIRST_UID (bl->regno) != INSN_UID (bl->init_insn))
8362 loop_insn_sink (loop, gen_move_insn (reg, final_value));
8364 /* Delete compare/branch at end of loop. */
8365 delete_related_insns (PREV_INSN (loop_end));
8366 if (compare_and_branch == 2)
8367 delete_related_insns (first_compare);
8369 /* Add new compare/branch insn at end of loop. */
8370 start_sequence ();
8371 emit_cmp_and_jump_insns (reg, const0_rtx, cmp_code, NULL_RTX,
8372 GET_MODE (reg), 0,
8373 XEXP (jump_label, 0));
8374 tem = gen_sequence ();
8375 end_sequence ();
8376 emit_jump_insn_before (tem, loop_end);
8378 for (tem = PREV_INSN (loop_end);
8379 tem && GET_CODE (tem) != JUMP_INSN;
8380 tem = PREV_INSN (tem))
8383 if (tem)
8384 JUMP_LABEL (tem) = XEXP (jump_label, 0);
8386 if (nonneg)
8388 if (tem)
8390 /* Increment of LABEL_NUSES done above. */
8391 /* Register is now always nonnegative,
8392 so add REG_NONNEG note to the branch. */
8393 REG_NOTES (tem) = gen_rtx_EXPR_LIST (REG_NONNEG, reg,
8394 REG_NOTES (tem));
8396 bl->nonneg = 1;
8399 /* No insn may reference both the reversed and another biv or it
8400 will fail (see comment near the top of the loop reversal
8401 code).
8402 Earlier on, we have verified that the biv has no use except
8403 counting, or it is the only biv in this function.
8404 However, the code that computes no_use_except_counting does
8405 not verify reg notes. It's possible to have an insn that
8406 references another biv, and has a REG_EQUAL note with an
8407 expression based on the reversed biv. To avoid this case,
8408 remove all REG_EQUAL notes based on the reversed biv
8409 here. */
8410 for (p = loop_start; p != loop_end; p = NEXT_INSN (p))
8411 if (INSN_P (p))
8413 rtx *pnote;
8414 rtx set = single_set (p);
8415 /* If this is a set of a GIV based on the reversed biv, any
8416 REG_EQUAL notes should still be correct. */
8417 if (! set
8418 || GET_CODE (SET_DEST (set)) != REG
8419 || (size_t) REGNO (SET_DEST (set)) >= ivs->n_regs
8420 || REG_IV_TYPE (ivs, REGNO (SET_DEST (set))) != GENERAL_INDUCT
8421 || REG_IV_INFO (ivs, REGNO (SET_DEST (set)))->src_reg != bl->biv->src_reg)
8422 for (pnote = &REG_NOTES (p); *pnote;)
8424 if (REG_NOTE_KIND (*pnote) == REG_EQUAL
8425 && reg_mentioned_p (regno_reg_rtx[bl->regno],
8426 XEXP (*pnote, 0)))
8427 *pnote = XEXP (*pnote, 1);
8428 else
8429 pnote = &XEXP (*pnote, 1);
8433 /* Mark that this biv has been reversed. Each giv which depends
8434 on this biv, and which is also live past the end of the loop
8435 will have to be fixed up. */
8437 bl->reversed = 1;
8439 if (loop_dump_stream)
8441 fprintf (loop_dump_stream, "Reversed loop");
8442 if (bl->nonneg)
8443 fprintf (loop_dump_stream, " and added reg_nonneg\n");
8444 else
8445 fprintf (loop_dump_stream, "\n");
8448 return 1;
8453 return 0;
8456 /* Verify whether the biv BL appears to be eliminable,
8457 based on the insns in the loop that refer to it.
8459 If ELIMINATE_P is non-zero, actually do the elimination.
8461 THRESHOLD and INSN_COUNT are from loop_optimize and are used to
8462 determine whether invariant insns should be placed inside or at the
8463 start of the loop. */
8465 static int
8466 maybe_eliminate_biv (loop, bl, eliminate_p, threshold, insn_count)
8467 const struct loop *loop;
8468 struct iv_class *bl;
8469 int eliminate_p;
8470 int threshold, insn_count;
8472 struct loop_ivs *ivs = LOOP_IVS (loop);
8473 rtx reg = bl->biv->dest_reg;
8474 rtx p;
8476 /* Scan all insns in the loop, stopping if we find one that uses the
8477 biv in a way that we cannot eliminate. */
8479 for (p = loop->start; p != loop->end; p = NEXT_INSN (p))
8481 enum rtx_code code = GET_CODE (p);
8482 basic_block where_bb = 0;
8483 rtx where_insn = threshold >= insn_count ? 0 : p;
8485 /* If this is a libcall that sets a giv, skip ahead to its end. */
8486 if (GET_RTX_CLASS (code) == 'i')
8488 rtx note = find_reg_note (p, REG_LIBCALL, NULL_RTX);
8490 if (note)
8492 rtx last = XEXP (note, 0);
8493 rtx set = single_set (last);
8495 if (set && GET_CODE (SET_DEST (set)) == REG)
8497 unsigned int regno = REGNO (SET_DEST (set));
8499 if (regno < ivs->n_regs
8500 && REG_IV_TYPE (ivs, regno) == GENERAL_INDUCT
8501 && REG_IV_INFO (ivs, regno)->src_reg == bl->biv->src_reg)
8502 p = last;
8506 if ((code == INSN || code == JUMP_INSN || code == CALL_INSN)
8507 && reg_mentioned_p (reg, PATTERN (p))
8508 && ! maybe_eliminate_biv_1 (loop, PATTERN (p), p, bl,
8509 eliminate_p, where_bb, where_insn))
8511 if (loop_dump_stream)
8512 fprintf (loop_dump_stream,
8513 "Cannot eliminate biv %d: biv used in insn %d.\n",
8514 bl->regno, INSN_UID (p));
8515 break;
8519 if (p == loop->end)
8521 if (loop_dump_stream)
8522 fprintf (loop_dump_stream, "biv %d %s eliminated.\n",
8523 bl->regno, eliminate_p ? "was" : "can be");
8524 return 1;
8527 return 0;
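/* Typical win (illustrative): when the only remaining use of a biv I
   is an exit test such as I < N, and some giv G = I * c + base was
   strength-reduced, the test can be rewritten in terms of G (compare
   G against N * c + base) so that I need never be computed at all.
   maybe_eliminate_biv_1 below attempts such rewrites pattern by
   pattern, refusing conservatively where overflow could change the
   comparison's result.  */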
8530 /* INSN and REFERENCE are instructions in the same insn chain.
8531 Return non-zero if INSN is first. */
8533 int
8534 loop_insn_first_p (insn, reference)
8535 rtx insn, reference;
8537 rtx p, q;
8539 for (p = insn, q = reference;;)
8541 /* Start with the test for "not first", so that INSN == REFERENCE
8542 yields not first. */
8543 if (q == insn || ! p)
8544 return 0;
8545 if (p == reference || ! q)
8546 return 1;
8548 /* Either of P or Q might be a NOTE. Notes have the same LUID as the
8549 previous insn, hence the <= comparison below does not work if
8550 P is a note. */
8551 if (INSN_UID (p) < max_uid_for_loop
8552 && INSN_UID (q) < max_uid_for_loop
8553 && GET_CODE (p) != NOTE)
8554 return INSN_LUID (p) <= INSN_LUID (q);
8556 if (INSN_UID (p) >= max_uid_for_loop
8557 || GET_CODE (p) == NOTE)
8558 p = NEXT_INSN (p);
8559 if (INSN_UID (q) >= max_uid_for_loop)
8560 q = NEXT_INSN (q);
8564 /* We are trying to eliminate BIV in INSN using GIV. Return non-zero if
8565 the offset that we have to take into account due to auto-increment /
8566 giv derivation is zero. */
8567 static int
8568 biv_elimination_giv_has_0_offset (biv, giv, insn)
8569 struct induction *biv, *giv;
8570 rtx insn;
8572 /* If the giv V had the auto-inc address optimization applied
8573 to it, and INSN occurs between the giv insn and the biv
8574 insn, then we'd have to adjust the value used here.
8575 This is rare, so we don't bother to make this possible. */
8576 if (giv->auto_inc_opt
8577 && ((loop_insn_first_p (giv->insn, insn)
8578 && loop_insn_first_p (insn, biv->insn))
8579 || (loop_insn_first_p (biv->insn, insn)
8580 && loop_insn_first_p (insn, giv->insn))))
8581 return 0;
8583 return 1;
8586 /* If BL appears in X (part of the pattern of INSN), see if we can
8587 eliminate its use. If so, return 1. If not, return 0.
8589 If BIV does not appear in X, return 1.
8591 If ELIMINATE_P is non-zero, actually do the elimination.
8592 WHERE_INSN/WHERE_BB indicate where extra insns should be added.
8593 Depending on how many items have been moved out of the loop, it
8594 will either be before INSN (when WHERE_INSN is non-zero) or at the
8595 start of the loop (when WHERE_INSN is zero). */
8597 static int
8598 maybe_eliminate_biv_1 (loop, x, insn, bl, eliminate_p, where_bb, where_insn)
8599 const struct loop *loop;
8600 rtx x, insn;
8601 struct iv_class *bl;
8602 int eliminate_p;
8603 basic_block where_bb;
8604 rtx where_insn;
8606 enum rtx_code code = GET_CODE (x);
8607 rtx reg = bl->biv->dest_reg;
8608 enum machine_mode mode = GET_MODE (reg);
8609 struct induction *v;
8610 rtx arg, tem;
8611 #ifdef HAVE_cc0
8612 rtx new;
8613 #endif
8614 int arg_operand;
8615 const char *fmt;
8616 int i, j;
8618 switch (code)
8620 case REG:
8621 /* If we haven't already been able to do something with this BIV,
8622 we can't eliminate it. */
8623 if (x == reg)
8624 return 0;
8625 return 1;
8627 case SET:
8628 /* If this sets the BIV, it is not a problem. */
8629 if (SET_DEST (x) == reg)
8630 return 1;
8632 /* If this is an insn that defines a giv, it is also ok because
8633 it will go away when the giv is reduced. */
8634 for (v = bl->giv; v; v = v->next_iv)
8635 if (v->giv_type == DEST_REG && SET_DEST (x) == v->dest_reg)
8636 return 1;
8638 #ifdef HAVE_cc0
8639 if (SET_DEST (x) == cc0_rtx && SET_SRC (x) == reg)
8641 /* Can replace with any giv that was reduced and
8642 that has (MULT_VAL != 0) and (ADD_VAL == 0).
8643 Require a constant for MULT_VAL, so we know it's nonzero.
8644 ??? We disable this optimization to avoid potential
8645 overflows. */
8647 for (v = bl->giv; v; v = v->next_iv)
8648 if (GET_CODE (v->mult_val) == CONST_INT && v->mult_val != const0_rtx
8649 && v->add_val == const0_rtx
8650 && ! v->ignore && ! v->maybe_dead && v->always_computable
8651 && v->mode == mode
8652 && 0)
8654 if (! biv_elimination_giv_has_0_offset (bl->biv, v, insn))
8655 continue;
8657 if (! eliminate_p)
8658 return 1;
8660 /* If the giv has the opposite direction of change,
8661 then reverse the comparison. */
8662 if (INTVAL (v->mult_val) < 0)
8663 new = gen_rtx_COMPARE (GET_MODE (v->new_reg),
8664 const0_rtx, v->new_reg);
8665 else
8666 new = v->new_reg;
8668 /* We can probably test that giv's reduced reg. */
8669 if (validate_change (insn, &SET_SRC (x), new, 0))
8670 return 1;
8673 /* Look for a giv with (MULT_VAL != 0) and (ADD_VAL != 0);
8674 replace test insn with a compare insn (cmp REDUCED_GIV ADD_VAL).
8675 Require a constant for MULT_VAL, so we know it's nonzero.
8676 ??? Do this only if ADD_VAL is a pointer to avoid a potential
8677 overflow problem. */
8679 for (v = bl->giv; v; v = v->next_iv)
8680 if (GET_CODE (v->mult_val) == CONST_INT
8681 && v->mult_val != const0_rtx
8682 && ! v->ignore && ! v->maybe_dead && v->always_computable
8683 && v->mode == mode
8684 && (GET_CODE (v->add_val) == SYMBOL_REF
8685 || GET_CODE (v->add_val) == LABEL_REF
8686 || GET_CODE (v->add_val) == CONST
8687 || (GET_CODE (v->add_val) == REG
8688 && REG_POINTER (v->add_val))))
8690 if (! biv_elimination_giv_has_0_offset (bl->biv, v, insn))
8691 continue;
8693 if (! eliminate_p)
8694 return 1;
8696 /* If the giv has the opposite direction of change,
8697 then reverse the comparison. */
8698 if (INTVAL (v->mult_val) < 0)
8699 new = gen_rtx_COMPARE (VOIDmode, copy_rtx (v->add_val),
8700 v->new_reg);
8701 else
8702 new = gen_rtx_COMPARE (VOIDmode, v->new_reg,
8703 copy_rtx (v->add_val));
8705 /* Replace biv with the giv's reduced register. */
8706 update_reg_last_use (v->add_val, insn);
8707 if (validate_change (insn, &SET_SRC (PATTERN (insn)), new, 0))
8708 return 1;
8710 /* Insn doesn't support that constant or invariant. Copy it
8711 into a register (it will be a loop invariant). */
8712 tem = gen_reg_rtx (GET_MODE (v->new_reg));
8714 loop_insn_emit_before (loop, 0, where_insn,
8715 gen_move_insn (tem,
8716 copy_rtx (v->add_val)));
8718 /* Substitute the new register for its invariant value in
8719 the compare expression. */
8720 XEXP (new, (INTVAL (v->mult_val) < 0) ? 0 : 1) = tem;
8721 if (validate_change (insn, &SET_SRC (PATTERN (insn)), new, 0))
8722 return 1;
8725 #endif
8726 break;
8728 case COMPARE:
8729 case EQ: case NE:
8730 case GT: case GE: case GTU: case GEU:
8731 case LT: case LE: case LTU: case LEU:
8732 /* See if either argument is the biv. */
8733 if (XEXP (x, 0) == reg)
8734 arg = XEXP (x, 1), arg_operand = 1;
8735 else if (XEXP (x, 1) == reg)
8736 arg = XEXP (x, 0), arg_operand = 0;
8737 else
8738 break;
8740 if (CONSTANT_P (arg))
8742 /* First try to replace with any giv that has constant positive
8743 mult_val and constant add_val. We might be able to support
8744 negative mult_val, but it seems complex to do it in general. */
8746 for (v = bl->giv; v; v = v->next_iv)
8747 if (GET_CODE (v->mult_val) == CONST_INT
8748 && INTVAL (v->mult_val) > 0
8749 && (GET_CODE (v->add_val) == SYMBOL_REF
8750 || GET_CODE (v->add_val) == LABEL_REF
8751 || GET_CODE (v->add_val) == CONST
8752 || (GET_CODE (v->add_val) == REG
8753 && REG_POINTER (v->add_val)))
8754 && ! v->ignore && ! v->maybe_dead && v->always_computable
8755 && v->mode == mode)
8757 if (! biv_elimination_giv_has_0_offset (bl->biv, v, insn))
8758 continue;
8760 if (! eliminate_p)
8761 return 1;
8763 /* Replace biv with the giv's reduced reg. */
8764 validate_change (insn, &XEXP (x, 1 - arg_operand), v->new_reg, 1);
8766 /* If all constants are actually constant integers and
8767 the derived constant can be directly placed in the COMPARE,
8768 do so. */
8769 if (GET_CODE (arg) == CONST_INT
8770 && GET_CODE (v->mult_val) == CONST_INT
8771 && GET_CODE (v->add_val) == CONST_INT)
8773 validate_change (insn, &XEXP (x, arg_operand),
8774 GEN_INT (INTVAL (arg)
8775 * INTVAL (v->mult_val)
8776 + INTVAL (v->add_val)), 1);
8778 else
8780 /* Otherwise, load it into a register. */
8781 tem = gen_reg_rtx (mode);
8782 loop_iv_add_mult_emit_before (loop, arg,
8783 v->mult_val, v->add_val,
8784 tem, where_bb, where_insn);
8785 validate_change (insn, &XEXP (x, arg_operand), tem, 1);
8787 if (apply_change_group ())
8788 return 1;
8791 /* Look for giv with positive constant mult_val and nonconst add_val.
8792 Insert insns to calculate new compare value.
8793 ??? Turn this off due to possible overflow. */
8795 for (v = bl->giv; v; v = v->next_iv)
8796 if (GET_CODE (v->mult_val) == CONST_INT
8797 && INTVAL (v->mult_val) > 0
8798 && ! v->ignore && ! v->maybe_dead && v->always_computable
8799 && v->mode == mode
8800 && 0)
8802 rtx tem;
8804 if (! biv_elimination_giv_has_0_offset (bl->biv, v, insn))
8805 continue;
8807 if (! eliminate_p)
8808 return 1;
8810 tem = gen_reg_rtx (mode);
8812 /* Replace biv with giv's reduced register. */
8813 validate_change (insn, &XEXP (x, 1 - arg_operand),
8814 v->new_reg, 1);
8816 /* Compute value to compare against. */
8817 loop_iv_add_mult_emit_before (loop, arg,
8818 v->mult_val, v->add_val,
8819 tem, where_bb, where_insn);
8820 /* Use it in this insn. */
8821 validate_change (insn, &XEXP (x, arg_operand), tem, 1);
8822 if (apply_change_group ())
8823 return 1;
8826 else if (GET_CODE (arg) == REG || GET_CODE (arg) == MEM)
8828 if (loop_invariant_p (loop, arg) == 1)
8830 /* Look for giv with constant positive mult_val and nonconst
8831 add_val. Insert insns to compute new compare value.
8832 ??? Turn this off due to possible overflow. */
8834 for (v = bl->giv; v; v = v->next_iv)
8835 if (GET_CODE (v->mult_val) == CONST_INT && INTVAL (v->mult_val) > 0
8836 && ! v->ignore && ! v->maybe_dead && v->always_computable
8837 && v->mode == mode
8838 && 0)
8840 rtx tem;
8842 if (! biv_elimination_giv_has_0_offset (bl->biv, v, insn))
8843 continue;
8845 if (! eliminate_p)
8846 return 1;
8848 tem = gen_reg_rtx (mode);
8850 /* Replace biv with giv's reduced register. */
8851 validate_change (insn, &XEXP (x, 1 - arg_operand),
8852 v->new_reg, 1);
8854 /* Compute value to compare against. */
8855 loop_iv_add_mult_emit_before (loop, arg,
8856 v->mult_val, v->add_val,
8857 tem, where_bb, where_insn);
8858 validate_change (insn, &XEXP (x, arg_operand), tem, 1);
8859 if (apply_change_group ())
8860 return 1;
8864 /* This code has problems. Basically, when deciding whether we will
8865 eliminate BL, we can't know whether a particular giv
8866 of ARG will be reduced. If it isn't going to be reduced,
8867 we can't eliminate BL. We can try forcing it to be reduced,
8868 but that can generate poor code.
8870 The problem is that the benefit of reducing TV, below, should
8871 be increased if BL can actually be eliminated, but this means
8872 we might have to do a topological sort of the order in which
8873 we try to process biv. It doesn't seem worthwhile to do
8874 this sort of thing now. */
8876 #if 0
8877 /* Otherwise the reg compared with had better be a biv. */
8878 if (GET_CODE (arg) != REG
8879 || REG_IV_TYPE (ivs, REGNO (arg)) != BASIC_INDUCT)
8880 return 0;
8882 /* Look for a pair of givs, one for each biv,
8883 with identical coefficients. */
8884 for (v = bl->giv; v; v = v->next_iv)
8886 struct induction *tv;
8888 if (v->ignore || v->maybe_dead || v->mode != mode)
8889 continue;
8891 for (tv = REG_IV_CLASS (ivs, REGNO (arg))->giv; tv;
8892 tv = tv->next_iv)
8893 if (! tv->ignore && ! tv->maybe_dead
8894 && rtx_equal_p (tv->mult_val, v->mult_val)
8895 && rtx_equal_p (tv->add_val, v->add_val)
8896 && tv->mode == mode)
8898 if (! biv_elimination_giv_has_0_offset (bl->biv, v, insn))
8899 continue;
8901 if (! eliminate_p)
8902 return 1;
8904 /* Replace biv with its giv's reduced reg. */
8905 XEXP (x, 1 - arg_operand) = v->new_reg;
8906 /* Replace other operand with the other giv's
8907 reduced reg. */
8908 XEXP (x, arg_operand) = tv->new_reg;
8909 return 1;
8912 #endif
8915 /* If we get here, the biv can't be eliminated. */
8916 return 0;
8918 case MEM:
8919 /* If this address is a DEST_ADDR giv, it doesn't matter if the
8920 biv is used in it, since it will be replaced. */
8921 for (v = bl->giv; v; v = v->next_iv)
8922 if (v->giv_type == DEST_ADDR && v->location == &XEXP (x, 0))
8923 return 1;
8924 break;
8926 default:
8927 break;
8930 /* See if any subexpression fails elimination. */
8931 fmt = GET_RTX_FORMAT (code);
8932 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
8934 switch (fmt[i])
8936 case 'e':
8937 if (! maybe_eliminate_biv_1 (loop, XEXP (x, i), insn, bl,
8938 eliminate_p, where_bb, where_insn))
8939 return 0;
8940 break;
8942 case 'E':
8943 for (j = XVECLEN (x, i) - 1; j >= 0; j--)
8944 if (! maybe_eliminate_biv_1 (loop, XVECEXP (x, i, j), insn, bl,
8945 eliminate_p, where_bb, where_insn))
8946 return 0;
8947 break;
8951 return 1;
8954 /* Return nonzero if the last use of REG
8955 is in an insn following INSN in the same basic block. */
8957 static int
8958 last_use_this_basic_block (reg, insn)
8959 rtx reg;
8960 rtx insn;
8962 rtx n;
8963 for (n = insn;
8964 n && GET_CODE (n) != CODE_LABEL && GET_CODE (n) != JUMP_INSN;
8965 n = NEXT_INSN (n))
8967 if (REGNO_LAST_UID (REGNO (reg)) == INSN_UID (n))
8968 return 1;
8970 return 0;
8973 /* Called via `note_stores' to record the initial value of a biv. Here we
8974 just record the location of the set and process it later. */
8976 static void
8977 record_initial (dest, set, data)
8978 rtx dest;
8979 rtx set;
8980 void *data ATTRIBUTE_UNUSED;
8982 struct loop_ivs *ivs = (struct loop_ivs *) data;
8983 struct iv_class *bl;
8985 if (GET_CODE (dest) != REG
8986 || REGNO (dest) >= ivs->n_regs
8987 || REG_IV_TYPE (ivs, REGNO (dest)) != BASIC_INDUCT)
8988 return;
8990 bl = REG_IV_CLASS (ivs, REGNO (dest));
8992 /* If this is the first set found, record it. */
8993 if (bl->init_insn == 0)
8995 bl->init_insn = note_insn;
8996 bl->init_set = set;
9000 /* If any of the registers in X are "old" and currently have a last use earlier
9001 than INSN, update them to have a last use of INSN. Their actual last use
9002 will be the previous insn but it will not have a valid uid_luid so we can't
9003 use it. X must be a source expression only. */
9005 static void
9006 update_reg_last_use (x, insn)
9007 rtx x;
9008 rtx insn;
9010 /* Check for the case where INSN does not have a valid luid. In this case,
9011 there is no need to modify the regno_last_uid, as this can only happen
9012 when code is inserted after the loop_end to set a pseudo's final value,
9013 and hence this insn will never be the last use of x.
9014 ???? This comment is not correct. See for example loop_givs_reduce.
9015 This may insert an insn before another new insn. */
9016 if (GET_CODE (x) == REG && REGNO (x) < max_reg_before_loop
9017 && INSN_UID (insn) < max_uid_for_loop
9018 && REGNO_LAST_LUID (REGNO (x)) < INSN_LUID (insn))
9020 REGNO_LAST_UID (REGNO (x)) = INSN_UID (insn);
9022 else
9024 int i, j;
9025 const char *fmt = GET_RTX_FORMAT (GET_CODE (x));
9026 for (i = GET_RTX_LENGTH (GET_CODE (x)) - 1; i >= 0; i--)
9028 if (fmt[i] == 'e')
9029 update_reg_last_use (XEXP (x, i), insn);
9030 else if (fmt[i] == 'E')
9031 for (j = XVECLEN (x, i) - 1; j >= 0; j--)
9032 update_reg_last_use (XVECEXP (x, i, j), insn);
9037 /* Given an insn INSN and condition COND, return the condition in a
9038 canonical form to simplify testing by callers. Specifically:
9040 (1) The code will always be a comparison operation (EQ, NE, GT, etc.).
9041 (2) Both operands will be machine operands; (cc0) will have been replaced.
9042 (3) If an operand is a constant, it will be the second operand.
9043 (4) (LE x const) will be replaced with (LT x <const+1>) and similarly
9044 for GE, GEU, and LEU.
9046 If the condition cannot be understood, or is an inequality floating-point
9047 comparison which needs to be reversed, 0 will be returned.
9049 If REVERSE is non-zero, then reverse the condition prior to canonicalizing it.
9051 If EARLIEST is non-zero, it is a pointer to a place where the earliest
9052 insn used in locating the condition was found. If a replacement test
9053 of the condition is desired, it should be placed in front of that
9054 insn and we will be sure that the inputs are still valid.
9056 If WANT_REG is non-zero, we wish the condition to be relative to that
9057 register, if possible. Therefore, do not canonicalize the condition
9058 further. */
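/* Examples of rules (3) and (4) (register numbers hypothetical):
   (GE (reg 60) (const_int 5)) canonicalizes to
   (GT (reg 60) (const_int 4)), and (LEU (reg 60) (const_int 7)) to
   (LTU (reg 60) (const_int 8)); a constant first operand, as in
   (LT (const_int 0) (reg 60)), is swapped to
   (GT (reg 60) (const_int 0)).  */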
9060 rtx
9061 canonicalize_condition (insn, cond, reverse, earliest, want_reg)
9062 rtx insn;
9063 rtx cond;
9064 int reverse;
9065 rtx *earliest;
9066 rtx want_reg;
9068 enum rtx_code code;
9069 rtx prev = insn;
9070 rtx set;
9071 rtx tem;
9072 rtx op0, op1;
9073 int reverse_code = 0;
9074 enum machine_mode mode;
9076 code = GET_CODE (cond);
9077 mode = GET_MODE (cond);
9078 op0 = XEXP (cond, 0);
9079 op1 = XEXP (cond, 1);
9081 if (reverse)
9082 code = reversed_comparison_code (cond, insn);
9083 if (code == UNKNOWN)
9084 return 0;
9086 if (earliest)
9087 *earliest = insn;
9089 /* If we are comparing a register with zero, see if the register is set
9090 in the previous insn to a COMPARE or a comparison operation. Perform
9091 the same tests as a function of STORE_FLAG_VALUE as find_comparison_args
9092 in cse.c */
9094 while (GET_RTX_CLASS (code) == '<'
9095 && op1 == CONST0_RTX (GET_MODE (op0))
9096 && op0 != want_reg)
9098 /* Set non-zero when we find something of interest. */
9099 rtx x = 0;
9101 #ifdef HAVE_cc0
9102 /* If comparison with cc0, import actual comparison from compare
9103 insn. */
9104 if (op0 == cc0_rtx)
9106 if ((prev = prev_nonnote_insn (prev)) == 0
9107 || GET_CODE (prev) != INSN
9108 || (set = single_set (prev)) == 0
9109 || SET_DEST (set) != cc0_rtx)
9110 return 0;
9112 op0 = SET_SRC (set);
9113 op1 = CONST0_RTX (GET_MODE (op0));
9114 if (earliest)
9115 *earliest = prev;
9117 #endif
9119 /* If this is a COMPARE, pick up the two things being compared. */
9120 if (GET_CODE (op0) == COMPARE)
9122 op1 = XEXP (op0, 1);
9123 op0 = XEXP (op0, 0);
9124 continue;
9126 else if (GET_CODE (op0) != REG)
9127 break;
9129 /* Go back to the previous insn. Stop if it is not an INSN. We also
9130 stop if it isn't a single set or if it has a REG_INC note because
9131 we don't want to bother dealing with it. */
9133 if ((prev = prev_nonnote_insn (prev)) == 0
9134 || GET_CODE (prev) != INSN
9135 || FIND_REG_INC_NOTE (prev, NULL_RTX))
9136 break;
9138 set = set_of (op0, prev);
9140 if (set
9141 && (GET_CODE (set) != SET
9142 || !rtx_equal_p (SET_DEST (set), op0)))
9143 break;
9145 /* If this is setting OP0, get what it sets it to if it looks
9146 relevant. */
9147 if (set)
9149 enum machine_mode inner_mode = GET_MODE (SET_DEST (set));
9151 /* ??? We may not combine comparisons done in a CCmode with
9152 comparisons not done in a CCmode. This is to aid targets
9153 like Alpha that have an IEEE compliant EQ instruction, and
9154 a non-IEEE compliant BEQ instruction. The use of CCmode is
9155 actually artificial, simply to prevent the combination, but
9156 should not affect other platforms.
9158 However, we must allow VOIDmode comparisons to match either
9159 CCmode or non-CCmode comparison, because some ports have
9160 modeless comparisons inside branch patterns.
9162 ??? This mode check should perhaps look more like the mode check
9163 in simplify_comparison in combine. */
9165 if ((GET_CODE (SET_SRC (set)) == COMPARE
9166 || (((code == NE
9167 || (code == LT
9168 && GET_MODE_CLASS (inner_mode) == MODE_INT
9169 && (GET_MODE_BITSIZE (inner_mode)
9170 <= HOST_BITS_PER_WIDE_INT)
9171 && (STORE_FLAG_VALUE
9172 & ((HOST_WIDE_INT) 1
9173 << (GET_MODE_BITSIZE (inner_mode) - 1))))
9174 #ifdef FLOAT_STORE_FLAG_VALUE
9175 || (code == LT
9176 && GET_MODE_CLASS (inner_mode) == MODE_FLOAT
9177 && (REAL_VALUE_NEGATIVE
9178 (FLOAT_STORE_FLAG_VALUE (inner_mode))))
9179 #endif
9181 && GET_RTX_CLASS (GET_CODE (SET_SRC (set))) == '<'))
9182 && (((GET_MODE_CLASS (mode) == MODE_CC)
9183 == (GET_MODE_CLASS (inner_mode) == MODE_CC))
9184 || mode == VOIDmode || inner_mode == VOIDmode))
9185 x = SET_SRC (set);
9186 else if (((code == EQ
9187 || (code == GE
9188 && (GET_MODE_BITSIZE (inner_mode)
9189 <= HOST_BITS_PER_WIDE_INT)
9190 && GET_MODE_CLASS (inner_mode) == MODE_INT
9191 && (STORE_FLAG_VALUE
9192 & ((HOST_WIDE_INT) 1
9193 << (GET_MODE_BITSIZE (inner_mode) - 1))))
9194 #ifdef FLOAT_STORE_FLAG_VALUE
9195 || (code == GE
9196 && GET_MODE_CLASS (inner_mode) == MODE_FLOAT
9197 && (REAL_VALUE_NEGATIVE
9198 (FLOAT_STORE_FLAG_VALUE (inner_mode))))
9199 #endif
9201 && GET_RTX_CLASS (GET_CODE (SET_SRC (set))) == '<'
9202 && (((GET_MODE_CLASS (mode) == MODE_CC)
9203 == (GET_MODE_CLASS (inner_mode) == MODE_CC))
9204 || mode == VOIDmode || inner_mode == VOIDmode))
9207 reverse_code = 1;
9208 x = SET_SRC (set);
9210 else
9211 break;
9214 else if (reg_set_p (op0, prev))
9215 /* If this sets OP0, but not directly, we have to give up. */
9216 break;
9218 if (x)
9220 if (GET_RTX_CLASS (GET_CODE (x)) == '<')
9221 code = GET_CODE (x);
9222 if (reverse_code)
9224 code = reversed_comparison_code (x, prev);
9225 if (code == UNKNOWN)
9226 return 0;
9227 reverse_code = 0;
9230 op0 = XEXP (x, 0), op1 = XEXP (x, 1);
9231 if (earliest)
9232 *earliest = prev;
9236 /* If constant is first, put it last. */
9237 if (CONSTANT_P (op0))
9238 code = swap_condition (code), tem = op0, op0 = op1, op1 = tem;
9240 /* If OP0 is the result of a comparison, we weren't able to find what
9241 was really being compared, so fail. */
9242 if (GET_MODE_CLASS (GET_MODE (op0)) == MODE_CC)
9243 return 0;
9245 /* Canonicalize any ordered comparison with integers involving equality
9246 if we can do computations in the relevant mode and we do not
9247 overflow. */
9249 if (GET_CODE (op1) == CONST_INT
9250 && GET_MODE (op0) != VOIDmode
9251 && GET_MODE_BITSIZE (GET_MODE (op0)) <= HOST_BITS_PER_WIDE_INT)
9253 HOST_WIDE_INT const_val = INTVAL (op1);
9254 unsigned HOST_WIDE_INT uconst_val = const_val;
9255 unsigned HOST_WIDE_INT max_val
9256 = (unsigned HOST_WIDE_INT) GET_MODE_MASK (GET_MODE (op0));
9258 switch (code)
9260 case LE:
9261 if ((unsigned HOST_WIDE_INT) const_val != max_val >> 1)
9262 code = LT, op1 = GEN_INT (const_val + 1);
9263 break;
9265 /* When cross-compiling, const_val might be sign-extended from
9266 BITS_PER_WORD to HOST_BITS_PER_WIDE_INT */
9267 case GE:
9268 if ((HOST_WIDE_INT) (const_val & max_val)
9269 != (((HOST_WIDE_INT) 1
9270 << (GET_MODE_BITSIZE (GET_MODE (op0)) - 1))))
9271 code = GT, op1 = GEN_INT (const_val - 1);
9272 break;
9274 case LEU:
9275 if (uconst_val < max_val)
9276 code = LTU, op1 = GEN_INT (uconst_val + 1);
9277 break;
9279 case GEU:
9280 if (uconst_val != 0)
9281 code = GTU, op1 = GEN_INT (uconst_val - 1);
9282 break;
9284 default:
9285 break;
9289 #ifdef HAVE_cc0
9290 /* Never return CC0; return zero instead. */
9291 if (op0 == cc0_rtx)
9292 return 0;
9293 #endif
9295 return gen_rtx_fmt_ee (code, VOIDmode, op0, op1);
9298 /* Given a jump insn JUMP, return the condition that will cause it to branch
9299 to its JUMP_LABEL. If the condition cannot be understood, or is an
9300 inequality floating-point comparison which needs to be reversed, 0 will
9301 be returned.
9303 If EARLIEST is non-zero, it is a pointer to a place where the earliest
9304 insn used in locating the condition was found. If a replacement test
9305 of the condition is desired, it should be placed in front of that
9306 insn and we will be sure that the inputs are still valid. */
9308 rtx
9309 get_condition (jump, earliest)
9310 rtx jump;
9311 rtx *earliest;
9313 rtx cond;
9314 int reverse;
9315 rtx set;
9317 /* If this is not a standard conditional jump, we can't parse it. */
9318 if (GET_CODE (jump) != JUMP_INSN
9319 || ! any_condjump_p (jump))
9320 return 0;
9321 set = pc_set (jump);
9323 cond = XEXP (SET_SRC (set), 0);
9325 /* If this branches to JUMP_LABEL when the condition is false, reverse
9326 the condition. */
9327 reverse
9328 = GET_CODE (XEXP (SET_SRC (set), 2)) == LABEL_REF
9329 && XEXP (XEXP (SET_SRC (set), 2), 0) == JUMP_LABEL (jump);
9331 return canonicalize_condition (jump, cond, reverse, earliest, NULL_RTX);
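/* A minimal usage sketch for get_condition; the caller code here is
   hypothetical:

     rtx earliest;
     rtx cond = get_condition (jump, &earliest);

     if (cond != 0)
       {
         ... GET_CODE (cond) is the comparison code, XEXP (cond, 0) and
         XEXP (cond, 1) the canonicalized operands; a replacement test
         belongs in front of EARLIEST ...
       }
*/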
9334 /* Similar to above routine, except that we also put an invariant last
9335 unless both operands are invariants. */
9337 rtx
9338 get_condition_for_loop (loop, x)
9339 const struct loop *loop;
9340 rtx x;
9342 rtx comparison = get_condition (x, (rtx*) 0);
9344 if (comparison == 0
9345 || ! loop_invariant_p (loop, XEXP (comparison, 0))
9346 || loop_invariant_p (loop, XEXP (comparison, 1)))
9347 return comparison;
9349 return gen_rtx_fmt_ee (swap_condition (GET_CODE (comparison)), VOIDmode,
9350 XEXP (comparison, 1), XEXP (comparison, 0));
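/* A small sketch (pseudo-register numbers illustrative): if
   get_condition returns (lt (reg 70) (reg 71)) where (reg 70) is
   loop-invariant but (reg 71) varies, the routine above hands back
   (gt (reg 71) (reg 70)), putting the invariant operand last.  */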
9353 /* Scan the function and determine whether it has indirect (computed) jumps.
9355 This is taken mostly from flow.c; similar code exists elsewhere
9356 in the compiler. It may be useful to put this into rtlanal.c. */
9357 static int
9358 indirect_jump_in_function_p (start)
9359 rtx start;
9361 rtx insn;
9363 for (insn = start; insn; insn = NEXT_INSN (insn))
9364 if (computed_jump_p (insn))
9365 return 1;
9367 return 0;
9370 /* Add MEM to the LOOP_MEMS array, if appropriate. See the
9371 documentation for LOOP_MEMS for the definition of `appropriate'.
9372 This function is called from prescan_loop via for_each_rtx. */
9374 static int
9375 insert_loop_mem (mem, data)
9376 rtx *mem;
9377 void *data ATTRIBUTE_UNUSED;
9379 struct loop_info *loop_info = data;
9380 int i;
9381 rtx m = *mem;
9383 if (m == NULL_RTX)
9384 return 0;
9386 switch (GET_CODE (m))
9388 case MEM:
9389 break;
9391 case CLOBBER:
9392 /* We're not interested in MEMs that are only clobbered. */
9393 return -1;
9395 case CONST_DOUBLE:
9396 /* We're not interested in the MEM associated with a
9397 CONST_DOUBLE, so there's no need to traverse into this. */
9398 return -1;
9400 case EXPR_LIST:
9401 /* We're not interested in any MEMs that only appear in notes. */
9402 return -1;
9404 default:
9405 /* This is not a MEM. */
9406 return 0;
9409 /* See if we've already seen this MEM. */
9410 for (i = 0; i < loop_info->mems_idx; ++i)
9411 if (rtx_equal_p (m, loop_info->mems[i].mem))
9413 if (GET_MODE (m) != GET_MODE (loop_info->mems[i].mem))
9414 /* The modes of the two memory accesses are different. If
9415 this happens, something tricky is going on, and we just
9416 don't optimize accesses to this MEM. */
9417 loop_info->mems[i].optimize = 0;
9419 return 0;
9422 /* Resize the array, if necessary. */
9423 if (loop_info->mems_idx == loop_info->mems_allocated)
9425 if (loop_info->mems_allocated != 0)
9426 loop_info->mems_allocated *= 2;
9427 else
9428 loop_info->mems_allocated = 32;
9430 loop_info->mems = (loop_mem_info *)
9431 xrealloc (loop_info->mems,
9432 loop_info->mems_allocated * sizeof (loop_mem_info));
9435 /* Actually insert the MEM. */
9436 loop_info->mems[loop_info->mems_idx].mem = m;
9437 /* We can't hoist this MEM out of the loop if it's a BLKmode MEM
9438 because we can't put it in a register. We still store it in the
9439 table, though, so that if we see the same address later, but in a
9440 non-BLK mode, we'll not think we can optimize it at that point. */
9441 loop_info->mems[loop_info->mems_idx].optimize = (GET_MODE (m) != BLKmode);
9442 loop_info->mems[loop_info->mems_idx].reg = NULL_RTX;
9443 ++loop_info->mems_idx;
9445 return 0;
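/* A sketch of how this callback is driven; the exact call site in
   prescan_loop may differ slightly:

     for_each_rtx (&insn, insert_loop_mem, loop_info);

   Returning -1 above prunes the walk out of CLOBBERs, CONST_DOUBLEs
   and note lists, while returning 0 lets for_each_rtx recurse into
   the remaining subexpressions.  */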
9449 /* Allocate REGS->ARRAY or reallocate it if it is too small.
9451 Increment REGS->ARRAY[I].SET_IN_LOOP at the index I of each
9452 register that is modified by an insn between FROM and TO. If the
9453 value of an element of REGS->array[I].SET_IN_LOOP becomes 127 or
9454 more, stop incrementing it, to avoid overflow.
9456 Store in REGS->ARRAY[I].SINGLE_USAGE the single insn in which
9457 register I is used, if it is only used once. Otherwise, it is set
9458 to 0 (for no uses) or const0_rtx for more than one use. This
9459 parameter may be zero, in which case this processing is not done.
9461 Set REGS->ARRAY[I].MAY_NOT_OPTIMIZE nonzero if we should not
9462 optimize register I. */
9464 static void
9465 loop_regs_scan (loop, extra_size)
9466 const struct loop *loop;
9467 int extra_size;
9469 struct loop_regs *regs = LOOP_REGS (loop);
9470 int old_nregs;
9471 /* last_set[n] is nonzero iff reg n has been set in the current
9472 basic block. In that case, it is the insn that last set reg n. */
9473 rtx *last_set;
9474 rtx insn;
9475 int i;
9477 old_nregs = regs->num;
9478 regs->num = max_reg_num ();
9480 /* Grow the regs array if not allocated or too small. */
9481 if (regs->num >= regs->size)
9483 regs->size = regs->num + extra_size;
9485 regs->array = (struct loop_reg *)
9486 xrealloc (regs->array, regs->size * sizeof (*regs->array));
9488 /* Zero the new elements. */
9489 memset (regs->array + old_nregs, 0,
9490 (regs->size - old_nregs) * sizeof (*regs->array));
9493 /* Clear previously scanned fields but do not clear n_times_set. */
9494 for (i = 0; i < old_nregs; i++)
9496 regs->array[i].set_in_loop = 0;
9497 regs->array[i].may_not_optimize = 0;
9498 regs->array[i].single_usage = NULL_RTX;
9501 last_set = (rtx *) xcalloc (regs->num, sizeof (rtx));
9503 /* Scan the loop, recording register usage. */
9504 for (insn = loop->top ? loop->top : loop->start; insn != loop->end;
9505 insn = NEXT_INSN (insn))
9507 if (INSN_P (insn))
9509 /* Record registers that have exactly one use. */
9510 find_single_use_in_loop (regs, insn, PATTERN (insn));
9512 /* Include uses in REG_EQUAL notes. */
9513 if (REG_NOTES (insn))
9514 find_single_use_in_loop (regs, insn, REG_NOTES (insn));
9516 if (GET_CODE (PATTERN (insn)) == SET
9517 || GET_CODE (PATTERN (insn)) == CLOBBER)
9518 count_one_set (regs, insn, PATTERN (insn), last_set);
9519 else if (GET_CODE (PATTERN (insn)) == PARALLEL)
9521 int i;
9522 for (i = XVECLEN (PATTERN (insn), 0) - 1; i >= 0; i--)
9523 count_one_set (regs, insn, XVECEXP (PATTERN (insn), 0, i),
9524 last_set);
9528 if (GET_CODE (insn) == CODE_LABEL || GET_CODE (insn) == JUMP_INSN)
9529 memset (last_set, 0, regs->num * sizeof (rtx));
9532 /* Invalidate all hard registers clobbered by calls. With one exception:
9533 a call-clobbered PIC register is still function-invariant for our
9534 purposes, since we can hoist any PIC calculations out of the loop.
9535 Thus the call to rtx_varies_p. */
9536 if (LOOP_INFO (loop)->has_call)
9537 for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
9538 if (TEST_HARD_REG_BIT (regs_invalidated_by_call, i)
9539 && rtx_varies_p (gen_rtx_REG (Pmode, i), /*for_alias=*/1))
9541 regs->array[i].may_not_optimize = 1;
9542 regs->array[i].set_in_loop = 1;
9545 #ifdef AVOID_CCMODE_COPIES
9546 /* Don't try to move insns which set CC registers if we should not
9547 create CCmode register copies. */
9548 for (i = regs->num - 1; i >= FIRST_PSEUDO_REGISTER; i--)
9549 if (GET_MODE_CLASS (GET_MODE (regno_reg_rtx[i])) == MODE_CC)
9550 regs->array[i].may_not_optimize = 1;
9551 #endif
9553 /* Set regs->array[I].n_times_set for the new registers. */
9554 for (i = old_nregs; i < regs->num; i++)
9555 regs->array[i].n_times_set = regs->array[i].set_in_loop;
9557 free (last_set);
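/* A consumer sketch for the fields filled in above (hypothetical
   snippet; the encodings are those documented before loop_regs_scan):

     if (regs->array[i].set_in_loop == 0)
       ... register I is never set inside the loop ...
     else if (regs->array[i].single_usage != 0
              && regs->array[i].single_usage != const0_rtx)
       ... register I is used in exactly one insn, namely
           regs->array[i].single_usage ...

   Since SET_IN_LOOP saturates at 127, large values are only a lower
   bound on the true number of sets.  */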
9560 /* Returns the number of real INSNs in the LOOP. */
9562 static int
9563 count_insns_in_loop (loop)
9564 const struct loop *loop;
9566 int count = 0;
9567 rtx insn;
9569 for (insn = loop->top ? loop->top : loop->start; insn != loop->end;
9570 insn = NEXT_INSN (insn))
9571 if (INSN_P (insn))
9572 ++count;
9574 return count;
9577 /* Move MEMs into registers for the duration of the loop. */
9579 static void
9580 load_mems (loop)
9581 const struct loop *loop;
9583 struct loop_info *loop_info = LOOP_INFO (loop);
9584 struct loop_regs *regs = LOOP_REGS (loop);
9585 int maybe_never = 0;
9586 int i;
9587 rtx p, prev_ebb_head;
9588 rtx label = NULL_RTX;
9589 rtx end_label;
9590 /* Nonzero if the next instruction may never be executed. */
9591 int next_maybe_never = 0;
9592 unsigned int last_max_reg = max_reg_num ();
9594 if (loop_info->mems_idx == 0)
9595 return;
9597 /* We cannot use next_label here because it skips over normal insns. */
9598 end_label = next_nonnote_insn (loop->end);
9599 if (end_label && GET_CODE (end_label) != CODE_LABEL)
9600 end_label = NULL_RTX;
9602 /* Check to see if it's possible that some instructions in the loop are
9603 never executed. Also check if there is a goto out of the loop other
9604 than right after the end of the loop. */
9605 for (p = next_insn_in_loop (loop, loop->scan_start);
9606 p != NULL_RTX;
9607 p = next_insn_in_loop (loop, p))
9609 if (GET_CODE (p) == CODE_LABEL)
9610 maybe_never = 1;
9611 else if (GET_CODE (p) == JUMP_INSN
9612 /* If we enter the loop in the middle, and scan
9613 around to the beginning, don't set maybe_never
9614 for that. This must be an unconditional jump,
9615 otherwise the code at the top of the loop might
9616 never be executed. Unconditional jumps are
9617 followed by a barrier, then the loop end.
9618 && ! (GET_CODE (p) == JUMP_INSN
9619 && JUMP_LABEL (p) == loop->top
9620 && NEXT_INSN (NEXT_INSN (p)) == loop->end
9621 && any_uncondjump_p (p)))
9623 /* If this is a jump outside of the loop but not right
9624 after the end of the loop, we would have to emit new fixup
9625 sequences for each such label. */
9626 if (/* If we can't tell where control might go when this
9627 JUMP_INSN is executed, we must be conservative. */
9628 !JUMP_LABEL (p)
9629 || (JUMP_LABEL (p) != end_label
9630 && (INSN_UID (JUMP_LABEL (p)) >= max_uid_for_loop
9631 || INSN_LUID (JUMP_LABEL (p)) < INSN_LUID (loop->start)
9632 || INSN_LUID (JUMP_LABEL (p)) > INSN_LUID (loop->end))))
9633 return;
9635 if (!any_condjump_p (p))
9636 /* Something complicated. */
9637 maybe_never = 1;
9638 else
9639 /* If there are any more instructions in the loop, they
9640 might not be reached. */
9641 next_maybe_never = 1;
9643 else if (next_maybe_never)
9644 maybe_never = 1;
9647 /* Find start of the extended basic block that enters the loop. */
9648 for (p = loop->start;
9649 PREV_INSN (p) && GET_CODE (p) != CODE_LABEL;
9650 p = PREV_INSN (p))
9652 prev_ebb_head = p;
9654 cselib_init ();
9656 /* Build table of mems that get set to constant values before the
9657 loop. */
9658 for (; p != loop->start; p = NEXT_INSN (p))
9659 cselib_process_insn (p);
9661 /* Actually move the MEMs. */
9662 for (i = 0; i < loop_info->mems_idx; ++i)
9664 regset_head load_copies;
9665 regset_head store_copies;
9666 int written = 0;
9667 rtx reg;
9668 rtx mem = loop_info->mems[i].mem;
9669 rtx mem_list_entry;
9671 if (MEM_VOLATILE_P (mem)
9672 || loop_invariant_p (loop, XEXP (mem, 0)) != 1)
9673 /* There's no telling whether or not MEM is modified. */
9674 loop_info->mems[i].optimize = 0;
9676 /* Go through the MEMs written to in the loop to see if this
9677 one is aliased by one of them. */
9678 mem_list_entry = loop_info->store_mems;
9679 while (mem_list_entry)
9681 if (rtx_equal_p (mem, XEXP (mem_list_entry, 0)))
9682 written = 1;
9683 else if (true_dependence (XEXP (mem_list_entry, 0), VOIDmode,
9684 mem, rtx_varies_p))
9686 /* MEM is indeed aliased by this store. */
9687 loop_info->mems[i].optimize = 0;
9688 break;
9690 mem_list_entry = XEXP (mem_list_entry, 1);
9693 if (flag_float_store && written
9694 && GET_MODE_CLASS (GET_MODE (mem)) == MODE_FLOAT)
9695 loop_info->mems[i].optimize = 0;
9697 /* If this MEM is written to, we must be sure that there
9698 are no reads from another MEM that aliases this one. */
9699 if (loop_info->mems[i].optimize && written)
9701 int j;
9703 for (j = 0; j < loop_info->mems_idx; ++j)
9705 if (j == i)
9706 continue;
9707 else if (true_dependence (mem,
9708 VOIDmode,
9709 loop_info->mems[j].mem,
9710 rtx_varies_p))
9712 /* It's not safe to hoist loop_info->mems[i] out of
9713 the loop because writes to it might not be
9714 seen by reads from loop_info->mems[j]. */
9715 loop_info->mems[i].optimize = 0;
9716 break;
9721 if (maybe_never && may_trap_p (mem))
9722 /* We can't access the MEM outside the loop; it might
9723 cause a trap that wouldn't have happened otherwise. */
9724 loop_info->mems[i].optimize = 0;
9726 if (!loop_info->mems[i].optimize)
9727 /* We thought we were going to lift this MEM out of the
9728 loop, but later discovered that we could not. */
9729 continue;
9731 INIT_REG_SET (&load_copies);
9732 INIT_REG_SET (&store_copies);
9734 /* Allocate a pseudo for this MEM. We set REG_USERVAR_P in
9735 order to keep scan_loop from moving stores to this MEM
9736 out of the loop just because this REG is neither a
9737 user-variable nor used in the loop test. */
9738 reg = gen_reg_rtx (GET_MODE (mem));
9739 REG_USERVAR_P (reg) = 1;
9740 loop_info->mems[i].reg = reg;
9742 /* Now, replace all references to the MEM with the
9743 corresponding pseudos. */
9744 maybe_never = 0;
9745 for (p = next_insn_in_loop (loop, loop->scan_start);
9746 p != NULL_RTX;
9747 p = next_insn_in_loop (loop, p))
9749 if (INSN_P (p))
9751 rtx set;
9753 set = single_set (p);
9755 /* See if this copies the mem into a register that isn't
9756 modified afterwards. We'll try to do copy propagation
9757 a little further on. */
9758 if (set
9759 /* @@@ This test is _way_ too conservative. */
9760 && ! maybe_never
9761 && GET_CODE (SET_DEST (set)) == REG
9762 && REGNO (SET_DEST (set)) >= FIRST_PSEUDO_REGISTER
9763 && REGNO (SET_DEST (set)) < last_max_reg
9764 && regs->array[REGNO (SET_DEST (set))].n_times_set == 1
9765 && rtx_equal_p (SET_SRC (set), mem))
9766 SET_REGNO_REG_SET (&load_copies, REGNO (SET_DEST (set)));
9768 /* See if this copies the mem from a register that isn't
9769 modified afterwards. We'll try to remove the
9770 redundant copy later on by doing a little register
9771 renaming and copy propagation. This will help
9772 to untangle things for the BIV detection code. */
9773 if (set
9774 && ! maybe_never
9775 && GET_CODE (SET_SRC (set)) == REG
9776 && REGNO (SET_SRC (set)) >= FIRST_PSEUDO_REGISTER
9777 && REGNO (SET_SRC (set)) < last_max_reg
9778 && regs->array[REGNO (SET_SRC (set))].n_times_set == 1
9779 && rtx_equal_p (SET_DEST (set), mem))
9780 SET_REGNO_REG_SET (&store_copies, REGNO (SET_SRC (set)));
9782 /* Replace the memory reference with the shadow register. */
9783 replace_loop_mems (p, loop_info->mems[i].mem,
9784 loop_info->mems[i].reg);
9787 if (GET_CODE (p) == CODE_LABEL
9788 || GET_CODE (p) == JUMP_INSN)
9789 maybe_never = 1;
9792 if (! apply_change_group ())
9793 /* We couldn't replace all occurrences of the MEM. */
9794 loop_info->mems[i].optimize = 0;
9795 else
9797 /* Load the memory immediately before LOOP->START, which is
9798 the NOTE_LOOP_BEG. */
9799 cselib_val *e = cselib_lookup (mem, VOIDmode, 0);
9800 rtx set;
9801 rtx best = mem;
9802 int j;
9803 struct elt_loc_list *const_equiv = 0;
9805 if (e)
9807 struct elt_loc_list *equiv;
9808 struct elt_loc_list *best_equiv = 0;
9809 for (equiv = e->locs; equiv; equiv = equiv->next)
9811 if (CONSTANT_P (equiv->loc))
9812 const_equiv = equiv;
9813 else if (GET_CODE (equiv->loc) == REG
9814 /* Extending hard register lifetimes causes a crash
9815 on SRC targets. Doing so on non-SRC targets is
9816 probably also not a good idea, since we most
9817 probably have a pseudo-register equivalence as
9818 well. */
9819 && REGNO (equiv->loc) >= FIRST_PSEUDO_REGISTER)
9820 best_equiv = equiv;
9822 /* Use the constant equivalence if that is cheap enough. */
9823 if (! best_equiv)
9824 best_equiv = const_equiv;
9825 else if (const_equiv
9826 && (rtx_cost (const_equiv->loc, SET)
9827 <= rtx_cost (best_equiv->loc, SET)))
9829 best_equiv = const_equiv;
9830 const_equiv = 0;
9833 /* If best_equiv is nonzero, we know that MEM is set to a
9834 constant or register before the loop. We will use this
9835 knowledge to initialize the shadow register with that
9836 constant or reg rather than by loading from MEM. */
9837 if (best_equiv)
9838 best = copy_rtx (best_equiv->loc);
9841 set = gen_move_insn (reg, best);
9842 set = loop_insn_hoist (loop, set);
9843 if (REG_P (best))
9845 for (p = prev_ebb_head; p != loop->start; p = NEXT_INSN (p))
9846 if (REGNO_LAST_UID (REGNO (best)) == INSN_UID (p))
9848 REGNO_LAST_UID (REGNO (best)) = INSN_UID (set);
9849 break;
9853 if (const_equiv)
9854 set_unique_reg_note (set, REG_EQUAL, copy_rtx (const_equiv->loc));
9856 if (written)
9858 if (label == NULL_RTX)
9860 label = gen_label_rtx ();
9861 emit_label_after (label, loop->end);
9864 /* Store the memory immediately after END, which is
9865 the NOTE_LOOP_END. */
9866 set = gen_move_insn (copy_rtx (mem), reg);
9867 loop_insn_emit_after (loop, 0, label, set);
9870 if (loop_dump_stream)
9872 fprintf (loop_dump_stream, "Hoisted regno %d %s from ",
9873 REGNO (reg), (written ? "r/w" : "r/o"));
9874 print_rtl (loop_dump_stream, mem);
9875 fputc ('\n', loop_dump_stream);
9878 /* Attempt a bit of copy propagation. This helps untangle the
9879 data flow, and enables {basic,general}_induction_var to find
9880 more bivs/givs. */
9881 EXECUTE_IF_SET_IN_REG_SET
9882 (&load_copies, FIRST_PSEUDO_REGISTER, j,
9884 try_copy_prop (loop, reg, j);
9886 CLEAR_REG_SET (&load_copies);
9888 EXECUTE_IF_SET_IN_REG_SET
9889 (&store_copies, FIRST_PSEUDO_REGISTER, j,
9891 try_swap_copy_prop (loop, reg, j);
9893 CLEAR_REG_SET (&store_copies);
9897 if (label != NULL_RTX && end_label != NULL_RTX)
9899 /* Now, we need to replace all references to the previous exit
9900 label with the new one. */
9901 rtx_pair rr;
9902 rr.r1 = end_label;
9903 rr.r2 = label;
9905 for (p = loop->start; p != loop->end; p = NEXT_INSN (p))
9907 for_each_rtx (&p, replace_label, &rr);
9909 /* If this is a JUMP_INSN, then we also need to fix the JUMP_LABEL
9910 field. This is not handled by for_each_rtx because it doesn't
9911 handle unprinted ('0') fields. We need to update JUMP_LABEL
9912 because the immediately following unroll pass will use it.
9913 replace_label would not work anyway, because that only handles
9914 LABEL_REFs. */
9915 if (GET_CODE (p) == JUMP_INSN && JUMP_LABEL (p) == end_label)
9916 JUMP_LABEL (p) = label;
9920 cselib_finish ();
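/* A sketch of the net effect of load_mems on one hoistable MEM, with
   a hypothetical shadow pseudo 100:

     before:
         ;; loop body
         ... (mem X) ...
         (set (mem X) (...))

     after:
         (set (reg 100) (mem X))        ;; hoisted into the pre-header
         ;; loop body
         ... (reg 100) ...
         (set (reg 100) (...))
         ;; after the loop, at the new exit label
         (set (mem X) (reg 100))        ;; emitted only if MEM was written

   When cselib proves MEM equal to a constant or pseudo on loop entry,
   the pre-header load is replaced by a move from that equivalence.  */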
9923 /* For communication between note_reg_stored and its caller. */
9924 struct note_reg_stored_arg
9926 int set_seen;
9927 rtx reg;
9930 /* Called via note_stores, record in SET_SEEN whether X, which is written,
9931 is equal to ARG. */
9932 static void
9933 note_reg_stored (x, setter, arg)
9934 rtx x, setter ATTRIBUTE_UNUSED;
9935 void *arg;
9937 struct note_reg_stored_arg *t = (struct note_reg_stored_arg *) arg;
9938 if (t->reg == x)
9939 t->set_seen = 1;
9942 /* Try to replace every occurrence of pseudo REGNO with REPLACEMENT.
9943 There must be exactly one insn that sets this pseudo; it will be
9944 deleted if all replacements succeed and we can prove that the register
9945 is not used after the loop. */
9947 static void
9948 try_copy_prop (loop, replacement, regno)
9949 const struct loop *loop;
9950 rtx replacement;
9951 unsigned int regno;
9953 /* This is the reg that we are copying from. */
9954 rtx reg_rtx = regno_reg_rtx[regno];
9955 rtx init_insn = 0;
9956 rtx insn;
9957 /* These help keep track of whether we replaced all uses of the reg. */
9958 int replaced_last = 0;
9959 int store_is_first = 0;
9961 for (insn = next_insn_in_loop (loop, loop->scan_start);
9962 insn != NULL_RTX;
9963 insn = next_insn_in_loop (loop, insn))
9965 rtx set;
9967 /* Only substitute within one extended basic block from the initializing
9968 insn. */
9969 if (GET_CODE (insn) == CODE_LABEL && init_insn)
9970 break;
9972 if (! INSN_P (insn))
9973 continue;
9975 /* Is this the initializing insn? */
9976 set = single_set (insn);
9977 if (set
9978 && GET_CODE (SET_DEST (set)) == REG
9979 && REGNO (SET_DEST (set)) == regno)
9981 if (init_insn)
9982 abort ();
9984 init_insn = insn;
9985 if (REGNO_FIRST_UID (regno) == INSN_UID (insn))
9986 store_is_first = 1;
9989 /* Only substitute after seeing the initializing insn. */
9990 if (init_insn && insn != init_insn)
9992 struct note_reg_stored_arg arg;
9994 replace_loop_regs (insn, reg_rtx, replacement);
9995 if (REGNO_LAST_UID (regno) == INSN_UID (insn))
9996 replaced_last = 1;
9998 /* Stop replacing when REPLACEMENT is modified. */
9999 arg.reg = replacement;
10000 arg.set_seen = 0;
10001 note_stores (PATTERN (insn), note_reg_stored, &arg);
10002 if (arg.set_seen)
10004 rtx note = find_reg_note (insn, REG_EQUAL, NULL);
10006 /* It is possible that we've turned a previously valid REG_EQUAL note
10007 into an invalid one: the note now mentions REPLACEMENT instead of
10008 REGNO, and since REPLACEMENT is modified here, the equivalence no
longer holds. */
10009 if (note && reg_mentioned_p (replacement, XEXP (note, 0)))
10010 remove_note (insn, note);
10011 break;
10015 if (! init_insn)
10016 abort ();
10017 if (apply_change_group ())
10019 if (loop_dump_stream)
10020 fprintf (loop_dump_stream, " Replaced reg %d", regno);
10021 if (store_is_first && replaced_last)
10023 rtx first;
10024 rtx retval_note;
10026 /* Assume we're just deleting INIT_INSN. */
10027 first = init_insn;
10028 /* Look for REG_RETVAL note. If we're deleting the end of
10029 the libcall sequence, the whole sequence can go. */
10030 retval_note = find_reg_note (init_insn, REG_RETVAL, NULL_RTX);
10031 /* If we found a REG_RETVAL note, find the first instruction
10032 in the sequence. */
10033 if (retval_note)
10034 first = XEXP (retval_note, 0);
10036 /* Delete the instructions. */
10037 loop_delete_insns (first, init_insn);
10039 if (loop_dump_stream)
10040 fprintf (loop_dump_stream, ".\n");
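/* A sketch of a successful replacement, assuming pseudo 80 is REGNO
   and pseudo 100 is REPLACEMENT (numbers illustrative):

     before:
         (set (reg 80) (reg 100))       ;; the initializing insn
         ... (reg 80) ... (reg 80) ...

     after:
         ... (reg 100) ... (reg 100) ...

   The initializing insn (or the libcall sequence it ends) is deleted
   only when it is REG 80's first occurrence and the last occurrence
   was among the replaced uses.  */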
10044 /* Replace all the instructions from FIRST up to and including LAST
10045 with NOTE_INSN_DELETED notes. */
10047 static void
10048 loop_delete_insns (first, last)
10049 rtx first;
10050 rtx last;
10052 while (1)
10054 if (loop_dump_stream)
10055 fprintf (loop_dump_stream, ", deleting init_insn (%d)",
10056 INSN_UID (first));
10057 delete_insn (first);
10059 /* If this was the LAST instructions we're supposed to delete,
10060 we're done. */
10061 if (first == last)
10062 break;
10064 first = NEXT_INSN (first);
10068 /* Try to replace occurrences of pseudo REGNO with REPLACEMENT within
10069 loop LOOP if the order of the sets of these registers can be
10070 swapped. There must be exactly one insn within the loop that sets
10071 this pseudo followed immediately by a move insn that sets
10072 REPLACEMENT with REGNO. */
10073 static void
10074 try_swap_copy_prop (loop, replacement, regno)
10075 const struct loop *loop;
10076 rtx replacement;
10077 unsigned int regno;
10079 rtx insn;
10080 rtx set = NULL_RTX;
10081 unsigned int new_regno;
10083 new_regno = REGNO (replacement);
10085 for (insn = next_insn_in_loop (loop, loop->scan_start);
10086 insn != NULL_RTX;
10087 insn = next_insn_in_loop (loop, insn))
10089 /* Search for the insn that copies REGNO to NEW_REGNO. */
10090 if (INSN_P (insn)
10091 && (set = single_set (insn))
10092 && GET_CODE (SET_DEST (set)) == REG
10093 && REGNO (SET_DEST (set)) == new_regno
10094 && GET_CODE (SET_SRC (set)) == REG
10095 && REGNO (SET_SRC (set)) == regno)
10096 break;
10099 if (insn != NULL_RTX)
10101 rtx prev_insn;
10102 rtx prev_set;
10104 /* Some DEF-USE info would come in handy here to make this
10105 function more general. For now, just check the previous insn
10106 which is the most likely candidate for setting REGNO. */
10108 prev_insn = PREV_INSN (insn);
10110 if (INSN_P (prev_insn)
10111 && (prev_set = single_set (prev_insn))
10112 && GET_CODE (SET_DEST (prev_set)) == REG
10113 && REGNO (SET_DEST (prev_set)) == regno)
10115 /* We have:
10116 (set (reg regno) (expr))
10117 (set (reg new_regno) (reg regno))
10119 so try converting this to:
10120 (set (reg new_regno) (expr))
10121 (set (reg regno) (reg new_regno))
10123 The former construct is often generated when a global
10124 variable used for an induction variable is shadowed by a
10125 register (NEW_REGNO). The latter construct improves the
10126 chances of GIV replacement and BIV elimination. */
10128 validate_change (prev_insn, &SET_DEST (prev_set),
10129 replacement, 1);
10130 validate_change (insn, &SET_DEST (set),
10131 SET_SRC (set), 1);
10132 validate_change (insn, &SET_SRC (set),
10133 replacement, 1);
10135 if (apply_change_group ())
10137 if (loop_dump_stream)
10138 fprintf (loop_dump_stream,
10139 " Swapped set of reg %d at %d with reg %d at %d.\n",
10140 regno, INSN_UID (insn),
10141 new_regno, INSN_UID (prev_insn));
10143 /* Update first use of REGNO. */
10144 if (REGNO_FIRST_UID (regno) == INSN_UID (prev_insn))
10145 REGNO_FIRST_UID (regno) = INSN_UID (insn);
10147 /* Now perform copy propagation to hopefully
10148 remove all uses of REGNO within the loop. */
10149 try_copy_prop (loop, replacement, regno);
10155 /* Replace MEM with its associated pseudo register. This function is
10156 called from load_mems via for_each_rtx. DATA is actually a pointer
10157 to a structure describing the instruction currently being scanned
10158 and the MEM we are currently replacing. */
10160 static int
10161 replace_loop_mem (mem, data)
10162 rtx *mem;
10163 void *data;
10165 loop_replace_args *args = (loop_replace_args *) data;
10166 rtx m = *mem;
10168 if (m == NULL_RTX)
10169 return 0;
10171 switch (GET_CODE (m))
10173 case MEM:
10174 break;
10176 case CONST_DOUBLE:
10177 /* We're not interested in the MEM associated with a
10178 CONST_DOUBLE, so there's no need to traverse into one. */
10179 return -1;
10181 default:
10182 /* This is not a MEM. */
10183 return 0;
10186 if (!rtx_equal_p (args->match, m))
10187 /* This is not the MEM we are currently replacing. */
10188 return 0;
10190 /* Actually replace the MEM. */
10191 validate_change (args->insn, mem, args->replacement, 1);
10193 return 0;
10196 static void
10197 replace_loop_mems (insn, mem, reg)
10198 rtx insn;
10199 rtx mem;
10200 rtx reg;
10202 loop_replace_args args;
10204 args.insn = insn;
10205 args.match = mem;
10206 args.replacement = reg;
10208 for_each_rtx (&insn, replace_loop_mem, &args);
10211 /* Replace one register with another. Called through for_each_rtx; PX points
10212 to the rtx being scanned. DATA is actually a pointer to
10213 a structure of arguments. */
10215 static int
10216 replace_loop_reg (px, data)
10217 rtx *px;
10218 void *data;
10220 rtx x = *px;
10221 loop_replace_args *args = (loop_replace_args *) data;
10223 if (x == NULL_RTX)
10224 return 0;
10226 if (x == args->match)
10227 validate_change (args->insn, px, args->replacement, 1);
10229 return 0;
10232 static void
10233 replace_loop_regs (insn, reg, replacement)
10234 rtx insn;
10235 rtx reg;
10236 rtx replacement;
10238 loop_replace_args args;
10240 args.insn = insn;
10241 args.match = reg;
10242 args.replacement = replacement;
10244 for_each_rtx (&insn, replace_loop_reg, &args);
10247 /* Replace occurrences of the old exit label for the loop with the new
10248 one. DATA is an rtx_pair containing the old and new labels,
10249 respectively. */
10251 static int
10252 replace_label (x, data)
10253 rtx *x;
10254 void *data;
10256 rtx l = *x;
10257 rtx old_label = ((rtx_pair *) data)->r1;
10258 rtx new_label = ((rtx_pair *) data)->r2;
10260 if (l == NULL_RTX)
10261 return 0;
10263 if (GET_CODE (l) != LABEL_REF)
10264 return 0;
10266 if (XEXP (l, 0) != old_label)
10267 return 0;
10269 XEXP (l, 0) = new_label;
10270 ++LABEL_NUSES (new_label);
10271 --LABEL_NUSES (old_label);
10273 return 0;
10276 /* Emit insn for PATTERN after WHERE_INSN in basic block WHERE_BB
10277 (ignored in the interim). */
10279 static rtx
10280 loop_insn_emit_after (loop, where_bb, where_insn, pattern)
10281 const struct loop *loop ATTRIBUTE_UNUSED;
10282 basic_block where_bb ATTRIBUTE_UNUSED;
10283 rtx where_insn;
10284 rtx pattern;
10286 return emit_insn_after (pattern, where_insn);
10290 /* If WHERE_INSN is non-zero emit insn for PATTERN before WHERE_INSN
10291 in basic block WHERE_BB (ignored in the interim) within the loop
10292 otherwise hoist PATTERN into the loop pre-header. */
10294 rtx
10295 loop_insn_emit_before (loop, where_bb, where_insn, pattern)
10296 const struct loop *loop;
10297 basic_block where_bb ATTRIBUTE_UNUSED;
10298 rtx where_insn;
10299 rtx pattern;
10301 if (! where_insn)
10302 return loop_insn_hoist (loop, pattern);
10303 return emit_insn_before (pattern, where_insn);
10307 /* Emit call insn for PATTERN before WHERE_INSN in basic block
10308 WHERE_BB (ignored in the interim) within the loop. */
10310 static rtx
10311 loop_call_insn_emit_before (loop, where_bb, where_insn, pattern)
10312 const struct loop *loop ATTRIBUTE_UNUSED;
10313 basic_block where_bb ATTRIBUTE_UNUSED;
10314 rtx where_insn;
10315 rtx pattern;
10317 return emit_call_insn_before (pattern, where_insn);
10321 /* Hoist insn for PATTERN into the loop pre-header. */
10323 rtx
10324 loop_insn_hoist (loop, pattern)
10325 const struct loop *loop;
10326 rtx pattern;
10328 return loop_insn_emit_before (loop, 0, loop->start, pattern);
10332 /* Hoist call insn for PATTERN into the loop pre-header. */
10334 static rtx
10335 loop_call_insn_hoist (loop, pattern)
10336 const struct loop *loop;
10337 rtx pattern;
10339 return loop_call_insn_emit_before (loop, 0, loop->start, pattern);
10343 /* Sink insn for PATTERN after the loop end. */
10345 rtx
10346 loop_insn_sink (loop, pattern)
10347 const struct loop *loop;
10348 rtx pattern;
10350 return loop_insn_emit_before (loop, 0, loop->sink, pattern);
10354 /* If the loop has multiple exits, emit insn for PATTERN before the
10355 loop to ensure that it will always be executed no matter how the
10356 loop exits. Otherwise, emit the insn for PATTERN after the loop,
10357 since this is slightly more efficient. */
10359 static rtx
10360 loop_insn_sink_or_swim (loop, pattern)
10361 const struct loop *loop;
10362 rtx pattern;
10364 if (loop->exit_count)
10365 return loop_insn_hoist (loop, pattern);
10366 else
10367 return loop_insn_sink (loop, pattern);
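/* A usage sketch (hypothetical caller) for emitting a move whose
   value must be visible however the loop is left:

     loop_insn_sink_or_swim (loop, gen_move_insn (reg, final_value));

   With loop->exit_count == 0 the move lands after the loop end;
   with recorded exits it is hoisted into the pre-header instead.  */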
10370 static void
10371 loop_ivs_dump (loop, file, verbose)
10372 const struct loop *loop;
10373 FILE *file;
10374 int verbose;
10376 struct iv_class *bl;
10377 int iv_num = 0;
10379 if (! loop || ! file)
10380 return;
10382 for (bl = LOOP_IVS (loop)->list; bl; bl = bl->next)
10383 iv_num++;
10385 fprintf (file, "Loop %d: %d IV classes\n", loop->num, iv_num);
10387 for (bl = LOOP_IVS (loop)->list; bl; bl = bl->next)
10389 loop_iv_class_dump (bl, file, verbose);
10390 fputc ('\n', file);
10395 static void
10396 loop_iv_class_dump (bl, file, verbose)
10397 const struct iv_class *bl;
10398 FILE *file;
10399 int verbose ATTRIBUTE_UNUSED;
10401 struct induction *v;
10402 rtx incr;
10403 int i;
10405 if (! bl || ! file)
10406 return;
10408 fprintf (file, "IV class for reg %d, benefit %d\n",
10409 bl->regno, bl->total_benefit);
10411 fprintf (file, " Init insn %d", INSN_UID (bl->init_insn));
10412 if (bl->initial_value)
10414 fprintf (file, ", init val: ");
10415 print_simple_rtl (file, bl->initial_value);
10417 if (bl->initial_test)
10419 fprintf (file, ", init test: ");
10420 print_simple_rtl (file, bl->initial_test);
10422 fputc ('\n', file);
10424 if (bl->final_value)
10426 fprintf (file, " Final val: ");
10427 print_simple_rtl (file, bl->final_value);
10428 fputc ('\n', file);
10431 if ((incr = biv_total_increment (bl)))
10433 fprintf (file, " Total increment: ");
10434 print_simple_rtl (file, incr);
10435 fputc ('\n', file);
10438 /* List the increments. */
10439 for (i = 0, v = bl->biv; v; v = v->next_iv, i++)
10441 fprintf (file, " Inc%d: insn %d, incr: ", i, INSN_UID (v->insn));
10442 print_simple_rtl (file, v->add_val);
10443 fputc ('\n', file);
10446 /* List the givs. */
10447 for (i = 0, v = bl->giv; v; v = v->next_iv, i++)
10449 fprintf (file, " Giv%d: insn %d, benefit %d, ",
10450 i, INSN_UID (v->insn), v->benefit);
10451 if (v->giv_type == DEST_ADDR)
10452 print_simple_rtl (file, v->mem);
10453 else
10454 print_simple_rtl (file, single_set (v->insn));
10455 fputc ('\n', file);
10460 static void
10461 loop_biv_dump (v, file, verbose)
10462 const struct induction *v;
10463 FILE *file;
10464 int verbose;
10466 if (! v || ! file)
10467 return;
10469 fprintf (file,
10470 "Biv %d: insn %d",
10471 REGNO (v->dest_reg), INSN_UID (v->insn));
10472 fprintf (file, " const ");
10473 print_simple_rtl (file, v->add_val);
10475 if (verbose && v->final_value)
10477 fputc ('\n', file);
10478 fprintf (file, " final ");
10479 print_simple_rtl (file, v->final_value);
10482 fputc ('\n', file);
10486 static void
10487 loop_giv_dump (v, file, verbose)
10488 const struct induction *v;
10489 FILE *file;
10490 int verbose;
10492 if (! v || ! file)
10493 return;
10495 if (v->giv_type == DEST_REG)
10496 fprintf (file, "Giv %d: insn %d",
10497 REGNO (v->dest_reg), INSN_UID (v->insn));
10498 else
10499 fprintf (file, "Dest address: insn %d",
10500 INSN_UID (v->insn));
10502 fprintf (file, " src reg %d benefit %d",
10503 REGNO (v->src_reg), v->benefit);
10504 fprintf (file, " lifetime %d",
10505 v->lifetime);
10507 if (v->replaceable)
10508 fprintf (file, " replaceable");
10510 if (v->no_const_addval)
10511 fprintf (file, " ncav");
10513 if (v->ext_dependent)
10515 switch (GET_CODE (v->ext_dependent))
10517 case SIGN_EXTEND:
10518 fprintf (file, " ext se");
10519 break;
10520 case ZERO_EXTEND:
10521 fprintf (file, " ext ze");
10522 break;
10523 case TRUNCATE:
10524 fprintf (file, " ext tr");
10525 break;
10526 default:
10527 abort ();
10531 fputc ('\n', file);
10532 fprintf (file, " mult ");
10533 print_simple_rtl (file, v->mult_val);
10535 fputc ('\n', file);
10536 fprintf (file, " add ");
10537 print_simple_rtl (file, v->add_val);
10539 if (verbose && v->final_value)
10541 fputc ('\n', file);
10542 fprintf (file, " final ");
10543 print_simple_rtl (file, v->final_value);
10546 fputc ('\n', file);
10550 void
10551 debug_ivs (loop)
10552 const struct loop *loop;
10554 loop_ivs_dump (loop, stderr, 1);
10558 void
10559 debug_iv_class (bl)
10560 const struct iv_class *bl;
10562 loop_iv_class_dump (bl, stderr, 1);
10566 void
10567 debug_biv (v)
10568 const struct induction *v;
10570 loop_biv_dump (v, stderr, 1);
10574 void
10575 debug_giv (v)
10576 const struct induction *v;
10578 loop_giv_dump (v, stderr, 1);
10582 #define LOOP_BLOCK_NUM_1(INSN) \
10583 ((INSN) ? (BLOCK_FOR_INSN (INSN) ? BLOCK_NUM (INSN) : - 1) : -1)
10585 /* The notes do not have an assigned block, so look at the next insn. */
10586 #define LOOP_BLOCK_NUM(INSN) \
10587 ((INSN) ? (GET_CODE (INSN) == NOTE \
10588 ? LOOP_BLOCK_NUM_1 (next_nonnote_insn (INSN)) \
10589 : LOOP_BLOCK_NUM_1 (INSN)) \
10590 : -1)
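/* Example: applied to a NOTE_INSN_LOOP_BEG note, LOOP_BLOCK_NUM
   reports the block of the next non-note insn after it, or -1 when
   there is no such insn or no block has been assigned.  */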
10592 #define LOOP_INSN_UID(INSN) ((INSN) ? INSN_UID (INSN) : -1)
10594 static void
10595 loop_dump_aux (loop, file, verbose)
10596 const struct loop *loop;
10597 FILE *file;
10598 int verbose ATTRIBUTE_UNUSED;
10600 rtx label;
10602 if (! loop || ! file)
10603 return;
10605 /* Print diagnostics to compare our concept of a loop with
10606 what the loop notes say. */
10607 if (! PREV_INSN (loop->first->head)
10608 || GET_CODE (PREV_INSN (loop->first->head)) != NOTE
10609 || NOTE_LINE_NUMBER (PREV_INSN (loop->first->head))
10610 != NOTE_INSN_LOOP_BEG)
10611 fprintf (file, ";; No NOTE_INSN_LOOP_BEG at %d\n",
10612 INSN_UID (PREV_INSN (loop->first->head)));
10613 if (! NEXT_INSN (loop->last->end)
10614 || GET_CODE (NEXT_INSN (loop->last->end)) != NOTE
10615 || NOTE_LINE_NUMBER (NEXT_INSN (loop->last->end))
10616 != NOTE_INSN_LOOP_END)
10617 fprintf (file, ";; No NOTE_INSN_LOOP_END at %d\n",
10618 INSN_UID (NEXT_INSN (loop->last->end)));
10620 if (loop->start)
10622 fprintf (file,
10623 ";; start %d (%d), cont dom %d (%d), cont %d (%d), vtop %d (%d), end %d (%d)\n",
10624 LOOP_BLOCK_NUM (loop->start),
10625 LOOP_INSN_UID (loop->start),
10626 LOOP_BLOCK_NUM (loop->cont),
10627 LOOP_INSN_UID (loop->cont),
10628 LOOP_BLOCK_NUM (loop->cont),
10629 LOOP_INSN_UID (loop->cont),
10630 LOOP_BLOCK_NUM (loop->vtop),
10631 LOOP_INSN_UID (loop->vtop),
10632 LOOP_BLOCK_NUM (loop->end),
10633 LOOP_INSN_UID (loop->end));
10634 fprintf (file, ";; top %d (%d), scan start %d (%d)\n",
10635 LOOP_BLOCK_NUM (loop->top),
10636 LOOP_INSN_UID (loop->top),
10637 LOOP_BLOCK_NUM (loop->scan_start),
10638 LOOP_INSN_UID (loop->scan_start));
10639 fprintf (file, ";; exit_count %d", loop->exit_count);
10640 if (loop->exit_count)
10642 fputs (", labels:", file);
10643 for (label = loop->exit_labels; label; label = LABEL_NEXTREF (label))
10645 fprintf (file, " %d ",
10646 LOOP_INSN_UID (XEXP (label, 0)));
10649 fputs ("\n", file);
10651 /* This can happen when a marked loop appears as two nested loops,
10652 say from while (a || b) {}. The inner loop won't match
10653 the loop markers but the outer one will. */
10654 if (LOOP_BLOCK_NUM (loop->cont) != loop->latch->index)
10655 fprintf (file, ";; NOTE_INSN_LOOP_CONT not in loop latch\n");
10659 /* Call this function from the debugger to dump LOOP. */
10661 void
10662 debug_loop (loop)
10663 const struct loop *loop;
10665 flow_loop_dump (loop, stderr, loop_dump_aux, 1);
10668 /* Call this function from the debugger to dump LOOPS. */
10670 void
10671 debug_loops (loops)
10672 const struct loops *loops;
10674 flow_loops_dump (loops, stderr, loop_dump_aux, 1);