gcc/unroll.c

   1 /* Try to unroll loops, and split induction variables.
   2    Copyright (C) 1992, 1993, 1994, 1995, 1997, 1998, 1999, 2000, 2001, 2002
   3    Free Software Foundation, Inc.
   4    Contributed by James E. Wilson, Cygnus Support/UC Berkeley.
   5
   6 This file is part of GCC.
   7
   8 GCC is free software; you can redistribute it and/or modify it under
   9 the terms of the GNU General Public License as published by the Free
  10 Software Foundation; either version 2, or (at your option) any later
  11 version.
  12
  13 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  14 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  15 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  16 for more details.
  17
  18 You should have received a copy of the GNU General Public License
  19 along with GCC; see the file COPYING.  If not, write to the Free
  20 Software Foundation, 59 Temple Place - Suite 330, Boston, MA
  21 02111-1307, USA.  */
  22
  23 /* Try to unroll a loop, and split induction variables.
  24
  25    Loops for which the number of iterations can be calculated exactly are
  26    handled specially.  If the number of iterations times the insn_count is
  27    less than MAX_UNROLLED_INSNS, then the loop is unrolled completely.
  28    Otherwise, we try to unroll the loop a number of times modulo the number
  29    of iterations, so that only one exit test will be needed.  It is unrolled
  30    a number of times approximately equal to MAX_UNROLLED_INSNS divided by
  31    the insn count.
  32
  33    Otherwise, if the number of iterations can be calculated exactly at
  34    run time, and the loop is always entered at the top, then we try to
  35    precondition the loop.  That is, at run time, calculate how many times
  36    the loop will execute, and then execute the loop body a few times so
  37    that the remaining iterations will be some multiple of 4 (or 2 if the
  38    loop is large).  Then fall through to a loop unrolled 4 (or 2) times,
  39    with only one exit test needed at the end of the loop.
  40
  41    Otherwise, if the number of iterations can not be calculated exactly,
  42    not even at run time, then we still unroll the loop a number of times
  43    approximately equal to MAX_UNROLLED_INSNS divided by the insn count,
  44    but there must be an exit test after each copy of the loop body.
  45
  46    For each induction variable, which is dead outside the loop (replaceable)
  47    or for which we can easily calculate the final value, if we can easily
  48    calculate its value at each place where it is set as a function of the
  49    current loop unroll count and the variable's value at loop entry, then
  50    the induction variable is split into `N' different variables, one for
  51    each copy of the loop body.  One variable is live across the backward
  52    branch, and the others are all calculated as a function of this variable.
  53    This helps eliminate data dependencies, and leads to further opportunities
  54    for cse.  */
  55
  56 /* Possible improvements follow:  */
  57
  58 /* ??? Add an extra pass somewhere to determine whether unrolling will
  59    give any benefit.  E.g. after generating all unrolled insns, compute the
  60    cost of all insns and compare against cost of insns in rolled loop.
  61
  62    - On traditional architectures, unrolling a non-constant bound loop
  63      is a win if there is a giv whose only use is in memory addresses, the
  64      memory addresses can be split, and hence giv increments can be
  65      eliminated.
  66    - It is also a win if the loop is executed many times, and preconditioning
  67      can be performed for the loop.
  68    Add code to check for these and similar cases.  */
  69
  70 /* ??? Improve control of which loops get unrolled.  Could use profiling
  71    info to only unroll the most commonly executed loops.  Perhaps have
  72    a user specifyable option to control the amount of code expansion,
  73    or the percent of loops to consider for unrolling.  Etc.  */
  74
  75 /* ??? Look at the register copies inside the loop to see if they form a
  76    simple permutation.  If so, iterate the permutation until it gets back to
  77    the start state.  This is how many times we should unroll the loop, for
  78    best results, because then all register copies can be eliminated.
  79    For example, the lisp nreverse function should be unrolled 3 times
  80    while (this)
  81      {
  82        next = this->cdr;
  83        this->cdr = prev;
  84        prev = this;
  85        this = next;
  86      }
  87
  88    ??? The number of times to unroll the loop may also be based on data
  89    references in the loop.  For example, if we have a loop that references
  90    x[i-1], x[i], and x[i+1], we should unroll it a multiple of 3 times.  */
  91
  92 /* ??? Add some simple linear equation solving capability so that we can
  93    determine the number of loop iterations for more complex loops.
  94    For example, consider this loop from gdb
  95    #define SWAP_TARGET_AND_HOST(buffer,len)
  96      {
  97        char tmp;
  98        char *p = (char *) buffer;
  99        char *q = ((char *) buffer) + len - 1;
 100        int iterations = (len + 1) >> 1;
 101        int i;
 102        for (p; p < q; p++, q--;)
 103          {
 104            tmp = *q;
 105            *q = *p;
 106            *p = tmp;
 107          }
 108      }
 109    Note that:
 110      start value = p = &buffer + current_iteration
 111      end value   = q = &buffer + len - 1 - current_iteration
 112    Given the loop exit test of "p < q", then there must be "q - p" iterations,
 113    set equal to zero and solve for number of iterations:
 114      q - p = len - 1 - 2*current_iteration = 0
 115      current_iteration = (len - 1) / 2
 116    Hence, there are (len - 1) / 2 (rounded up to the nearest integer)
 117    iterations of this loop.  */
 118
 119 /* ??? Currently, no labels are marked as loop invariant when doing loop
 120    unrolling.  This is because an insn inside the loop, that loads the address
 121    of a label inside the loop into a register, could be moved outside the loop
 122    by the invariant code motion pass if labels were invariant.  If the loop
 123    is subsequently unrolled, the code will be wrong because each unrolled
 124    body of the loop will use the same address, whereas each actually needs a
 125    different address.  A case where this happens is when a loop containing
 126    a switch statement is unrolled.
 127
 128    It would be better to let labels be considered invariant.  When we
 129    unroll loops here, check to see if any insns using a label local to the
 130    loop were moved before the loop.  If so, then correct the problem, by
 131    moving the insn back into the loop, or perhaps replicate the insn before
 132    the loop, one copy for each time the loop is unrolled.  */
 133
 134 #include "config.h"
 135 #include "system.h"
 136 #include "rtl.h"
 137 #include "tm_p.h"
 138 #include "insn-config.h"
 139 #include "integrate.h"
 140 #include "regs.h"
 141 #include "recog.h"
 142 #include "flags.h"
 143 #include "function.h"
 144 #include "expr.h"
 145 #include "loop.h"
 146 #include "toplev.h"
 147 #include "hard-reg-set.h"
 148 #include "basic-block.h"
 149 #include "predict.h"
 150 #include "params.h"
 151
 152 /* The prime factors looked for when trying to unroll a loop by some
 153    number which is modulo the total number of iterations.  Just checking
 154    for these 4 prime factors will find at least one factor for 75% of
 155    all numbers theoretically.  Practically speaking, this will succeed
 156    almost all of the time since loops are generally a multiple of 2
 157    and/or 5.  */
 158
 159 #define NUM_FACTORS 4
 160
 161 static struct _factor { const int factor; int count; }
 162 factors[NUM_FACTORS] = { {2, 0}, {3, 0}, {5, 0}, {7, 0}};
 163
 164 /* Describes the different types of loop unrolling performed.  */
 165
 166 enum unroll_types
 167 {
 168   UNROLL_COMPLETELY,
 169   UNROLL_MODULO,
 170   UNROLL_NAIVE
 171 };
 172
 173 /* Indexed by register number, if non-zero, then it contains a pointer
 174    to a struct induction for a DEST_REG giv which has been combined with
 175    one of more address givs.  This is needed because whenever such a DEST_REG
 176    giv is modified, we must modify the value of all split address givs
 177    that were combined with this DEST_REG giv.  */
 178
 179 static struct induction **addr_combined_regs;
 180
 181 /* Indexed by register number, if this is a splittable induction variable,
 182    then this will hold the current value of the register, which depends on the
 183    iteration number.  */
 184
 185 static rtx *splittable_regs;
 186
 187 /* Indexed by register number, if this is a splittable induction variable,
 188    then this will hold the number of instructions in the loop that modify
 189    the induction variable.  Used to ensure that only the last insn modifying
 190    a split iv will update the original iv of the dest.  */
 191
 192 static int *splittable_regs_updates;
 193
 194 /* Forward declarations.  */
 195
 196 static void init_reg_map PARAMS ((struct inline_remap *, int));
 197 static rtx calculate_giv_inc PARAMS ((rtx, rtx, unsigned int));
 198 static rtx initial_reg_note_copy PARAMS ((rtx, struct inline_remap *));
 199 static void final_reg_note_copy PARAMS ((rtx *, struct inline_remap *));
 200 static void copy_loop_body PARAMS ((struct loop *, rtx, rtx,
 201                                     struct inline_remap *, rtx, int,
 202                                     enum unroll_types, rtx, rtx, rtx, rtx));
 203 static int find_splittable_regs PARAMS ((const struct loop *,
 204                                          enum unroll_types, int));
 205 static int find_splittable_givs PARAMS ((const struct loop *,
 206                                          struct iv_class *, enum unroll_types,
 207                                          rtx, int));
 208 static int reg_dead_after_loop PARAMS ((const struct loop *, rtx));
 209 static rtx fold_rtx_mult_add PARAMS ((rtx, rtx, rtx, enum machine_mode));
 210 static int verify_addresses PARAMS ((struct induction *, rtx, int));
 211 static rtx remap_split_bivs PARAMS ((struct loop *, rtx));
 212 static rtx find_common_reg_term PARAMS ((rtx, rtx));
 213 static rtx subtract_reg_term PARAMS ((rtx, rtx));
 214 static rtx loop_find_equiv_value PARAMS ((const struct loop *, rtx));
 215 static rtx ujump_to_loop_cont PARAMS ((rtx, rtx));
 216
 217 /* Try to unroll one loop and split induction variables in the loop.
 218
 219    The loop is described by the arguments LOOP and INSN_COUNT.
 220    STRENGTH_REDUCTION_P indicates whether information generated in the
 221    strength reduction pass is available.
 222
 223    This function is intended to be called from within `strength_reduce'
 224    in loop.c.  */
 225
 226 void
 227 unroll_loop (loop, insn_count, strength_reduce_p)
 228      struct loop *loop;
 229      int insn_count;
 230      int strength_reduce_p;
 231 {
 232   struct loop_info *loop_info = LOOP_INFO (loop);
 233   struct loop_ivs *ivs = LOOP_IVS (loop);
 234   int i, j;
 235   unsigned int r;
 236   unsigned HOST_WIDE_INT temp;
 237   int unroll_number = 1;
 238   rtx copy_start, copy_end;
 239   rtx insn, sequence, pattern, tem;
 240   int max_labelno, max_insnno;
 241   rtx insert_before;
 242   struct inline_remap *map;
 243   char *local_label = NULL;
 244   char *local_regno;
 245   unsigned int max_local_regnum;
 246   unsigned int maxregnum;
 247   rtx exit_label = 0;
 248   rtx start_label;
 249   struct iv_class *bl;
 250   int splitting_not_safe = 0;
 251   enum unroll_types unroll_type = UNROLL_NAIVE;
 252   int loop_preconditioned = 0;
 253   rtx safety_label;
 254   /* This points to the last real insn in the loop, which should be either
 255      a JUMP_INSN (for conditional jumps) or a BARRIER (for unconditional
 256      jumps).  */
 257   rtx last_loop_insn;
 258   rtx loop_start = loop->start;
 259   rtx loop_end = loop->end;
 260
 261   /* Don't bother unrolling huge loops.  Since the minimum factor is
 262      two, loops greater than one half of MAX_UNROLLED_INSNS will never
 263      be unrolled.  */
 264   if (insn_count > MAX_UNROLLED_INSNS / 2)
 265     {
 266       if (loop_dump_stream)
 267         fprintf (loop_dump_stream, "Unrolling failure: Loop too big.\n");
 268       return;
 269     }
 270
 271   /* Determine type of unroll to perform.  Depends on the number of iterations
 272      and the size of the loop.  */
 273
 274   /* If there is no strength reduce info, then set
 275      loop_info->n_iterations to zero.  This can happen if
 276      strength_reduce can't find any bivs in the loop.  A value of zero
 277      indicates that the number of iterations could not be calculated.  */
 278
 279   if (! strength_reduce_p)
 280     loop_info->n_iterations = 0;
 281
 282   if (loop_dump_stream && loop_info->n_iterations > 0)
 283     {
 284       fputs ("Loop unrolling: ", loop_dump_stream);
 285       fprintf (loop_dump_stream, HOST_WIDE_INT_PRINT_DEC,
 286                loop_info->n_iterations);
 287       fputs (" iterations.\n", loop_dump_stream);
 288     }
 289
 290   /* Find and save a pointer to the last nonnote insn in the loop.  */
 291
 292   last_loop_insn = prev_nonnote_insn (loop_end);
 293
 294   /* Calculate how many times to unroll the loop.  Indicate whether or
 295      not the loop is being completely unrolled.  */
 296
 297   if (loop_info->n_iterations == 1)
 298     {
 299       /* Handle the case where the loop begins with an unconditional
 300          jump to the loop condition.  Make sure to delete the jump
 301          insn, otherwise the loop body will never execute.  */
 302
 303       rtx ujump = ujump_to_loop_cont (loop->start, loop->cont);
 304       if (ujump)
 305         delete_related_insns (ujump);
 306
 307       /* If number of iterations is exactly 1, then eliminate the compare and
 308          branch at the end of the loop since they will never be taken.
 309          Then return, since no other action is needed here.  */
 310
 311       /* If the last instruction is not a BARRIER or a JUMP_INSN, then
 312          don't do anything.  */
 313
 314       if (GET_CODE (last_loop_insn) == BARRIER)
 315         {
 316           /* Delete the jump insn.  This will delete the barrier also.  */
 317           delete_related_insns (PREV_INSN (last_loop_insn));
 318         }
 319       else if (GET_CODE (last_loop_insn) == JUMP_INSN)
 320         {
 321 #ifdef HAVE_cc0
 322           rtx prev = PREV_INSN (last_loop_insn);
 323 #endif
 324           delete_related_insns (last_loop_insn);
 325 #ifdef HAVE_cc0
 326           /* The immediately preceding insn may be a compare which must be
 327              deleted.  */
 328           if (only_sets_cc0_p (prev))
 329             delete_related_insns (prev);
 330 #endif
 331         }
 332
 333       /* Remove the loop notes since this is no longer a loop.  */
 334       if (loop->vtop)
 335         delete_related_insns (loop->vtop);
 336       if (loop->cont)
 337         delete_related_insns (loop->cont);
 338       if (loop_start)
 339         delete_related_insns (loop_start);
 340       if (loop_end)
 341         delete_related_insns (loop_end);
 342
 343       return;
 344     }
 345   else if (loop_info->n_iterations > 0
 346            /* Avoid overflow in the next expression.  */
 347            && loop_info->n_iterations < MAX_UNROLLED_INSNS
 348            && loop_info->n_iterations * insn_count < MAX_UNROLLED_INSNS)
 349     {
 350       unroll_number = loop_info->n_iterations;
 351       unroll_type = UNROLL_COMPLETELY;
 352     }
 353   else if (loop_info->n_iterations > 0)
 354     {
 355       /* Try to factor the number of iterations.  Don't bother with the
 356          general case, only using 2, 3, 5, and 7 will get 75% of all
 357          numbers theoretically, and almost all in practice.  */
 358
 359       for (i = 0; i < NUM_FACTORS; i++)
 360         factors[i].count = 0;
 361
 362       temp = loop_info->n_iterations;
 363       for (i = NUM_FACTORS - 1; i >= 0; i--)
 364         while (temp % factors[i].factor == 0)
 365           {
 366             factors[i].count++;
 367             temp = temp / factors[i].factor;
 368           }
 369
 370       /* Start with the larger factors first so that we generally
 371          get lots of unrolling.  */
 372
 373       unroll_number = 1;
 374       temp = insn_count;
 375       for (i = 3; i >= 0; i--)
 376         while (factors[i].count--)
 377           {
 378             if (temp * factors[i].factor < MAX_UNROLLED_INSNS)
 379               {
 380                 unroll_number *= factors[i].factor;
 381                 temp *= factors[i].factor;
 382               }
 383             else
 384               break;
 385           }
 386
 387       /* If we couldn't find any factors, then unroll as in the normal
 388          case.  */
 389       if (unroll_number == 1)
 390         {
 391           if (loop_dump_stream)
 392             fprintf (loop_dump_stream, "Loop unrolling: No factors found.\n");
 393         }
 394       else
 395         unroll_type = UNROLL_MODULO;
 396     }
 397
 398   /* Default case, calculate number of times to unroll loop based on its
 399      size.  */
 400   if (unroll_type == UNROLL_NAIVE)
 401     {
 402       if (8 * insn_count < MAX_UNROLLED_INSNS)
 403         unroll_number = 8;
 404       else if (4 * insn_count < MAX_UNROLLED_INSNS)
 405         unroll_number = 4;
 406       else
 407         unroll_number = 2;
 408     }
 409
 410   /* Now we know how many times to unroll the loop.  */
 411
 412   if (loop_dump_stream)
 413     fprintf (loop_dump_stream, "Unrolling loop %d times.\n", unroll_number);
 414
 415   if (unroll_type == UNROLL_COMPLETELY || unroll_type == UNROLL_MODULO)
 416     {
 417       /* Loops of these types can start with jump down to the exit condition
 418          in rare circumstances.
 419
 420          Consider a pair of nested loops where the inner loop is part
 421          of the exit code for the outer loop.
 422
 423          In this case jump.c will not duplicate the exit test for the outer
 424          loop, so it will start with a jump to the exit code.
 425
 426          Then consider if the inner loop turns out to iterate once and
 427          only once.  We will end up deleting the jumps associated with
 428          the inner loop.  However, the loop notes are not removed from
 429          the instruction stream.
 430
 431          And finally assume that we can compute the number of iterations
 432          for the outer loop.
 433
 434          In this case unroll may want to unroll the outer loop even though
 435          it starts with a jump to the outer loop's exit code.
 436
 437          We could try to optimize this case, but it hardly seems worth it.
 438          Just return without unrolling the loop in such cases.  */
 439
 440       insn = loop_start;
 441       while (GET_CODE (insn) != CODE_LABEL && GET_CODE (insn) != JUMP_INSN)
 442         insn = NEXT_INSN (insn);
 443       if (GET_CODE (insn) == JUMP_INSN)
 444         return;
 445     }
 446
 447   if (unroll_type == UNROLL_COMPLETELY)
 448     {
 449       /* Completely unrolling the loop:  Delete the compare and branch at
 450          the end (the last two instructions).   This delete must done at the
 451          very end of loop unrolling, to avoid problems with calls to
 452          back_branch_in_range_p, which is called by find_splittable_regs.
 453          All increments of splittable bivs/givs are changed to load constant
 454          instructions.  */
 455
 456       copy_start = loop_start;
 457
 458       /* Set insert_before to the instruction immediately after the JUMP_INSN
 459          (or BARRIER), so that any NOTEs between the JUMP_INSN and the end of
 460          the loop will be correctly handled by copy_loop_body.  */
 461       insert_before = NEXT_INSN (last_loop_insn);
 462
 463       /* Set copy_end to the insn before the jump at the end of the loop.  */
 464       if (GET_CODE (last_loop_insn) == BARRIER)
 465         copy_end = PREV_INSN (PREV_INSN (last_loop_insn));
 466       else if (GET_CODE (last_loop_insn) == JUMP_INSN)
 467         {
 468           copy_end = PREV_INSN (last_loop_insn);
 469 #ifdef HAVE_cc0
 470           /* The instruction immediately before the JUMP_INSN may be a compare
 471              instruction which we do not want to copy.  */
 472           if (sets_cc0_p (PREV_INSN (copy_end)))
 473             copy_end = PREV_INSN (copy_end);
 474 #endif
 475         }
 476       else
 477         {
 478           /* We currently can't unroll a loop if it doesn't end with a
 479              JUMP_INSN.  There would need to be a mechanism that recognizes
 480              this case, and then inserts a jump after each loop body, which
 481              jumps to after the last loop body.  */
 482           if (loop_dump_stream)
 483             fprintf (loop_dump_stream,
 484                      "Unrolling failure: loop does not end with a JUMP_INSN.\n");
 485           return;
 486         }
 487     }
 488   else if (unroll_type == UNROLL_MODULO)
 489     {
 490       /* Partially unrolling the loop:  The compare and branch at the end
 491          (the last two instructions) must remain.  Don't copy the compare
 492          and branch instructions at the end of the loop.  Insert the unrolled
 493          code immediately before the compare/branch at the end so that the
 494          code will fall through to them as before.  */
 495
 496       copy_start = loop_start;
 497
 498       /* Set insert_before to the jump insn at the end of the loop.
 499          Set copy_end to before the jump insn at the end of the loop.  */
 500       if (GET_CODE (last_loop_insn) == BARRIER)
 501         {
 502           insert_before = PREV_INSN (last_loop_insn);
 503           copy_end = PREV_INSN (insert_before);
 504         }
 505       else if (GET_CODE (last_loop_insn) == JUMP_INSN)
 506         {
 507           insert_before = last_loop_insn;
 508 #ifdef HAVE_cc0
 509           /* The instruction immediately before the JUMP_INSN may be a compare
 510              instruction which we do not want to copy or delete.  */
 511           if (sets_cc0_p (PREV_INSN (insert_before)))
 512             insert_before = PREV_INSN (insert_before);
 513 #endif
 514           copy_end = PREV_INSN (insert_before);
 515         }
 516       else
 517         {
 518           /* We currently can't unroll a loop if it doesn't end with a
 519              JUMP_INSN.  There would need to be a mechanism that recognizes
 520              this case, and then inserts a jump after each loop body, which
 521              jumps to after the last loop body.  */
 522           if (loop_dump_stream)
 523             fprintf (loop_dump_stream,
 524                      "Unrolling failure: loop does not end with a JUMP_INSN.\n");
 525           return;
 526         }
 527     }
 528   else
 529     {
 530       /* Normal case: Must copy the compare and branch instructions at the
 531          end of the loop.  */
 532
 533       if (GET_CODE (last_loop_insn) == BARRIER)
 534         {
 535           /* Loop ends with an unconditional jump and a barrier.
 536              Handle this like above, don't copy jump and barrier.
 537              This is not strictly necessary, but doing so prevents generating
 538              unconditional jumps to an immediately following label.
 539
 540              This will be corrected below if the target of this jump is
 541              not the start_label.  */
 542
 543           insert_before = PREV_INSN (last_loop_insn);
 544           copy_end = PREV_INSN (insert_before);
 545         }
 546       else if (GET_CODE (last_loop_insn) == JUMP_INSN)
 547         {
 548           /* Set insert_before to immediately after the JUMP_INSN, so that
 549              NOTEs at the end of the loop will be correctly handled by
 550              copy_loop_body.  */
 551           insert_before = NEXT_INSN (last_loop_insn);
 552           copy_end = last_loop_insn;
 553         }
 554       else
 555         {
 556           /* We currently can't unroll a loop if it doesn't end with a
 557              JUMP_INSN.  There would need to be a mechanism that recognizes
 558              this case, and then inserts a jump after each loop body, which
 559              jumps to after the last loop body.  */
 560           if (loop_dump_stream)
 561             fprintf (loop_dump_stream,
 562                      "Unrolling failure: loop does not end with a JUMP_INSN.\n");
 563           return;
 564         }
 565
 566       /* If copying exit test branches because they can not be eliminated,
 567          then must convert the fall through case of the branch to a jump past
 568          the end of the loop.  Create a label to emit after the loop and save
 569          it for later use.  Do not use the label after the loop, if any, since
 570          it might be used by insns outside the loop, or there might be insns
 571          added before it later by final_[bg]iv_value which must be after
 572          the real exit label.  */
 573       exit_label = gen_label_rtx ();
 574
 575       insn = loop_start;
 576       while (GET_CODE (insn) != CODE_LABEL && GET_CODE (insn) != JUMP_INSN)
 577         insn = NEXT_INSN (insn);
 578
 579       if (GET_CODE (insn) == JUMP_INSN)
 580         {
 581           /* The loop starts with a jump down to the exit condition test.
 582              Start copying the loop after the barrier following this
 583              jump insn.  */
 584           copy_start = NEXT_INSN (insn);
 585
 586           /* Splitting induction variables doesn't work when the loop is
 587              entered via a jump to the bottom, because then we end up doing
 588              a comparison against a new register for a split variable, but
 589              we did not execute the set insn for the new register because
 590              it was skipped over.  */
 591           splitting_not_safe = 1;
 592           if (loop_dump_stream)
 593             fprintf (loop_dump_stream,
 594                      "Splitting not safe, because loop not entered at top.\n");
 595         }
 596       else
 597         copy_start = loop_start;
 598     }
 599
 600   /* This should always be the first label in the loop.  */
 601   start_label = NEXT_INSN (copy_start);
 602   /* There may be a line number note and/or a loop continue note here.  */
 603   while (GET_CODE (start_label) == NOTE)
 604     start_label = NEXT_INSN (start_label);
 605   if (GET_CODE (start_label) != CODE_LABEL)
 606     {
 607       /* This can happen as a result of jump threading.  If the first insns in
 608          the loop test the same condition as the loop's backward jump, or the
 609          opposite condition, then the backward jump will be modified to point
 610          to elsewhere, and the loop's start label is deleted.
 611
 612          This case currently can not be handled by the loop unrolling code.  */
 613
 614       if (loop_dump_stream)
 615         fprintf (loop_dump_stream,
 616                  "Unrolling failure: unknown insns between BEG note and loop label.\n");
 617       return;
 618     }
 619   if (LABEL_NAME (start_label))
 620     {
 621       /* The jump optimization pass must have combined the original start label
 622          with a named label for a goto.  We can't unroll this case because
 623          jumps which go to the named label must be handled differently than
 624          jumps to the loop start, and it is impossible to differentiate them
 625          in this case.  */
 626       if (loop_dump_stream)
 627         fprintf (loop_dump_stream,
 628                  "Unrolling failure: loop start label is gone\n");
 629       return;
 630     }
 631
 632   if (unroll_type == UNROLL_NAIVE
 633       && GET_CODE (last_loop_insn) == BARRIER
 634       && GET_CODE (PREV_INSN (last_loop_insn)) == JUMP_INSN
 635       && start_label != JUMP_LABEL (PREV_INSN (last_loop_insn)))
 636     {
 637       /* In this case, we must copy the jump and barrier, because they will
 638          not be converted to jumps to an immediately following label.  */
 639
 640       insert_before = NEXT_INSN (last_loop_insn);
 641       copy_end = last_loop_insn;
 642     }
 643
 644   if (unroll_type == UNROLL_NAIVE
 645       && GET_CODE (last_loop_insn) == JUMP_INSN
 646       && start_label != JUMP_LABEL (last_loop_insn))
 647     {
 648       /* ??? The loop ends with a conditional branch that does not branch back
 649          to the loop start label.  In this case, we must emit an unconditional
 650          branch to the loop exit after emitting the final branch.
 651          copy_loop_body does not have support for this currently, so we
 652          give up.  It doesn't seem worthwhile to unroll anyways since
 653          unrolling would increase the number of branch instructions
 654          executed.  */
 655       if (loop_dump_stream)
 656         fprintf (loop_dump_stream,
 657                  "Unrolling failure: final conditional branch not to loop start\n");
 658       return;
 659     }
 660
 661   /* Allocate a translation table for the labels and insn numbers.
 662      They will be filled in as we copy the insns in the loop.  */
 663
 664   max_labelno = max_label_num ();
 665   max_insnno = get_max_uid ();
 666
 667   /* Various paths through the unroll code may reach the "egress" label
 668      without initializing fields within the map structure.
 669
 670      To be safe, we use xcalloc to zero the memory.  */
 671   map = (struct inline_remap *) xcalloc (1, sizeof (struct inline_remap));
 672
 673   /* Allocate the label map.  */
 674
 675   if (max_labelno > 0)
 676     {
 677       map->label_map = (rtx *) xcalloc (max_labelno, sizeof (rtx));
 678       local_label = (char *) xcalloc (max_labelno, sizeof (char));
 679     }
 680
 681   /* Search the loop and mark all local labels, i.e. the ones which have to
 682      be distinct labels when copied.  For all labels which might be
 683      non-local, set their label_map entries to point to themselves.
 684      If they happen to be local their label_map entries will be overwritten
 685      before the loop body is copied.  The label_map entries for local labels
 686      will be set to a different value each time the loop body is copied.  */
 687
 688   for (insn = copy_start; insn != loop_end; insn = NEXT_INSN (insn))
 689     {
 690       rtx note;
 691
 692       if (GET_CODE (insn) == CODE_LABEL)
 693         local_label[CODE_LABEL_NUMBER (insn)] = 1;
 694       else if (GET_CODE (insn) == JUMP_INSN)
 695         {
 696           if (JUMP_LABEL (insn))
 697             set_label_in_map (map,
 698                               CODE_LABEL_NUMBER (JUMP_LABEL (insn)),
 699                               JUMP_LABEL (insn));
 700           else if (GET_CODE (PATTERN (insn)) == ADDR_VEC
 701                    || GET_CODE (PATTERN (insn)) == ADDR_DIFF_VEC)
 702             {
 703               rtx pat = PATTERN (insn);
 704               int diff_vec_p = GET_CODE (PATTERN (insn)) == ADDR_DIFF_VEC;
 705               int len = XVECLEN (pat, diff_vec_p);
 706               rtx label;
 707
 708               for (i = 0; i < len; i++)
 709                 {
 710                   label = XEXP (XVECEXP (pat, diff_vec_p, i), 0);
 711                   set_label_in_map (map, CODE_LABEL_NUMBER (label), label);
 712                 }
 713             }
 714         }
 715       if ((note = find_reg_note (insn, REG_LABEL, NULL_RTX)))
 716         set_label_in_map (map, CODE_LABEL_NUMBER (XEXP (note, 0)),
 717                           XEXP (note, 0));
 718     }
 719
 720   /* Allocate space for the insn map.  */
 721
 722   map->insn_map = (rtx *) xmalloc (max_insnno * sizeof (rtx));
 723
 724   /* Set this to zero, to indicate that we are doing loop unrolling,
 725      not function inlining.  */
 726   map->inline_target = 0;
 727
 728   /* The register and constant maps depend on the number of registers
 729      present, so the final maps can't be created until after
 730      find_splittable_regs is called.  However, they are needed for
 731      preconditioning, so we create temporary maps when preconditioning
 732      is performed.  */
 733
 734   /* The preconditioning code may allocate two new pseudo registers.  */
 735   maxregnum = max_reg_num ();
 736
 737   /* local_regno is only valid for regnos < max_local_regnum.  */
 738   max_local_regnum = maxregnum;
 739
 740   /* Allocate and zero out the splittable_regs and addr_combined_regs
 741      arrays.  These must be zeroed here because they will be used if
 742      loop preconditioning is performed, and must be zero for that case.
 743
 744      It is safe to do this here, since the extra registers created by the
 745      preconditioning code and find_splittable_regs will never be used
 746      to access the splittable_regs[] and addr_combined_regs[] arrays.  */
 747
 748   splittable_regs = (rtx *) xcalloc (maxregnum, sizeof (rtx));
 749   splittable_regs_updates = (int *) xcalloc (maxregnum, sizeof (int));
 750   addr_combined_regs
 751     = (struct induction **) xcalloc (maxregnum, sizeof (struct induction *));
 752   local_regno = (char *) xcalloc (maxregnum, sizeof (char));
 753
 754   /* Mark all local registers, i.e. the ones which are referenced only
 755      inside the loop.  */
 756   if (INSN_UID (copy_end) < max_uid_for_loop)
 757     {
 758       int copy_start_luid = INSN_LUID (copy_start);
 759       int copy_end_luid = INSN_LUID (copy_end);
 760
 761       /* If a register is used in the jump insn, we must not duplicate it
 762          since it will also be used outside the loop.  */
 763       if (GET_CODE (copy_end) == JUMP_INSN)
 764         copy_end_luid--;
 765
 766       /* If we have a target that uses cc0, then we also must not duplicate
 767          the insn that sets cc0 before the jump insn, if one is present.  */
 768 #ifdef HAVE_cc0
 769       if (GET_CODE (copy_end) == JUMP_INSN
 770           && sets_cc0_p (PREV_INSN (copy_end)))
 771         copy_end_luid--;
 772 #endif
 773
 774       /* If copy_start points to the NOTE that starts the loop, then we must
 775          use the next luid, because invariant pseudo-regs moved out of the loop
 776          have their lifetimes modified to start here, but they are not safe
 777          to duplicate.  */
 778       if (copy_start == loop_start)
 779         copy_start_luid++;
 780
 781       /* If a pseudo's lifetime is entirely contained within this loop, then we
 782          can use a different pseudo in each unrolled copy of the loop.  This
 783          results in better code.  */
 784       /* We must limit the generic test to max_reg_before_loop, because only
 785          these pseudo registers have valid regno_first_uid info.  */
 786       for (r = FIRST_PSEUDO_REGISTER; r < max_reg_before_loop; ++r)
 787         if (REGNO_FIRST_UID (r) > 0 && REGNO_FIRST_UID (r) <= max_uid_for_loop
 788             && REGNO_FIRST_LUID (r) >= copy_start_luid
 789             && REGNO_LAST_UID (r) > 0 && REGNO_LAST_UID (r) <= max_uid_for_loop
 790             && REGNO_LAST_LUID (r) <= copy_end_luid)
 791           {
 792             /* However, we must also check for loop-carried dependencies.
 793                If the value the pseudo has at the end of iteration X is
 794                used by iteration X+1, then we can not use a different pseudo
 795                for each unrolled copy of the loop.  */
 796             /* A pseudo is safe if regno_first_uid is a set, and this
 797                set dominates all instructions from regno_first_uid to
 798                regno_last_uid.  */
 799             /* ??? This check is simplistic.  We would get better code if
 800                this check was more sophisticated.  */
 801             if (set_dominates_use (r, REGNO_FIRST_UID (r), REGNO_LAST_UID (r),
 802                                    copy_start, copy_end))
 803               local_regno[r] = 1;
 804
 805             if (loop_dump_stream)
 806               {
 807                 if (local_regno[r])
 808                   fprintf (loop_dump_stream, "Marked reg %d as local\n", r);
 809                 else
 810                   fprintf (loop_dump_stream, "Did not mark reg %d as local\n",
 811                            r);
 812               }
 813           }
 814     }
 815
 816   /* If this loop requires exit tests when unrolled, check to see if we
 817      can precondition the loop so as to make the exit tests unnecessary.
 818      Just like variable splitting, this is not safe if the loop is entered
 819      via a jump to the bottom.  Also, can not do this if no strength
 820      reduce info, because precondition_loop_p uses this info.  */
 821
 822   /* Must copy the loop body for preconditioning before the following
 823      find_splittable_regs call since that will emit insns which need to
 824      be after the preconditioned loop copies, but immediately before the
 825      unrolled loop copies.  */
 826
 827   /* Also, it is not safe to split induction variables for the preconditioned
 828      copies of the loop body.  If we split induction variables, then the code
 829      assumes that each induction variable can be represented as a function
 830      of its initial value and the loop iteration number.  This is not true
 831      in this case, because the last preconditioned copy of the loop body
 832      could be any iteration from the first up to the `unroll_number-1'th,
 833      depending on the initial value of the iteration variable.  Therefore
 834      we can not split induction variables here, because we can not calculate
 835      their value.  Hence, this code must occur before find_splittable_regs
 836      is called.  */
 837
 838   if (unroll_type == UNROLL_NAIVE && ! splitting_not_safe && strength_reduce_p)
 839     {
 840       rtx initial_value, final_value, increment;
 841       enum machine_mode mode;
 842
 843       if (precondition_loop_p (loop,
 844                                &initial_value, &final_value, &increment,
 845                                &mode))
 846         {
 847           rtx diff;
 848           rtx *labels;
 849           int abs_inc, neg_inc;
 850           enum rtx_code cc = loop_info->comparison_code;
 851           int less_p     = (cc == LE  || cc == LEU || cc == LT  || cc == LTU);
 852           int unsigned_p = (cc == LEU || cc == GEU || cc == LTU || cc == GTU);
 853
 854           map->reg_map = (rtx *) xmalloc (maxregnum * sizeof (rtx));
 855
 856           VARRAY_CONST_EQUIV_INIT (map->const_equiv_varray, maxregnum,
 857                                    "unroll_loop_precondition");
 858           global_const_equiv_varray = map->const_equiv_varray;
 859
 860           init_reg_map (map, maxregnum);
 861
 862           /* Limit loop unrolling to 4, since this will make 7 copies of
 863              the loop body.  */
 864           if (unroll_number > 4)
 865             unroll_number = 4;
 866
 867           /* Save the absolute value of the increment, and also whether or
 868              not it is negative.  */
 869           neg_inc = 0;
 870           abs_inc = INTVAL (increment);
 871           if (abs_inc < 0)
 872             {
 873               abs_inc = -abs_inc;
 874               neg_inc = 1;
 875             }
 876
 877           start_sequence ();
 878
 879           /* Final value may have form of (PLUS val1 const1_rtx).  We need
 880              to convert it into general operand, so compute the real value.  */
 881
 882           if (GET_CODE (final_value) == PLUS)
 883             {
 884               final_value = expand_simple_binop (mode, PLUS,
 885                                                  copy_rtx (XEXP (final_value, 0)),
 886                                                  copy_rtx (XEXP (final_value, 1)),
 887                                                  NULL_RTX, 0, OPTAB_LIB_WIDEN);
 888             }
 889           if (!nonmemory_operand (final_value, VOIDmode))
 890             final_value = force_reg (mode, copy_rtx (final_value));
 891
 892           /* Calculate the difference between the final and initial values.
 893              Final value may be a (plus (reg x) (const_int 1)) rtx.
 894              Let the following cse pass simplify this if initial value is
 895              a constant.
 896
 897              We must copy the final and initial values here to avoid
 898              improperly shared rtl.
 899
 900              We have to deal with for (i = 0; --i < 6;) type loops.
 901              For such loops the real final value is the first time the
 902              loop variable overflows, so the diff we calculate is the
 903              distance from the overflow value.  This is 0 or ~0 for
 904              unsigned loops depending on the direction, or INT_MAX,
 905              INT_MAX+1 for signed loops.  We really do not need the
 906              exact value, since we are only interested in the diff
 907              modulo the increment, and the increment is a power of 2,
 908              so we can pretend that the overflow value is 0/~0.  */
 909
 910           if (cc == NE || less_p != neg_inc)
 911             diff = expand_simple_binop (mode, MINUS, final_value,
 912                                         copy_rtx (initial_value), NULL_RTX, 0,
 913                                         OPTAB_LIB_WIDEN);
 914           else
 915             diff = expand_simple_unop (mode, neg_inc ? NOT : NEG,
 916                                        copy_rtx (initial_value), NULL_RTX, 0);
 917
 918           /* Now calculate (diff % (unroll * abs (increment))) by using an
 919              and instruction.  */
 920           diff = expand_simple_binop (GET_MODE (diff), AND, diff,
 921                                       GEN_INT (unroll_number * abs_inc - 1),
 922                                       NULL_RTX, 0, OPTAB_LIB_WIDEN);
 923
 924           /* Now emit a sequence of branches to jump to the proper precond
 925              loop entry point.  */
 926
 927           labels = (rtx *) xmalloc (sizeof (rtx) * unroll_number);
 928           for (i = 0; i < unroll_number; i++)
 929             labels[i] = gen_label_rtx ();
 930
 931           /* Check for the case where the initial value is greater than or
 932              equal to the final value.  In that case, we want to execute
 933              exactly one loop iteration.  The code below will fail for this
 934              case.  This check does not apply if the loop has a NE
 935              comparison at the end.  */
 936
 937           if (cc != NE)
 938             {
 939               rtx incremented_initval;
 940               incremented_initval = expand_simple_binop (mode, PLUS,
 941                                                          initial_value,
 942                                                          increment,
 943                                                          NULL_RTX, 0,
 944                                                          OPTAB_LIB_WIDEN);
 945               emit_cmp_and_jump_insns (incremented_initval, final_value,
 946                                        less_p ? GE : LE, NULL_RTX,
 947                                        mode, unsigned_p, labels[1]);
 948               predict_insn_def (get_last_insn (), PRED_LOOP_CONDITION,
 949                                 TAKEN);
 950               JUMP_LABEL (get_last_insn ()) = labels[1];
 951               LABEL_NUSES (labels[1])++;
 952             }
 953
 954           /* Assuming the unroll_number is 4, and the increment is 2, then
 955              for a negative increment:  for a positive increment:
 956              diff = 0,1   precond 0     diff = 0,7   precond 0
 957              diff = 2,3   precond 3     diff = 1,2   precond 1
 958              diff = 4,5   precond 2     diff = 3,4   precond 2
 959              diff = 6,7   precond 1     diff = 5,6   precond 3  */
 960
 961           /* We only need to emit (unroll_number - 1) branches here, the
 962              last case just falls through to the following code.  */
 963
 964           /* ??? This would give better code if we emitted a tree of branches
 965              instead of the current linear list of branches.  */
 966
 967           for (i = 0; i < unroll_number - 1; i++)
 968             {
 969               int cmp_const;
 970               enum rtx_code cmp_code;
 971
 972               /* For negative increments, must invert the constant compared
 973                  against, except when comparing against zero.  */
 974               if (i == 0)
 975                 {
 976                   cmp_const = 0;
 977                   cmp_code = EQ;
 978                 }
 979               else if (neg_inc)
 980                 {
 981                   cmp_const = unroll_number - i;
 982                   cmp_code = GE;
 983                 }
 984               else
 985                 {
 986                   cmp_const = i;
 987                   cmp_code = LE;
 988                 }
 989
 990               emit_cmp_and_jump_insns (diff, GEN_INT (abs_inc * cmp_const),
 991                                        cmp_code, NULL_RTX, mode, 0, labels[i]);
 992               JUMP_LABEL (get_last_insn ()) = labels[i];
 993               LABEL_NUSES (labels[i])++;
 994               predict_insn (get_last_insn (), PRED_LOOP_PRECONDITIONING,
 995                             REG_BR_PROB_BASE / (unroll_number - i));
 996             }
 997
 998           /* If the increment is greater than one, then we need another branch,
 999              to handle other cases equivalent to 0.  */
1000
1001           /* ??? This should be merged into the code above somehow to help
1002              simplify the code here, and reduce the number of branches emitted.
1003              For the negative increment case, the branch here could easily
1004              be merged with the `0' case branch above.  For the positive
1005              increment case, it is not clear how this can be simplified.  */
1006
1007           if (abs_inc != 1)
1008             {
1009               int cmp_const;
1010               enum rtx_code cmp_code;
1011
1012               if (neg_inc)
1013                 {
1014                   cmp_const = abs_inc - 1;
1015                   cmp_code = LE;
1016                 }
1017               else
1018                 {
1019                   cmp_const = abs_inc * (unroll_number - 1) + 1;
1020                   cmp_code = GE;
1021                 }
1022
1023               emit_cmp_and_jump_insns (diff, GEN_INT (cmp_const), cmp_code,
1024                                        NULL_RTX, mode, 0, labels[0]);
1025               JUMP_LABEL (get_last_insn ()) = labels[0];
1026               LABEL_NUSES (labels[0])++;
1027             }
1028
1029           sequence = get_insns ();
1030           end_sequence ();
1031           loop_insn_hoist (loop, sequence);
1032
1033           /* Only the last copy of the loop body here needs the exit
1034              test, so set copy_end to exclude the compare/branch here,
1035              and then reset it inside the loop when get to the last
1036              copy.  */
1037
1038           if (GET_CODE (last_loop_insn) == BARRIER)
1039             copy_end = PREV_INSN (PREV_INSN (last_loop_insn));
1040           else if (GET_CODE (last_loop_insn) == JUMP_INSN)
1041             {
1042               copy_end = PREV_INSN (last_loop_insn);
1043 #ifdef HAVE_cc0
1044               /* The immediately preceding insn may be a compare which
1045                  we do not want to copy.  */
1046               if (sets_cc0_p (PREV_INSN (copy_end)))
1047                 copy_end = PREV_INSN (copy_end);
1048 #endif
1049             }
1050           else
1051             abort ();
1052
1053           for (i = 1; i < unroll_number; i++)
1054             {
1055               emit_label_after (labels[unroll_number - i],
1056                                 PREV_INSN (loop_start));
1057
1058               memset ((char *) map->insn_map, 0, max_insnno * sizeof (rtx));
1059               memset ((char *) &VARRAY_CONST_EQUIV (map->const_equiv_varray, 0),
1060                       0, (VARRAY_SIZE (map->const_equiv_varray)
1061                           * sizeof (struct const_equiv_data)));
1062               map->const_age = 0;
1063
1064               for (j = 0; j < max_labelno; j++)
1065                 if (local_label[j])
1066                   set_label_in_map (map, j, gen_label_rtx ());
1067
1068               for (r = FIRST_PSEUDO_REGISTER; r < max_local_regnum; r++)
1069                 if (local_regno[r])
1070                   {
1071                     map->reg_map[r]
1072                       = gen_reg_rtx (GET_MODE (regno_reg_rtx[r]));
1073                     record_base_value (REGNO (map->reg_map[r]),
1074                                        regno_reg_rtx[r], 0);
1075                   }
1076               /* The last copy needs the compare/branch insns at the end,
1077                  so reset copy_end here if the loop ends with a conditional
1078                  branch.  */
1079
1080               if (i == unroll_number - 1)
1081                 {
1082                   if (GET_CODE (last_loop_insn) == BARRIER)
1083                     copy_end = PREV_INSN (PREV_INSN (last_loop_insn));
1084                   else
1085                     copy_end = last_loop_insn;
1086                 }
1087
1088               /* None of the copies are the `last_iteration', so just
1089                  pass zero for that parameter.  */
1090               copy_loop_body (loop, copy_start, copy_end, map, exit_label, 0,
1091                               unroll_type, start_label, loop_end,
1092                               loop_start, copy_end);
1093             }
1094           emit_label_after (labels[0], PREV_INSN (loop_start));
1095
1096           if (GET_CODE (last_loop_insn) == BARRIER)
1097             {
1098               insert_before = PREV_INSN (last_loop_insn);
1099               copy_end = PREV_INSN (insert_before);
1100             }
1101           else
1102             {
1103               insert_before = last_loop_insn;
1104 #ifdef HAVE_cc0
1105               /* The instruction immediately before the JUMP_INSN may
1106                  be a compare instruction which we do not want to copy
1107                  or delete.  */
1108               if (sets_cc0_p (PREV_INSN (insert_before)))
1109                 insert_before = PREV_INSN (insert_before);
1110 #endif
1111               copy_end = PREV_INSN (insert_before);
1112             }
1113
1114           /* Set unroll type to MODULO now.  */
1115           unroll_type = UNROLL_MODULO;
1116           loop_preconditioned = 1;
1117
1118           /* Clean up.  */
1119           free (labels);
1120         }
1121     }
1122
1123   /* If reach here, and the loop type is UNROLL_NAIVE, then don't unroll
1124      the loop unless all loops are being unrolled.  */
1125   if (unroll_type == UNROLL_NAIVE && ! flag_unroll_all_loops)
1126     {
1127       if (loop_dump_stream)
1128         fprintf (loop_dump_stream,
1129                  "Unrolling failure: Naive unrolling not being done.\n");
1130       goto egress;
1131     }
1132
1133   /* At this point, we are guaranteed to unroll the loop.  */
1134
1135   /* Keep track of the unroll factor for the loop.  */
1136   loop_info->unroll_number = unroll_number;
1137
1138   /* For each biv and giv, determine whether it can be safely split into
1139      a different variable for each unrolled copy of the loop body.
1140      We precalculate and save this info here, since computing it is
1141      expensive.
1142
1143      Do this before deleting any instructions from the loop, so that
1144      back_branch_in_range_p will work correctly.  */
1145
1146   if (splitting_not_safe)
1147     temp = 0;
1148   else
1149     temp = find_splittable_regs (loop, unroll_type, unroll_number);
1150
1151   /* find_splittable_regs may have created some new registers, so must
1152      reallocate the reg_map with the new larger size, and must realloc
1153      the constant maps also.  */
1154
1155   maxregnum = max_reg_num ();
1156   map->reg_map = (rtx *) xmalloc (maxregnum * sizeof (rtx));
1157
1158   init_reg_map (map, maxregnum);
1159
1160   if (map->const_equiv_varray == 0)
1161     VARRAY_CONST_EQUIV_INIT (map->const_equiv_varray,
1162                              maxregnum + temp * unroll_number * 2,
1163                              "unroll_loop");
1164   global_const_equiv_varray = map->const_equiv_varray;
1165
1166   /* Search the list of bivs and givs to find ones which need to be remapped
1167      when split, and set their reg_map entry appropriately.  */
1168
1169   for (bl = ivs->list; bl; bl = bl->next)
1170     {
1171       if (REGNO (bl->biv->src_reg) != bl->regno)
1172         map->reg_map[bl->regno] = bl->biv->src_reg;
1173 #if 0
1174       /* Currently, non-reduced/final-value givs are never split.  */
1175       for (v = bl->giv; v; v = v->next_iv)
1176         if (REGNO (v->src_reg) != bl->regno)
1177           map->reg_map[REGNO (v->dest_reg)] = v->src_reg;
1178 #endif
1179     }
1180
1181   /* Use our current register alignment and pointer flags.  */
1182   map->regno_pointer_align = cfun->emit->regno_pointer_align;
1183   map->x_regno_reg_rtx = cfun->emit->x_regno_reg_rtx;
1184
1185   /* If the loop is being partially unrolled, and the iteration variables
1186      are being split, and are being renamed for the split, then must fix up
1187      the compare/jump instruction at the end of the loop to refer to the new
1188      registers.  This compare isn't copied, so the registers used in it
1189      will never be replaced if it isn't done here.  */
1190
1191   if (unroll_type == UNROLL_MODULO)
1192     {
1193       insn = NEXT_INSN (copy_end);
1194       if (GET_CODE (insn) == INSN || GET_CODE (insn) == JUMP_INSN)
1195         PATTERN (insn) = remap_split_bivs (loop, PATTERN (insn));
1196     }
1197
1198   /* For unroll_number times, make a copy of each instruction
1199      between copy_start and copy_end, and insert these new instructions
1200      before the end of the loop.  */
1201
1202   for (i = 0; i < unroll_number; i++)
1203     {
1204       memset ((char *) map->insn_map, 0, max_insnno * sizeof (rtx));
1205       memset ((char *) &VARRAY_CONST_EQUIV (map->const_equiv_varray, 0), 0,
1206               VARRAY_SIZE (map->const_equiv_varray) * sizeof (struct const_equiv_data));
1207       map->const_age = 0;
1208
1209       for (j = 0; j < max_labelno; j++)
1210         if (local_label[j])
1211           set_label_in_map (map, j, gen_label_rtx ());
1212
1213       for (r = FIRST_PSEUDO_REGISTER; r < max_local_regnum; r++)
1214         if (local_regno[r])
1215           {
1216             map->reg_map[r] = gen_reg_rtx (GET_MODE (regno_reg_rtx[r]));
1217             record_base_value (REGNO (map->reg_map[r]),
1218                                regno_reg_rtx[r], 0);
1219           }
1220
1221       /* If loop starts with a branch to the test, then fix it so that
1222          it points to the test of the first unrolled copy of the loop.  */
1223       if (i == 0 && loop_start != copy_start)
1224         {
1225           insn = PREV_INSN (copy_start);
1226           pattern = PATTERN (insn);
1227
1228           tem = get_label_from_map (map,
1229                                     CODE_LABEL_NUMBER
1230                                     (XEXP (SET_SRC (pattern), 0)));
1231           SET_SRC (pattern) = gen_rtx_LABEL_REF (VOIDmode, tem);
1232
1233           /* Set the jump label so that it can be used by later loop unrolling
1234              passes.  */
1235           JUMP_LABEL (insn) = tem;
1236           LABEL_NUSES (tem)++;
1237         }
1238
1239       copy_loop_body (loop, copy_start, copy_end, map, exit_label,
1240                       i == unroll_number - 1, unroll_type, start_label,
1241                       loop_end, insert_before, insert_before);
1242     }
1243
1244   /* Before deleting any insns, emit a CODE_LABEL immediately after the last
1245      insn to be deleted.  This prevents any runaway delete_insn call from
1246      more insns that it should, as it always stops at a CODE_LABEL.  */
1247
1248   /* Delete the compare and branch at the end of the loop if completely
1249      unrolling the loop.  Deleting the backward branch at the end also
1250      deletes the code label at the start of the loop.  This is done at
1251      the very end to avoid problems with back_branch_in_range_p.  */
1252
1253   if (unroll_type == UNROLL_COMPLETELY)
1254     safety_label = emit_label_after (gen_label_rtx (), last_loop_insn);
1255   else
1256     safety_label = emit_label_after (gen_label_rtx (), copy_end);
1257
1258   /* Delete all of the original loop instructions.  Don't delete the
1259      LOOP_BEG note, or the first code label in the loop.  */
1260
1261   insn = NEXT_INSN (copy_start);
1262   while (insn != safety_label)
1263     {
1264       /* ??? Don't delete named code labels.  They will be deleted when the
1265          jump that references them is deleted.  Otherwise, we end up deleting
1266          them twice, which causes them to completely disappear instead of turn
1267          into NOTE_INSN_DELETED_LABEL notes.  This in turn causes aborts in
1268          dwarfout.c/dwarf2out.c.  We could perhaps fix the dwarf*out.c files
1269          to handle deleted labels instead.  Or perhaps fix DECL_RTL of the
1270          associated LABEL_DECL to point to one of the new label instances.  */
1271       /* ??? Likewise, we can't delete a NOTE_INSN_DELETED_LABEL note.  */
1272       if (insn != start_label
1273           && ! (GET_CODE (insn) == CODE_LABEL && LABEL_NAME (insn))
1274           && ! (GET_CODE (insn) == NOTE
1275                 && NOTE_LINE_NUMBER (insn) == NOTE_INSN_DELETED_LABEL))
1276         insn = delete_related_insns (insn);
1277       else
1278         insn = NEXT_INSN (insn);
1279     }
1280
1281   /* Can now delete the 'safety' label emitted to protect us from runaway
1282      delete_related_insns calls.  */
1283   if (INSN_DELETED_P (safety_label))
1284     abort ();
1285   delete_related_insns (safety_label);
1286
1287   /* If exit_label exists, emit it after the loop.  Doing the emit here
1288      forces it to have a higher INSN_UID than any insn in the unrolled loop.
1289      This is needed so that mostly_true_jump in reorg.c will treat jumps
1290      to this loop end label correctly, i.e. predict that they are usually
1291      not taken.  */
1292   if (exit_label)
1293     emit_label_after (exit_label, loop_end);
1294
1295  egress:
1296   if (unroll_type == UNROLL_COMPLETELY)
1297     {
1298       /* Remove the loop notes since this is no longer a loop.  */
1299       if (loop->vtop)
1300         delete_related_insns (loop->vtop);
1301       if (loop->cont)
1302         delete_related_insns (loop->cont);
1303       if (loop_start)
1304         delete_related_insns (loop_start);
1305       if (loop_end)
1306         delete_related_insns (loop_end);
1307     }
1308
1309   if (map->const_equiv_varray)
1310     VARRAY_FREE (map->const_equiv_varray);
1311   if (map->label_map)
1312     {
1313       free (map->label_map);
1314       free (local_label);
1315     }
1316   free (map->insn_map);
1317   free (splittable_regs);
1318   free (splittable_regs_updates);
1319   free (addr_combined_regs);
1320   free (local_regno);
1321   if (map->reg_map)
1322     free (map->reg_map);
1323   free (map);
1324 }
1325 \f
1326 /* Return true if the loop can be safely, and profitably, preconditioned
1327    so that the unrolled copies of the loop body don't need exit tests.
1328
1329    This only works if final_value, initial_value and increment can be
1330    determined, and if increment is a constant power of 2.
1331    If increment is not a power of 2, then the preconditioning modulo
1332    operation would require a real modulo instead of a boolean AND, and this
1333    is not considered `profitable'.  */
1334
1335 /* ??? If the loop is known to be executed very many times, or the machine
1336    has a very cheap divide instruction, then preconditioning is a win even
1337    when the increment is not a power of 2.  Use RTX_COST to compute
1338    whether divide is cheap.
1339    ??? A divide by constant doesn't actually need a divide, look at
1340    expand_divmod.  The reduced cost of this optimized modulo is not
1341    reflected in RTX_COST.  */
1342
1343 int
1344 precondition_loop_p (loop, initial_value, final_value, increment, mode)
1345      const struct loop *loop;
1346      rtx *initial_value, *final_value, *increment;
1347      enum machine_mode *mode;
1348 {
1349   rtx loop_start = loop->start;
1350   struct loop_info *loop_info = LOOP_INFO (loop);
1351
1352   if (loop_info->n_iterations > 0)
1353     {
1354       if (INTVAL (loop_info->increment) > 0)
1355         {
1356           *initial_value = const0_rtx;
1357           *increment = const1_rtx;
1358           *final_value = GEN_INT (loop_info->n_iterations);
1359         }
1360       else
1361         {
1362           *initial_value = GEN_INT (loop_info->n_iterations);
1363           *increment = constm1_rtx;
1364           *final_value = const0_rtx;
1365         }
1366       *mode = word_mode;
1367
1368       if (loop_dump_stream)
1369         {
1370           fputs ("Preconditioning: Success, number of iterations known, ",
1371                  loop_dump_stream);
1372           fprintf (loop_dump_stream, HOST_WIDE_INT_PRINT_DEC,
1373                    loop_info->n_iterations);
1374           fputs (".\n", loop_dump_stream);
1375         }
1376       return 1;
1377     }
1378
1379   if (loop_info->iteration_var == 0)
1380     {
1381       if (loop_dump_stream)
1382         fprintf (loop_dump_stream,
1383                  "Preconditioning: Could not find iteration variable.\n");
1384       return 0;
1385     }
1386   else if (loop_info->initial_value == 0)
1387     {
1388       if (loop_dump_stream)
1389         fprintf (loop_dump_stream,
1390                  "Preconditioning: Could not find initial value.\n");
1391       return 0;
1392     }
1393   else if (loop_info->increment == 0)
1394     {
1395       if (loop_dump_stream)
1396         fprintf (loop_dump_stream,
1397                  "Preconditioning: Could not find increment value.\n");
1398       return 0;
1399     }
1400   else if (GET_CODE (loop_info->increment) != CONST_INT)
1401     {
1402       if (loop_dump_stream)
1403         fprintf (loop_dump_stream,
1404                  "Preconditioning: Increment not a constant.\n");
1405       return 0;
1406     }
1407   else if ((exact_log2 (INTVAL (loop_info->increment)) < 0)
1408            && (exact_log2 (-INTVAL (loop_info->increment)) < 0))
1409     {
1410       if (loop_dump_stream)
1411         fprintf (loop_dump_stream,
1412                  "Preconditioning: Increment not a constant power of 2.\n");
1413       return 0;
1414     }
1415
1416   /* Unsigned_compare and compare_dir can be ignored here, since they do
1417      not matter for preconditioning.  */
1418
1419   if (loop_info->final_value == 0)
1420     {
1421       if (loop_dump_stream)
1422         fprintf (loop_dump_stream,
1423                  "Preconditioning: EQ comparison loop.\n");
1424       return 0;
1425     }
1426
1427   /* Must ensure that final_value is invariant, so call
1428      loop_invariant_p to check.  Before doing so, must check regno
1429      against max_reg_before_loop to make sure that the register is in
1430      the range covered by loop_invariant_p.  If it isn't, then it is
1431      most likely a biv/giv which by definition are not invariant.  */
1432   if ((GET_CODE (loop_info->final_value) == REG
1433        && REGNO (loop_info->final_value) >= max_reg_before_loop)
1434       || (GET_CODE (loop_info->final_value) == PLUS
1435           && REGNO (XEXP (loop_info->final_value, 0)) >= max_reg_before_loop)
1436       || ! loop_invariant_p (loop, loop_info->final_value))
1437     {
1438       if (loop_dump_stream)
1439         fprintf (loop_dump_stream,
1440                  "Preconditioning: Final value not invariant.\n");
1441       return 0;
1442     }
1443
1444   /* Fail for floating point values, since the caller of this function
1445      does not have code to deal with them.  */
1446   if (GET_MODE_CLASS (GET_MODE (loop_info->final_value)) == MODE_FLOAT
1447       || GET_MODE_CLASS (GET_MODE (loop_info->initial_value)) == MODE_FLOAT)
1448     {
1449       if (loop_dump_stream)
1450         fprintf (loop_dump_stream,
1451                  "Preconditioning: Floating point final or initial value.\n");
1452       return 0;
1453     }
1454
1455   /* Fail if loop_info->iteration_var is not live before loop_start,
1456      since we need to test its value in the preconditioning code.  */
1457
1458   if (REGNO_FIRST_LUID (REGNO (loop_info->iteration_var))
1459       > INSN_LUID (loop_start))
1460     {
1461       if (loop_dump_stream)
1462         fprintf (loop_dump_stream,
1463                  "Preconditioning: Iteration var not live before loop start.\n");
1464       return 0;
1465     }
1466
1467   /* Note that loop_iterations biases the initial value for GIV iterators
1468      such as "while (i-- > 0)" so that we can calculate the number of
1469      iterations just like for BIV iterators.
1470
1471      Also note that the absolute values of initial_value and
1472      final_value are unimportant as only their difference is used for
1473      calculating the number of loop iterations.  */
1474   *initial_value = loop_info->initial_value;
1475   *increment = loop_info->increment;
1476   *final_value = loop_info->final_value;
1477
1478   /* Decide what mode to do these calculations in.  Choose the larger
1479      of final_value's mode and initial_value's mode, or a full-word if
1480      both are constants.  */
1481   *mode = GET_MODE (*final_value);
1482   if (*mode == VOIDmode)
1483     {
1484       *mode = GET_MODE (*initial_value);
1485       if (*mode == VOIDmode)
1486         *mode = word_mode;
1487     }
1488   else if (*mode != GET_MODE (*initial_value)
1489            && (GET_MODE_SIZE (*mode)
1490                < GET_MODE_SIZE (GET_MODE (*initial_value))))
1491     *mode = GET_MODE (*initial_value);
1492
1493   /* Success!  */
1494   if (loop_dump_stream)
1495     fprintf (loop_dump_stream, "Preconditioning: Successful.\n");
1496   return 1;
1497 }
1498
1499 /* All pseudo-registers must be mapped to themselves.  Two hard registers
1500    must be mapped, VIRTUAL_STACK_VARS_REGNUM and VIRTUAL_INCOMING_ARGS_
1501    REGNUM, to avoid function-inlining specific conversions of these
1502    registers.  All other hard regs can not be mapped because they may be
1503    used with different
1504    modes.  */
1505
1506 static void
1507 init_reg_map (map, maxregnum)
1508      struct inline_remap *map;
1509      int maxregnum;
1510 {
1511   int i;
1512
1513   for (i = maxregnum - 1; i > LAST_VIRTUAL_REGISTER; i--)
1514     map->reg_map[i] = regno_reg_rtx[i];
1515   /* Just clear the rest of the entries.  */
1516   for (i = LAST_VIRTUAL_REGISTER; i >= 0; i--)
1517     map->reg_map[i] = 0;
1518
1519   map->reg_map[VIRTUAL_STACK_VARS_REGNUM]
1520     = regno_reg_rtx[VIRTUAL_STACK_VARS_REGNUM];
1521   map->reg_map[VIRTUAL_INCOMING_ARGS_REGNUM]
1522     = regno_reg_rtx[VIRTUAL_INCOMING_ARGS_REGNUM];
1523 }
1524 \f
1525 /* Strength-reduction will often emit code for optimized biv/givs which
1526    calculates their value in a temporary register, and then copies the result
1527    to the iv.  This procedure reconstructs the pattern computing the iv;
1528    verifying that all operands are of the proper form.
1529
1530    PATTERN must be the result of single_set.
1531    The return value is the amount that the giv is incremented by.  */
1532
1533 static rtx
1534 calculate_giv_inc (pattern, src_insn, regno)
1535      rtx pattern, src_insn;
1536      unsigned int regno;
1537 {
1538   rtx increment;
1539   rtx increment_total = 0;
1540   int tries = 0;
1541
1542  retry:
1543   /* Verify that we have an increment insn here.  First check for a plus
1544      as the set source.  */
1545   if (GET_CODE (SET_SRC (pattern)) != PLUS)
1546     {
1547       /* SR sometimes computes the new giv value in a temp, then copies it
1548          to the new_reg.  */
1549       src_insn = PREV_INSN (src_insn);
1550       pattern = single_set (src_insn);
1551       if (GET_CODE (SET_SRC (pattern)) != PLUS)
1552         abort ();
1553
1554       /* The last insn emitted is not needed, so delete it to avoid confusing
1555          the second cse pass.  This insn sets the giv unnecessarily.  */
1556       delete_related_insns (get_last_insn ());
1557     }
1558
1559   /* Verify that we have a constant as the second operand of the plus.  */
1560   increment = XEXP (SET_SRC (pattern), 1);
1561   if (GET_CODE (increment) != CONST_INT)
1562     {
1563       /* SR sometimes puts the constant in a register, especially if it is
1564          too big to be an add immed operand.  */
1565       increment = find_last_value (increment, &src_insn, NULL_RTX, 0);
1566
1567       /* SR may have used LO_SUM to compute the constant if it is too large
1568          for a load immed operand.  In this case, the constant is in operand
1569          one of the LO_SUM rtx.  */
1570       if (GET_CODE (increment) == LO_SUM)
1571         increment = XEXP (increment, 1);
1572
1573       /* Some ports store large constants in memory and add a REG_EQUAL
1574          note to the store insn.  */
1575       else if (GET_CODE (increment) == MEM)
1576         {
1577           rtx note = find_reg_note (src_insn, REG_EQUAL, 0);
1578           if (note)
1579             increment = XEXP (note, 0);
1580         }
1581
1582       else if (GET_CODE (increment) == IOR
1583                || GET_CODE (increment) == ASHIFT
1584                || GET_CODE (increment) == PLUS)
1585         {
1586           /* The rs6000 port loads some constants with IOR.
1587              The alpha port loads some constants with ASHIFT and PLUS.  */
1588           rtx second_part = XEXP (increment, 1);
1589           enum rtx_code code = GET_CODE (increment);
1590
1591           increment = find_last_value (XEXP (increment, 0),
1592                                        &src_insn, NULL_RTX, 0);
1593           /* Don't need the last insn anymore.  */
1594           delete_related_insns (get_last_insn ());
1595
1596           if (GET_CODE (second_part) != CONST_INT
1597               || GET_CODE (increment) != CONST_INT)
1598             abort ();
1599
1600           if (code == IOR)
1601             increment = GEN_INT (INTVAL (increment) | INTVAL (second_part));
1602           else if (code == PLUS)
1603             increment = GEN_INT (INTVAL (increment) + INTVAL (second_part));
1604           else
1605             increment = GEN_INT (INTVAL (increment) << INTVAL (second_part));
1606         }
1607
1608       if (GET_CODE (increment) != CONST_INT)
1609         abort ();
1610
1611       /* The insn loading the constant into a register is no longer needed,
1612          so delete it.  */
1613       delete_related_insns (get_last_insn ());
1614     }
1615
1616   if (increment_total)
1617     increment_total = GEN_INT (INTVAL (increment_total) + INTVAL (increment));
1618   else
1619     increment_total = increment;
1620
1621   /* Check that the source register is the same as the register we expected
1622      to see as the source.  If not, something is seriously wrong.  */
1623   if (GET_CODE (XEXP (SET_SRC (pattern), 0)) != REG
1624       || REGNO (XEXP (SET_SRC (pattern), 0)) != regno)
1625     {
1626       /* Some machines (e.g. the romp), may emit two add instructions for
1627          certain constants, so lets try looking for another add immediately
1628          before this one if we have only seen one add insn so far.  */
1629
1630       if (tries == 0)
1631         {
1632           tries++;
1633
1634           src_insn = PREV_INSN (src_insn);
1635           pattern = single_set (src_insn);
1636
1637           delete_related_insns (get_last_insn ());
1638
1639           goto retry;
1640         }
1641
1642       abort ();
1643     }
1644
1645   return increment_total;
1646 }
1647
1648 /* Copy REG_NOTES, except for insn references, because not all insn_map
1649    entries are valid yet.  We do need to copy registers now though, because
1650    the reg_map entries can change during copying.  */
1651
1652 static rtx
1653 initial_reg_note_copy (notes, map)
1654      rtx notes;
1655      struct inline_remap *map;
1656 {
1657   rtx copy;
1658
1659   if (notes == 0)
1660     return 0;
1661
1662   copy = rtx_alloc (GET_CODE (notes));
1663   PUT_REG_NOTE_KIND (copy, REG_NOTE_KIND (notes));
1664
1665   if (GET_CODE (notes) == EXPR_LIST)
1666     XEXP (copy, 0) = copy_rtx_and_substitute (XEXP (notes, 0), map, 0);
1667   else if (GET_CODE (notes) == INSN_LIST)
1668     /* Don't substitute for these yet.  */
1669     XEXP (copy, 0) = copy_rtx (XEXP (notes, 0));
1670   else
1671     abort ();
1672
1673   XEXP (copy, 1) = initial_reg_note_copy (XEXP (notes, 1), map);
1674
1675   return copy;
1676 }
1677
1678 /* Fixup insn references in copied REG_NOTES.  */
1679
1680 static void
1681 final_reg_note_copy (notesp, map)
1682      rtx *notesp;
1683      struct inline_remap *map;
1684 {
1685   while (*notesp)
1686     {
1687       rtx note = *notesp;
1688
1689       if (GET_CODE (note) == INSN_LIST)
1690         {
1691           /* Sometimes, we have a REG_WAS_0 note that points to a
1692              deleted instruction.  In that case, we can just delete the
1693              note.  */
1694           if (REG_NOTE_KIND (note) == REG_WAS_0)
1695             {
1696               *notesp = XEXP (note, 1);
1697               continue;
1698             }
1699           else
1700             {
1701               rtx insn = map->insn_map[INSN_UID (XEXP (note, 0))];
1702
1703               /* If we failed to remap the note, something is awry.
1704                  Allow REG_LABEL as it may reference label outside
1705                  the unrolled loop.  */
1706               if (!insn)
1707                 {
1708                   if (REG_NOTE_KIND (note) != REG_LABEL)
1709                     abort ();
1710                 }
1711               else
1712                 XEXP (note, 0) = insn;
1713             }
1714         }
1715
1716       notesp = &XEXP (note, 1);
1717     }
1718 }
1719
1720 /* Copy each instruction in the loop, substituting from map as appropriate.
1721    This is very similar to a loop in expand_inline_function.  */
1722
1723 static void
1724 copy_loop_body (loop, copy_start, copy_end, map, exit_label, last_iteration,
1725                 unroll_type, start_label, loop_end, insert_before,
1726                 copy_notes_from)
1727      struct loop *loop;
1728      rtx copy_start, copy_end;
1729      struct inline_remap *map;
1730      rtx exit_label;
1731      int last_iteration;
1732      enum unroll_types unroll_type;
1733      rtx start_label, loop_end, insert_before, copy_notes_from;
1734 {
1735   struct loop_ivs *ivs = LOOP_IVS (loop);
1736   rtx insn, pattern;
1737   rtx set, tem, copy = NULL_RTX;
1738   int dest_reg_was_split, i;
1739 #ifdef HAVE_cc0
1740   rtx cc0_insn = 0;
1741 #endif
1742   rtx final_label = 0;
1743   rtx giv_inc, giv_dest_reg, giv_src_reg;
1744
1745   /* If this isn't the last iteration, then map any references to the
1746      start_label to final_label.  Final label will then be emitted immediately
1747      after the end of this loop body if it was ever used.
1748
1749      If this is the last iteration, then map references to the start_label
1750      to itself.  */
1751   if (! last_iteration)
1752     {
1753       final_label = gen_label_rtx ();
1754       set_label_in_map (map, CODE_LABEL_NUMBER (start_label), final_label);
1755     }
1756   else
1757     set_label_in_map (map, CODE_LABEL_NUMBER (start_label), start_label);
1758
1759   start_sequence ();
1760
1761   insn = copy_start;
1762   do
1763     {
1764       insn = NEXT_INSN (insn);
1765
1766       map->orig_asm_operands_vector = 0;
1767
1768       switch (GET_CODE (insn))
1769         {
1770         case INSN:
1771           pattern = PATTERN (insn);
1772           copy = 0;
1773           giv_inc = 0;
1774
1775           /* Check to see if this is a giv that has been combined with
1776              some split address givs.  (Combined in the sense that
1777              `combine_givs' in loop.c has put two givs in the same register.)
1778              In this case, we must search all givs based on the same biv to
1779              find the address givs.  Then split the address givs.
1780              Do this before splitting the giv, since that may map the
1781              SET_DEST to a new register.  */
1782
1783           if ((set = single_set (insn))
1784               && GET_CODE (SET_DEST (set)) == REG
1785               && addr_combined_regs[REGNO (SET_DEST (set))])
1786             {
1787               struct iv_class *bl;
1788               struct induction *v, *tv;
1789               unsigned int regno = REGNO (SET_DEST (set));
1790
1791               v = addr_combined_regs[REGNO (SET_DEST (set))];
1792               bl = REG_IV_CLASS (ivs, REGNO (v->src_reg));
1793
1794               /* Although the giv_inc amount is not needed here, we must call
1795                  calculate_giv_inc here since it might try to delete the
1796                  last insn emitted.  If we wait until later to call it,
1797                  we might accidentally delete insns generated immediately
1798                  below by emit_unrolled_add.  */
1799
1800               giv_inc = calculate_giv_inc (set, insn, regno);
1801
1802               /* Now find all address giv's that were combined with this
1803                  giv 'v'.  */
1804               for (tv = bl->giv; tv; tv = tv->next_iv)
1805                 if (tv->giv_type == DEST_ADDR && tv->same == v)
1806                   {
1807                     int this_giv_inc;
1808
1809                     /* If this DEST_ADDR giv was not split, then ignore it.  */
1810                     if (*tv->location != tv->dest_reg)
1811                       continue;
1812
1813                     /* Scale this_giv_inc if the multiplicative factors of
1814                        the two givs are different.  */
1815                     this_giv_inc = INTVAL (giv_inc);
1816                     if (tv->mult_val != v->mult_val)
1817                       this_giv_inc = (this_giv_inc / INTVAL (v->mult_val)
1818                                       * INTVAL (tv->mult_val));
1819
1820                     tv->dest_reg = plus_constant (tv->dest_reg, this_giv_inc);
1821                     *tv->location = tv->dest_reg;
1822
1823                     if (last_iteration && unroll_type != UNROLL_COMPLETELY)
1824                       {
1825                         /* Must emit an insn to increment the split address
1826                            giv.  Add in the const_adjust field in case there
1827                            was a constant eliminated from the address.  */
1828                         rtx value, dest_reg;
1829
1830                         /* tv->dest_reg will be either a bare register,
1831                            or else a register plus a constant.  */
1832                         if (GET_CODE (tv->dest_reg) == REG)
1833                           dest_reg = tv->dest_reg;
1834                         else
1835                           dest_reg = XEXP (tv->dest_reg, 0);
1836
1837                         /* Check for shared address givs, and avoid
1838                            incrementing the shared pseudo reg more than
1839                            once.  */
1840                         if (! tv->same_insn && ! tv->shared)
1841                           {
1842                             /* tv->dest_reg may actually be a (PLUS (REG)
1843                                (CONST)) here, so we must call plus_constant
1844                                to add the const_adjust amount before calling
1845                                emit_unrolled_add below.  */
1846                             value = plus_constant (tv->dest_reg,
1847                                                    tv->const_adjust);
1848
1849                             if (GET_CODE (value) == PLUS)
1850                               {
1851                                 /* The constant could be too large for an add
1852                                    immediate, so can't directly emit an insn
1853                                    here.  */
1854                                 emit_unrolled_add (dest_reg, XEXP (value, 0),
1855                                                    XEXP (value, 1));
1856                               }
1857                           }
1858
1859                         /* Reset the giv to be just the register again, in case
1860                            it is used after the set we have just emitted.
1861                            We must subtract the const_adjust factor added in
1862                            above.  */
1863                         tv->dest_reg = plus_constant (dest_reg,
1864                                                       -tv->const_adjust);
1865                         *tv->location = tv->dest_reg;
1866                       }
1867                   }
1868             }
1869
1870           /* If this is a setting of a splittable variable, then determine
1871              how to split the variable, create a new set based on this split,
1872              and set up the reg_map so that later uses of the variable will
1873              use the new split variable.  */
1874
1875           dest_reg_was_split = 0;
1876
1877           if ((set = single_set (insn))
1878               && GET_CODE (SET_DEST (set)) == REG
1879               && splittable_regs[REGNO (SET_DEST (set))])
1880             {
1881               unsigned int regno = REGNO (SET_DEST (set));
1882               unsigned int src_regno;
1883
1884               dest_reg_was_split = 1;
1885
1886               giv_dest_reg = SET_DEST (set);
1887               giv_src_reg = giv_dest_reg;
1888               /* Compute the increment value for the giv, if it wasn't
1889                  already computed above.  */
1890               if (giv_inc == 0)
1891                 giv_inc = calculate_giv_inc (set, insn, regno);
1892
1893               src_regno = REGNO (giv_src_reg);
1894
1895               if (unroll_type == UNROLL_COMPLETELY)
1896                 {
1897                   /* Completely unrolling the loop.  Set the induction
1898                      variable to a known constant value.  */
1899
1900                   /* The value in splittable_regs may be an invariant
1901                      value, so we must use plus_constant here.  */
1902                   splittable_regs[regno]
1903                     = plus_constant (splittable_regs[src_regno],
1904                                      INTVAL (giv_inc));
1905
1906                   if (GET_CODE (splittable_regs[regno]) == PLUS)
1907                     {
1908                       giv_src_reg = XEXP (splittable_regs[regno], 0);
1909                       giv_inc = XEXP (splittable_regs[regno], 1);
1910                     }
1911                   else
1912                     {
1913                       /* The splittable_regs value must be a REG or a
1914                          CONST_INT, so put the entire value in the giv_src_reg
1915                          variable.  */
1916                       giv_src_reg = splittable_regs[regno];
1917                       giv_inc = const0_rtx;
1918                     }
1919                 }
1920               else
1921                 {
1922                   /* Partially unrolling loop.  Create a new pseudo
1923                      register for the iteration variable, and set it to
1924                      be a constant plus the original register.  Except
1925                      on the last iteration, when the result has to
1926                      go back into the original iteration var register.  */
1927
1928                   /* Handle bivs which must be mapped to a new register
1929                      when split.  This happens for bivs which need their
1930                      final value set before loop entry.  The new register
1931                      for the biv was stored in the biv's first struct
1932                      induction entry by find_splittable_regs.  */
1933
1934                   if (regno < ivs->n_regs
1935                       && REG_IV_TYPE (ivs, regno) == BASIC_INDUCT)
1936                     {
1937                       giv_src_reg = REG_IV_CLASS (ivs, regno)->biv->src_reg;
1938                       giv_dest_reg = giv_src_reg;
1939                     }
1940
1941 #if 0
1942                   /* If non-reduced/final-value givs were split, then
1943                      this would have to remap those givs also.  See
1944                      find_splittable_regs.  */
1945 #endif
1946
1947                   splittable_regs[regno]
1948                     = simplify_gen_binary (PLUS, GET_MODE (giv_src_reg),
1949                                            giv_inc,
1950                                            splittable_regs[src_regno]);
1951                   giv_inc = splittable_regs[regno];
1952
1953                   /* Now split the induction variable by changing the dest
1954                      of this insn to a new register, and setting its
1955                      reg_map entry to point to this new register.
1956
1957                      If this is the last iteration, and this is the last insn
1958                      that will update the iv, then reuse the original dest,
1959                      to ensure that the iv will have the proper value when
1960                      the loop exits or repeats.
1961
1962                      Using splittable_regs_updates here like this is safe,
1963                      because it can only be greater than one if all
1964                      instructions modifying the iv are always executed in
1965                      order.  */
1966
1967                   if (! last_iteration
1968                       || (splittable_regs_updates[regno]-- != 1))
1969                     {
1970                       tem = gen_reg_rtx (GET_MODE (giv_src_reg));
1971                       giv_dest_reg = tem;
1972                       map->reg_map[regno] = tem;
1973                       record_base_value (REGNO (tem),
1974                                          giv_inc == const0_rtx
1975                                          ? giv_src_reg
1976                                          : gen_rtx_PLUS (GET_MODE (giv_src_reg),
1977                                                          giv_src_reg, giv_inc),
1978                                          1);
1979                     }
1980                   else
1981                     map->reg_map[regno] = giv_src_reg;
1982                 }
1983
1984               /* The constant being added could be too large for an add
1985                  immediate, so can't directly emit an insn here.  */
1986               emit_unrolled_add (giv_dest_reg, giv_src_reg, giv_inc);
1987               copy = get_last_insn ();
1988               pattern = PATTERN (copy);
1989             }
1990           else
1991             {
1992               pattern = copy_rtx_and_substitute (pattern, map, 0);
1993               copy = emit_insn (pattern);
1994             }
1995           REG_NOTES (copy) = initial_reg_note_copy (REG_NOTES (insn), map);
1996           INSN_SCOPE (copy) = INSN_SCOPE (insn);
1997
1998 #ifdef HAVE_cc0
1999           /* If this insn is setting CC0, it may need to look at
2000              the insn that uses CC0 to see what type of insn it is.
2001              In that case, the call to recog via validate_change will
2002              fail.  So don't substitute constants here.  Instead,
2003              do it when we emit the following insn.
2004
2005              For example, see the pyr.md file.  That machine has signed and
2006              unsigned compares.  The compare patterns must check the
2007              following branch insn to see which what kind of compare to
2008              emit.
2009
2010              If the previous insn set CC0, substitute constants on it as
2011              well.  */
2012           if (sets_cc0_p (PATTERN (copy)) != 0)
2013             cc0_insn = copy;
2014           else
2015             {
2016               if (cc0_insn)
2017                 try_constants (cc0_insn, map);
2018               cc0_insn = 0;
2019               try_constants (copy, map);
2020             }
2021 #else
2022           try_constants (copy, map);
2023 #endif
2024
2025           /* Make split induction variable constants `permanent' since we
2026              know there are no backward branches across iteration variable
2027              settings which would invalidate this.  */
2028           if (dest_reg_was_split)
2029             {
2030               int regno = REGNO (SET_DEST (set));
2031
2032               if ((size_t) regno < VARRAY_SIZE (map->const_equiv_varray)
2033                   && (VARRAY_CONST_EQUIV (map->const_equiv_varray, regno).age
2034                       == map->const_age))
2035                 VARRAY_CONST_EQUIV (map->const_equiv_varray, regno).age = -1;
2036             }
2037           break;
2038
2039         case JUMP_INSN:
2040           pattern = copy_rtx_and_substitute (PATTERN (insn), map, 0);
2041           copy = emit_jump_insn (pattern);
2042           REG_NOTES (copy) = initial_reg_note_copy (REG_NOTES (insn), map);
2043           INSN_SCOPE (copy) = INSN_SCOPE (insn);
2044
2045           if (JUMP_LABEL (insn))
2046             {
2047               JUMP_LABEL (copy) = get_label_from_map (map,
2048                                                       CODE_LABEL_NUMBER
2049                                                       (JUMP_LABEL (insn)));
2050               LABEL_NUSES (JUMP_LABEL (copy))++;
2051             }
2052           if (JUMP_LABEL (insn) == start_label && insn == copy_end
2053               && ! last_iteration)
2054             {
2055
2056               /* This is a branch to the beginning of the loop; this is the
2057                  last insn being copied; and this is not the last iteration.
2058                  In this case, we want to change the original fall through
2059                  case to be a branch past the end of the loop, and the
2060                  original jump label case to fall_through.  */
2061
2062               if (!invert_jump (copy, exit_label, 0))
2063                 {
2064                   rtx jmp;
2065                   rtx lab = gen_label_rtx ();
2066                   /* Can't do it by reversing the jump (probably because we
2067                      couldn't reverse the conditions), so emit a new
2068                      jump_insn after COPY, and redirect the jump around
2069                      that.  */
2070                   jmp = emit_jump_insn_after (gen_jump (exit_label), copy);
2071                   JUMP_LABEL (jmp) = exit_label;
2072                   LABEL_NUSES (exit_label)++;
2073                   jmp = emit_barrier_after (jmp);
2074                   emit_label_after (lab, jmp);
2075                   LABEL_NUSES (lab) = 0;
2076                   if (!redirect_jump (copy, lab, 0))
2077                     abort ();
2078                 }
2079             }
2080
2081 #ifdef HAVE_cc0
2082           if (cc0_insn)
2083             try_constants (cc0_insn, map);
2084           cc0_insn = 0;
2085 #endif
2086           try_constants (copy, map);
2087
2088           /* Set the jump label of COPY correctly to avoid problems with
2089              later passes of unroll_loop, if INSN had jump label set.  */
2090           if (JUMP_LABEL (insn))
2091             {
2092               rtx label = 0;
2093
2094               /* Can't use the label_map for every insn, since this may be
2095                  the backward branch, and hence the label was not mapped.  */
2096               if ((set = single_set (copy)))
2097                 {
2098                   tem = SET_SRC (set);
2099                   if (GET_CODE (tem) == LABEL_REF)
2100                     label = XEXP (tem, 0);
2101                   else if (GET_CODE (tem) == IF_THEN_ELSE)
2102                     {
2103                       if (XEXP (tem, 1) != pc_rtx)
2104                         label = XEXP (XEXP (tem, 1), 0);
2105                       else
2106                         label = XEXP (XEXP (tem, 2), 0);
2107                     }
2108                 }
2109
2110               if (label && GET_CODE (label) == CODE_LABEL)
2111                 JUMP_LABEL (copy) = label;
2112               else
2113                 {
2114                   /* An unrecognizable jump insn, probably the entry jump
2115                      for a switch statement.  This label must have been mapped,
2116                      so just use the label_map to get the new jump label.  */
2117                   JUMP_LABEL (copy)
2118                     = get_label_from_map (map,
2119                                           CODE_LABEL_NUMBER (JUMP_LABEL (insn)));
2120                 }
2121
2122               /* If this is a non-local jump, then must increase the label
2123                  use count so that the label will not be deleted when the
2124                  original jump is deleted.  */
2125               LABEL_NUSES (JUMP_LABEL (copy))++;
2126             }
2127           else if (GET_CODE (PATTERN (copy)) == ADDR_VEC
2128                    || GET_CODE (PATTERN (copy)) == ADDR_DIFF_VEC)
2129             {
2130               rtx pat = PATTERN (copy);
2131               int diff_vec_p = GET_CODE (pat) == ADDR_DIFF_VEC;
2132               int len = XVECLEN (pat, diff_vec_p);
2133               int i;
2134
2135               for (i = 0; i < len; i++)
2136                 LABEL_NUSES (XEXP (XVECEXP (pat, diff_vec_p, i), 0))++;
2137             }
2138
2139           /* If this used to be a conditional jump insn but whose branch
2140              direction is now known, we must do something special.  */
2141           if (any_condjump_p (insn) && onlyjump_p (insn) && map->last_pc_value)
2142             {
2143 #ifdef HAVE_cc0
2144               /* If the previous insn set cc0 for us, delete it.  */
2145               if (only_sets_cc0_p (PREV_INSN (copy)))
2146                 delete_related_insns (PREV_INSN (copy));
2147 #endif
2148
2149               /* If this is now a no-op, delete it.  */
2150               if (map->last_pc_value == pc_rtx)
2151                 {
2152                   delete_insn (copy);
2153                   copy = 0;
2154                 }
2155               else
2156                 /* Otherwise, this is unconditional jump so we must put a
2157                    BARRIER after it.  We could do some dead code elimination
2158                    here, but jump.c will do it just as well.  */
2159                 emit_barrier ();
2160             }
2161           break;
2162
2163         case CALL_INSN:
2164           pattern = copy_rtx_and_substitute (PATTERN (insn), map, 0);
2165           copy = emit_call_insn (pattern);
2166           REG_NOTES (copy) = initial_reg_note_copy (REG_NOTES (insn), map);
2167           INSN_SCOPE (copy) = INSN_SCOPE (insn);
2168           SIBLING_CALL_P (copy) = SIBLING_CALL_P (insn);
2169
2170           /* Because the USAGE information potentially contains objects other
2171              than hard registers, we need to copy it.  */
2172           CALL_INSN_FUNCTION_USAGE (copy)
2173             = copy_rtx_and_substitute (CALL_INSN_FUNCTION_USAGE (insn),
2174                                        map, 0);
2175
2176 #ifdef HAVE_cc0
2177           if (cc0_insn)
2178             try_constants (cc0_insn, map);
2179           cc0_insn = 0;
2180 #endif
2181           try_constants (copy, map);
2182
2183           /* Be lazy and assume CALL_INSNs clobber all hard registers.  */
2184           for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
2185             VARRAY_CONST_EQUIV (map->const_equiv_varray, i).rtx = 0;
2186           break;
2187
2188         case CODE_LABEL:
2189           /* If this is the loop start label, then we don't need to emit a
2190              copy of this label since no one will use it.  */
2191
2192           if (insn != start_label)
2193             {
2194               copy = emit_label (get_label_from_map (map,
2195                                                      CODE_LABEL_NUMBER (insn)));
2196               map->const_age++;
2197             }
2198           break;
2199
2200         case BARRIER:
2201           copy = emit_barrier ();
2202           break;
2203
2204         case NOTE:
2205           /* VTOP and CONT notes are valid only before the loop exit test.
2206              If placed anywhere else, loop may generate bad code.  */
2207           /* BASIC_BLOCK notes exist to stabilize basic block structures with
2208              the associated rtl.  We do not want to share the structure in
2209              this new block.  */
2210
2211           if (NOTE_LINE_NUMBER (insn) != NOTE_INSN_DELETED
2212               && NOTE_LINE_NUMBER (insn) != NOTE_INSN_DELETED_LABEL
2213               && NOTE_LINE_NUMBER (insn) != NOTE_INSN_BASIC_BLOCK
2214               && ((NOTE_LINE_NUMBER (insn) != NOTE_INSN_LOOP_VTOP
2215                    && NOTE_LINE_NUMBER (insn) != NOTE_INSN_LOOP_CONT)
2216                   || (last_iteration && unroll_type != UNROLL_COMPLETELY)))
2217             copy = emit_note (NOTE_SOURCE_FILE (insn),
2218                               NOTE_LINE_NUMBER (insn));
2219           else
2220             copy = 0;
2221           break;
2222
2223         default:
2224           abort ();
2225         }
2226
2227       map->insn_map[INSN_UID (insn)] = copy;
2228     }
2229   while (insn != copy_end);
2230
2231   /* Now finish coping the REG_NOTES.  */
2232   insn = copy_start;
2233   do
2234     {
2235       insn = NEXT_INSN (insn);
2236       if ((GET_CODE (insn) == INSN || GET_CODE (insn) == JUMP_INSN
2237            || GET_CODE (insn) == CALL_INSN)
2238           && map->insn_map[INSN_UID (insn)])
2239         final_reg_note_copy (&REG_NOTES (map->insn_map[INSN_UID (insn)]), map);
2240     }
2241   while (insn != copy_end);
2242
2243   /* There may be notes between copy_notes_from and loop_end.  Emit a copy of
2244      each of these notes here, since there may be some important ones, such as
2245      NOTE_INSN_BLOCK_END notes, in this group.  We don't do this on the last
2246      iteration, because the original notes won't be deleted.
2247
2248      We can't use insert_before here, because when from preconditioning,
2249      insert_before points before the loop.  We can't use copy_end, because
2250      there may be insns already inserted after it (which we don't want to
2251      copy) when not from preconditioning code.  */
2252
2253   if (! last_iteration)
2254     {
2255       for (insn = copy_notes_from; insn != loop_end; insn = NEXT_INSN (insn))
2256         {
2257           /* VTOP notes are valid only before the loop exit test.
2258              If placed anywhere else, loop may generate bad code.
2259              There is no need to test for NOTE_INSN_LOOP_CONT notes
2260              here, since COPY_NOTES_FROM will be at most one or two (for cc0)
2261              instructions before the last insn in the loop, and if the
2262              end test is that short, there will be a VTOP note between
2263              the CONT note and the test.  */
2264           if (GET_CODE (insn) == NOTE
2265               && NOTE_LINE_NUMBER (insn) != NOTE_INSN_DELETED
2266               && NOTE_LINE_NUMBER (insn) != NOTE_INSN_BASIC_BLOCK
2267               && NOTE_LINE_NUMBER (insn) != NOTE_INSN_LOOP_VTOP)
2268             emit_note (NOTE_SOURCE_FILE (insn), NOTE_LINE_NUMBER (insn));
2269         }
2270     }
2271
2272   if (final_label && LABEL_NUSES (final_label) > 0)
2273     emit_label (final_label);
2274
2275   tem = get_insns ();
2276   end_sequence ();
2277   loop_insn_emit_before (loop, 0, insert_before, tem);
2278 }
2279 \f
2280 /* Emit an insn, using the expand_binop to ensure that a valid insn is
2281    emitted.  This will correctly handle the case where the increment value
2282    won't fit in the immediate field of a PLUS insns.  */
2283
2284 void
2285 emit_unrolled_add (dest_reg, src_reg, increment)
2286      rtx dest_reg, src_reg, increment;
2287 {
2288   rtx result;
2289
2290   result = expand_simple_binop (GET_MODE (dest_reg), PLUS, src_reg, increment,
2291                                 dest_reg, 0, OPTAB_LIB_WIDEN);
2292
2293   if (dest_reg != result)
2294     emit_move_insn (dest_reg, result);
2295 }
2296 \f
2297 /* Searches the insns between INSN and LOOP->END.  Returns 1 if there
2298    is a backward branch in that range that branches to somewhere between
2299    LOOP->START and INSN.  Returns 0 otherwise.  */
2300
2301 /* ??? This is quadratic algorithm.  Could be rewritten to be linear.
2302    In practice, this is not a problem, because this function is seldom called,
2303    and uses a negligible amount of CPU time on average.  */
2304
2305 int
2306 back_branch_in_range_p (loop, insn)
2307      const struct loop *loop;
2308      rtx insn;
2309 {
2310   rtx p, q, target_insn;
2311   rtx loop_start = loop->start;
2312   rtx loop_end = loop->end;
2313   rtx orig_loop_end = loop->end;
2314
2315   /* Stop before we get to the backward branch at the end of the loop.  */
2316   loop_end = prev_nonnote_insn (loop_end);
2317   if (GET_CODE (loop_end) == BARRIER)
2318     loop_end = PREV_INSN (loop_end);
2319
2320   /* Check in case insn has been deleted, search forward for first non
2321      deleted insn following it.  */
2322   while (INSN_DELETED_P (insn))
2323     insn = NEXT_INSN (insn);
2324
2325   /* Check for the case where insn is the last insn in the loop.  Deal
2326      with the case where INSN was a deleted loop test insn, in which case
2327      it will now be the NOTE_LOOP_END.  */
2328   if (insn == loop_end || insn == orig_loop_end)
2329     return 0;
2330
2331   for (p = NEXT_INSN (insn); p != loop_end; p = NEXT_INSN (p))
2332     {
2333       if (GET_CODE (p) == JUMP_INSN)
2334         {
2335           target_insn = JUMP_LABEL (p);
2336
2337           /* Search from loop_start to insn, to see if one of them is
2338              the target_insn.  We can't use INSN_LUID comparisons here,
2339              since insn may not have an LUID entry.  */
2340           for (q = loop_start; q != insn; q = NEXT_INSN (q))
2341             if (q == target_insn)
2342               return 1;
2343         }
2344     }
2345
2346   return 0;
2347 }
2348
2349 /* Try to generate the simplest rtx for the expression
2350    (PLUS (MULT mult1 mult2) add1).  This is used to calculate the initial
2351    value of giv's.  */
2352
2353 static rtx
2354 fold_rtx_mult_add (mult1, mult2, add1, mode)
2355      rtx mult1, mult2, add1;
2356      enum machine_mode mode;
2357 {
2358   rtx temp, mult_res;
2359   rtx result;
2360
2361   /* The modes must all be the same.  This should always be true.  For now,
2362      check to make sure.  */
2363   if ((GET_MODE (mult1) != mode && GET_MODE (mult1) != VOIDmode)
2364       || (GET_MODE (mult2) != mode && GET_MODE (mult2) != VOIDmode)
2365       || (GET_MODE (add1) != mode && GET_MODE (add1) != VOIDmode))
2366     abort ();
2367
2368   /* Ensure that if at least one of mult1/mult2 are constant, then mult2
2369      will be a constant.  */
2370   if (GET_CODE (mult1) == CONST_INT)
2371     {
2372       temp = mult2;
2373       mult2 = mult1;
2374       mult1 = temp;
2375     }
2376
2377   mult_res = simplify_binary_operation (MULT, mode, mult1, mult2);
2378   if (! mult_res)
2379     mult_res = gen_rtx_MULT (mode, mult1, mult2);
2380
2381   /* Again, put the constant second.  */
2382   if (GET_CODE (add1) == CONST_INT)
2383     {
2384       temp = add1;
2385       add1 = mult_res;
2386       mult_res = temp;
2387     }
2388
2389   result = simplify_binary_operation (PLUS, mode, add1, mult_res);
2390   if (! result)
2391     result = gen_rtx_PLUS (mode, add1, mult_res);
2392
2393   return result;
2394 }
2395
2396 /* Searches the list of induction struct's for the biv BL, to try to calculate
2397    the total increment value for one iteration of the loop as a constant.
2398
2399    Returns the increment value as an rtx, simplified as much as possible,
2400    if it can be calculated.  Otherwise, returns 0.  */
2401
2402 rtx
2403 biv_total_increment (bl)
2404      const struct iv_class *bl;
2405 {
2406   struct induction *v;
2407   rtx result;
2408
2409   /* For increment, must check every instruction that sets it.  Each
2410      instruction must be executed only once each time through the loop.
2411      To verify this, we check that the insn is always executed, and that
2412      there are no backward branches after the insn that branch to before it.
2413      Also, the insn must have a mult_val of one (to make sure it really is
2414      an increment).  */
2415
2416   result = const0_rtx;
2417   for (v = bl->biv; v; v = v->next_iv)
2418     {
2419       if (v->always_computable && v->mult_val == const1_rtx
2420           && ! v->maybe_multiple)
2421         result = fold_rtx_mult_add (result, const1_rtx, v->add_val, v->mode);
2422       else
2423         return 0;
2424     }
2425
2426   return result;
2427 }
2428
2429 /* For each biv and giv, determine whether it can be safely split into
2430    a different variable for each unrolled copy of the loop body.  If it
2431    is safe to split, then indicate that by saving some useful info
2432    in the splittable_regs array.
2433
2434    If the loop is being completely unrolled, then splittable_regs will hold
2435    the current value of the induction variable while the loop is unrolled.
2436    It must be set to the initial value of the induction variable here.
2437    Otherwise, splittable_regs will hold the difference between the current
2438    value of the induction variable and the value the induction variable had
2439    at the top of the loop.  It must be set to the value 0 here.
2440
2441    Returns the total number of instructions that set registers that are
2442    splittable.  */
2443
2444 /* ?? If the loop is only unrolled twice, then most of the restrictions to
2445    constant values are unnecessary, since we can easily calculate increment
2446    values in this case even if nothing is constant.  The increment value
2447    should not involve a multiply however.  */
2448
2449 /* ?? Even if the biv/giv increment values aren't constant, it may still
2450    be beneficial to split the variable if the loop is only unrolled a few
2451    times, since multiplies by small integers (1,2,3,4) are very cheap.  */
2452
2453 static int
2454 find_splittable_regs (loop, unroll_type, unroll_number)
2455      const struct loop *loop;
2456      enum unroll_types unroll_type;
2457      int unroll_number;
2458 {
2459   struct loop_ivs *ivs = LOOP_IVS (loop);
2460   struct iv_class *bl;
2461   struct induction *v;
2462   rtx increment, tem;
2463   rtx biv_final_value;
2464   int biv_splittable;
2465   int result = 0;
2466
2467   for (bl = ivs->list; bl; bl = bl->next)
2468     {
2469       /* Biv_total_increment must return a constant value,
2470          otherwise we can not calculate the split values.  */
2471
2472       increment = biv_total_increment (bl);
2473       if (! increment || GET_CODE (increment) != CONST_INT)
2474         continue;
2475
2476       /* The loop must be unrolled completely, or else have a known number
2477          of iterations and only one exit, or else the biv must be dead
2478          outside the loop, or else the final value must be known.  Otherwise,
2479          it is unsafe to split the biv since it may not have the proper
2480          value on loop exit.  */
2481
2482       /* loop_number_exit_count is non-zero if the loop has an exit other than
2483          a fall through at the end.  */
2484
2485       biv_splittable = 1;
2486       biv_final_value = 0;
2487       if (unroll_type != UNROLL_COMPLETELY
2488           && (loop->exit_count || unroll_type == UNROLL_NAIVE)
2489           && (REGNO_LAST_LUID (bl->regno) >= INSN_LUID (loop->end)
2490               || ! bl->init_insn
2491               || INSN_UID (bl->init_insn) >= max_uid_for_loop
2492               || (REGNO_FIRST_LUID (bl->regno)
2493                   < INSN_LUID (bl->init_insn))
2494               || reg_mentioned_p (bl->biv->dest_reg, SET_SRC (bl->init_set)))
2495           && ! (biv_final_value = final_biv_value (loop, bl)))
2496         biv_splittable = 0;
2497
2498       /* If any of the insns setting the BIV don't do so with a simple
2499          PLUS, we don't know how to split it.  */
2500       for (v = bl->biv; biv_splittable && v; v = v->next_iv)
2501         if ((tem = single_set (v->insn)) == 0
2502             || GET_CODE (SET_DEST (tem)) != REG
2503             || REGNO (SET_DEST (tem)) != bl->regno
2504             || GET_CODE (SET_SRC (tem)) != PLUS)
2505           biv_splittable = 0;
2506
2507       /* If final value is non-zero, then must emit an instruction which sets
2508          the value of the biv to the proper value.  This is done after
2509          handling all of the givs, since some of them may need to use the
2510          biv's value in their initialization code.  */
2511
2512       /* This biv is splittable.  If completely unrolling the loop, save
2513          the biv's initial value.  Otherwise, save the constant zero.  */
2514
2515       if (biv_splittable == 1)
2516         {
2517           if (unroll_type == UNROLL_COMPLETELY)
2518             {
2519               /* If the initial value of the biv is itself (i.e. it is too
2520                  complicated for strength_reduce to compute), or is a hard
2521                  register, or it isn't invariant, then we must create a new
2522                  pseudo reg to hold the initial value of the biv.  */
2523
2524               if (GET_CODE (bl->initial_value) == REG
2525                   && (REGNO (bl->initial_value) == bl->regno
2526                       || REGNO (bl->initial_value) < FIRST_PSEUDO_REGISTER
2527                       || ! loop_invariant_p (loop, bl->initial_value)))
2528                 {
2529                   rtx tem = gen_reg_rtx (bl->biv->mode);
2530
2531                   record_base_value (REGNO (tem), bl->biv->add_val, 0);
2532                   loop_insn_hoist (loop,
2533                                    gen_move_insn (tem, bl->biv->src_reg));
2534
2535                   if (loop_dump_stream)
2536                     fprintf (loop_dump_stream,
2537                              "Biv %d initial value remapped to %d.\n",
2538                              bl->regno, REGNO (tem));
2539
2540                   splittable_regs[bl->regno] = tem;
2541                 }
2542               else
2543                 splittable_regs[bl->regno] = bl->initial_value;
2544             }
2545           else
2546             splittable_regs[bl->regno] = const0_rtx;
2547
2548           /* Save the number of instructions that modify the biv, so that
2549              we can treat the last one specially.  */
2550
2551           splittable_regs_updates[bl->regno] = bl->biv_count;
2552           result += bl->biv_count;
2553
2554           if (loop_dump_stream)
2555             fprintf (loop_dump_stream,
2556                      "Biv %d safe to split.\n", bl->regno);
2557         }
2558
2559       /* Check every giv that depends on this biv to see whether it is
2560          splittable also.  Even if the biv isn't splittable, givs which
2561          depend on it may be splittable if the biv is live outside the
2562          loop, and the givs aren't.  */
2563
2564       result += find_splittable_givs (loop, bl, unroll_type, increment,
2565                                       unroll_number);
2566
2567       /* If final value is non-zero, then must emit an instruction which sets
2568          the value of the biv to the proper value.  This is done after
2569          handling all of the givs, since some of them may need to use the
2570          biv's value in their initialization code.  */
2571       if (biv_final_value)
2572         {
2573           /* If the loop has multiple exits, emit the insns before the
2574              loop to ensure that it will always be executed no matter
2575              how the loop exits.  Otherwise emit the insn after the loop,
2576              since this is slightly more efficient.  */
2577           if (! loop->exit_count)
2578             loop_insn_sink (loop, gen_move_insn (bl->biv->src_reg,
2579                                                  biv_final_value));
2580           else
2581             {
2582               /* Create a new register to hold the value of the biv, and then
2583                  set the biv to its final value before the loop start.  The biv
2584                  is set to its final value before loop start to ensure that
2585                  this insn will always be executed, no matter how the loop
2586                  exits.  */
2587               rtx tem = gen_reg_rtx (bl->biv->mode);
2588               record_base_value (REGNO (tem), bl->biv->add_val, 0);
2589
2590               loop_insn_hoist (loop, gen_move_insn (tem, bl->biv->src_reg));
2591               loop_insn_hoist (loop, gen_move_insn (bl->biv->src_reg,
2592                                                     biv_final_value));
2593
2594               if (loop_dump_stream)
2595                 fprintf (loop_dump_stream, "Biv %d mapped to %d for split.\n",
2596                          REGNO (bl->biv->src_reg), REGNO (tem));
2597
2598               /* Set up the mapping from the original biv register to the new
2599                  register.  */
2600               bl->biv->src_reg = tem;
2601             }
2602         }
2603     }
2604   return result;
2605 }
2606
2607 /* Return 1 if the first and last unrolled copy of the address giv V is valid
2608    for the instruction that is using it.  Do not make any changes to that
2609    instruction.  */
2610
2611 static int
2612 verify_addresses (v, giv_inc, unroll_number)
2613      struct induction *v;
2614      rtx giv_inc;
2615      int unroll_number;
2616 {
2617   int ret = 1;
2618   rtx orig_addr = *v->location;
2619   rtx last_addr = plus_constant (v->dest_reg,
2620                                  INTVAL (giv_inc) * (unroll_number - 1));
2621
2622   /* First check to see if either address would fail.   Handle the fact
2623      that we have may have a match_dup.  */
2624   if (! validate_replace_rtx (*v->location, v->dest_reg, v->insn)
2625       || ! validate_replace_rtx (*v->location, last_addr, v->insn))
2626     ret = 0;
2627
2628   /* Now put things back the way they were before.  This should always
2629    succeed.  */
2630   if (! validate_replace_rtx (*v->location, orig_addr, v->insn))
2631     abort ();
2632
2633   return ret;
2634 }
2635
2636 /* For every giv based on the biv BL, check to determine whether it is
2637    splittable.  This is a subroutine to find_splittable_regs ().
2638
2639    Return the number of instructions that set splittable registers.  */
2640
2641 static int
2642 find_splittable_givs (loop, bl, unroll_type, increment, unroll_number)
2643      const struct loop *loop;
2644      struct iv_class *bl;
2645      enum unroll_types unroll_type;
2646      rtx increment;
2647      int unroll_number;
2648 {
2649   struct loop_ivs *ivs = LOOP_IVS (loop);
2650   struct induction *v, *v2;
2651   rtx final_value;
2652   rtx tem;
2653   int result = 0;
2654
2655   /* Scan the list of givs, and set the same_insn field when there are
2656      multiple identical givs in the same insn.  */
2657   for (v = bl->giv; v; v = v->next_iv)
2658     for (v2 = v->next_iv; v2; v2 = v2->next_iv)
2659       if (v->insn == v2->insn && rtx_equal_p (v->new_reg, v2->new_reg)
2660           && ! v2->same_insn)
2661         v2->same_insn = v;
2662
2663   for (v = bl->giv; v; v = v->next_iv)
2664     {
2665       rtx giv_inc, value;
2666
2667       /* Only split the giv if it has already been reduced, or if the loop is
2668          being completely unrolled.  */
2669       if (unroll_type != UNROLL_COMPLETELY && v->ignore)
2670         continue;
2671
2672       /* The giv can be split if the insn that sets the giv is executed once
2673          and only once on every iteration of the loop.  */
2674       /* An address giv can always be split.  v->insn is just a use not a set,
2675          and hence it does not matter whether it is always executed.  All that
2676          matters is that all the biv increments are always executed, and we
2677          won't reach here if they aren't.  */
2678       if (v->giv_type != DEST_ADDR
2679           && (! v->always_computable
2680               || back_branch_in_range_p (loop, v->insn)))
2681         continue;
2682
2683       /* The giv increment value must be a constant.  */
2684       giv_inc = fold_rtx_mult_add (v->mult_val, increment, const0_rtx,
2685                                    v->mode);
2686       if (! giv_inc || GET_CODE (giv_inc) != CONST_INT)
2687         continue;
2688
2689       /* The loop must be unrolled completely, or else have a known number of
2690          iterations and only one exit, or else the giv must be dead outside
2691          the loop, or else the final value of the giv must be known.
2692          Otherwise, it is not safe to split the giv since it may not have the
2693          proper value on loop exit.  */
2694
2695       /* The used outside loop test will fail for DEST_ADDR givs.  They are
2696          never used outside the loop anyways, so it is always safe to split a
2697          DEST_ADDR giv.  */
2698
2699       final_value = 0;
2700       if (unroll_type != UNROLL_COMPLETELY
2701           && (loop->exit_count || unroll_type == UNROLL_NAIVE)
2702           && v->giv_type != DEST_ADDR
2703           /* The next part is true if the pseudo is used outside the loop.
2704              We assume that this is true for any pseudo created after loop
2705              starts, because we don't have a reg_n_info entry for them.  */
2706           && (REGNO (v->dest_reg) >= max_reg_before_loop
2707               || (REGNO_FIRST_UID (REGNO (v->dest_reg)) != INSN_UID (v->insn)
2708                   /* Check for the case where the pseudo is set by a shift/add
2709                      sequence, in which case the first insn setting the pseudo
2710                      is the first insn of the shift/add sequence.  */
2711                   && (! (tem = find_reg_note (v->insn, REG_RETVAL, NULL_RTX))
2712                       || (REGNO_FIRST_UID (REGNO (v->dest_reg))
2713                           != INSN_UID (XEXP (tem, 0)))))
2714               /* Line above always fails if INSN was moved by loop opt.  */
2715               || (REGNO_LAST_LUID (REGNO (v->dest_reg))
2716                   >= INSN_LUID (loop->end)))
2717           && ! (final_value = v->final_value))
2718         continue;
2719
2720 #if 0
2721       /* Currently, non-reduced/final-value givs are never split.  */
2722       /* Should emit insns after the loop if possible, as the biv final value
2723          code below does.  */
2724
2725       /* If the final value is non-zero, and the giv has not been reduced,
2726          then must emit an instruction to set the final value.  */
2727       if (final_value && !v->new_reg)
2728         {
2729           /* Create a new register to hold the value of the giv, and then set
2730              the giv to its final value before the loop start.  The giv is set
2731              to its final value before loop start to ensure that this insn
2732              will always be executed, no matter how we exit.  */
2733           tem = gen_reg_rtx (v->mode);
2734           loop_insn_hoist (loop, gen_move_insn (tem, v->dest_reg));
2735           loop_insn_hoist (loop, gen_move_insn (v->dest_reg, final_value));
2736
2737           if (loop_dump_stream)
2738             fprintf (loop_dump_stream, "Giv %d mapped to %d for split.\n",
2739                      REGNO (v->dest_reg), REGNO (tem));
2740
2741           v->src_reg = tem;
2742         }
2743 #endif
2744
2745       /* This giv is splittable.  If completely unrolling the loop, save the
2746          giv's initial value.  Otherwise, save the constant zero for it.  */
2747
2748       if (unroll_type == UNROLL_COMPLETELY)
2749         {
2750           /* It is not safe to use bl->initial_value here, because it may not
2751              be invariant.  It is safe to use the initial value stored in
2752              the splittable_regs array if it is set.  In rare cases, it won't
2753              be set, so then we do exactly the same thing as
2754              find_splittable_regs does to get a safe value.  */
2755           rtx biv_initial_value;
2756
2757           if (splittable_regs[bl->regno])
2758             biv_initial_value = splittable_regs[bl->regno];
2759           else if (GET_CODE (bl->initial_value) != REG
2760                    || (REGNO (bl->initial_value) != bl->regno
2761                        && REGNO (bl->initial_value) >= FIRST_PSEUDO_REGISTER))
2762             biv_initial_value = bl->initial_value;
2763           else
2764             {
2765               rtx tem = gen_reg_rtx (bl->biv->mode);
2766
2767               record_base_value (REGNO (tem), bl->biv->add_val, 0);
2768               loop_insn_hoist (loop, gen_move_insn (tem, bl->biv->src_reg));
2769               biv_initial_value = tem;
2770             }
2771           biv_initial_value = extend_value_for_giv (v, biv_initial_value);
2772           value = fold_rtx_mult_add (v->mult_val, biv_initial_value,
2773                                      v->add_val, v->mode);
2774         }
2775       else
2776         value = const0_rtx;
2777
2778       if (v->new_reg)
2779         {
2780           /* If a giv was combined with another giv, then we can only split
2781              this giv if the giv it was combined with was reduced.  This
2782              is because the value of v->new_reg is meaningless in this
2783              case.  */
2784           if (v->same && ! v->same->new_reg)
2785             {
2786               if (loop_dump_stream)
2787                 fprintf (loop_dump_stream,
2788                          "giv combined with unreduced giv not split.\n");
2789               continue;
2790             }
2791           /* If the giv is an address destination, it could be something other
2792              than a simple register, these have to be treated differently.  */
2793           else if (v->giv_type == DEST_REG)
2794             {
2795               /* If value is not a constant, register, or register plus
2796                  constant, then compute its value into a register before
2797                  loop start.  This prevents invalid rtx sharing, and should
2798                  generate better code.  We can use bl->initial_value here
2799                  instead of splittable_regs[bl->regno] because this code
2800                  is going before the loop start.  */
2801               if (unroll_type == UNROLL_COMPLETELY
2802                   && GET_CODE (value) != CONST_INT
2803                   && GET_CODE (value) != REG
2804                   && (GET_CODE (value) != PLUS
2805                       || GET_CODE (XEXP (value, 0)) != REG
2806                       || GET_CODE (XEXP (value, 1)) != CONST_INT))
2807                 {
2808                   rtx tem = gen_reg_rtx (v->mode);
2809                   record_base_value (REGNO (tem), v->add_val, 0);
2810                   loop_iv_add_mult_hoist (loop, bl->initial_value, v->mult_val,
2811                                           v->add_val, tem);
2812                   value = tem;
2813                 }
2814
2815               splittable_regs[REGNO (v->new_reg)] = value;
2816             }
2817           else
2818             {
2819               /* Splitting address givs is useful since it will often allow us
2820                  to eliminate some increment insns for the base giv as
2821                  unnecessary.  */
2822
2823               /* If the addr giv is combined with a dest_reg giv, then all
2824                  references to that dest reg will be remapped, which is NOT
2825                  what we want for split addr regs. We always create a new
2826                  register for the split addr giv, just to be safe.  */
2827
2828               /* If we have multiple identical address givs within a
2829                  single instruction, then use a single pseudo reg for
2830                  both.  This is necessary in case one is a match_dup
2831                  of the other.  */
2832
2833               v->const_adjust = 0;
2834
2835               if (v->same_insn)
2836                 {
2837                   v->dest_reg = v->same_insn->dest_reg;
2838                   if (loop_dump_stream)
2839                     fprintf (loop_dump_stream,
2840                              "Sharing address givs in insn %d\n",
2841                              INSN_UID (v->insn));
2842                 }
2843               /* If multiple address GIVs have been combined with the
2844                  same dest_reg GIV, do not create a new register for
2845                  each.  */
2846               else if (unroll_type != UNROLL_COMPLETELY
2847                        && v->giv_type == DEST_ADDR
2848                        && v->same && v->same->giv_type == DEST_ADDR
2849                        && v->same->unrolled
2850                        /* combine_givs_p may return true for some cases
2851                           where the add and mult values are not equal.
2852                           To share a register here, the values must be
2853                           equal.  */
2854                        && rtx_equal_p (v->same->mult_val, v->mult_val)
2855                        && rtx_equal_p (v->same->add_val, v->add_val)
2856                        /* If the memory references have different modes,
2857                           then the address may not be valid and we must
2858                           not share registers.  */
2859                        && verify_addresses (v, giv_inc, unroll_number))
2860                 {
2861                   v->dest_reg = v->same->dest_reg;
2862                   v->shared = 1;
2863                 }
2864               else if (unroll_type != UNROLL_COMPLETELY)
2865                 {
2866                   /* If not completely unrolling the loop, then create a new
2867                      register to hold the split value of the DEST_ADDR giv.
2868                      Emit insn to initialize its value before loop start.  */
2869
2870                   rtx tem = gen_reg_rtx (v->mode);
2871                   struct induction *same = v->same;
2872                   rtx new_reg = v->new_reg;
2873                   record_base_value (REGNO (tem), v->add_val, 0);
2874
2875                   /* If the address giv has a constant in its new_reg value,
2876                      then this constant can be pulled out and put in value,
2877                      instead of being part of the initialization code.  */
2878
2879                   if (GET_CODE (new_reg) == PLUS
2880                       && GET_CODE (XEXP (new_reg, 1)) == CONST_INT)
2881                     {
2882                       v->dest_reg
2883                         = plus_constant (tem, INTVAL (XEXP (new_reg, 1)));
2884
2885                       /* Only succeed if this will give valid addresses.
2886                          Try to validate both the first and the last
2887                          address resulting from loop unrolling, if
2888                          one fails, then can't do const elim here.  */
2889                       if (verify_addresses (v, giv_inc, unroll_number))
2890                         {
2891                           /* Save the negative of the eliminated const, so
2892                              that we can calculate the dest_reg's increment
2893                              value later.  */
2894                           v->const_adjust = -INTVAL (XEXP (new_reg, 1));
2895
2896                           new_reg = XEXP (new_reg, 0);
2897                           if (loop_dump_stream)
2898                             fprintf (loop_dump_stream,
2899                                      "Eliminating constant from giv %d\n",
2900                                      REGNO (tem));
2901                         }
2902                       else
2903                         v->dest_reg = tem;
2904                     }
2905                   else
2906                     v->dest_reg = tem;
2907
2908                   /* If the address hasn't been checked for validity yet, do so
2909                      now, and fail completely if either the first or the last
2910                      unrolled copy of the address is not a valid address
2911                      for the instruction that uses it.  */
2912                   if (v->dest_reg == tem
2913                       && ! verify_addresses (v, giv_inc, unroll_number))
2914                     {
2915                       for (v2 = v->next_iv; v2; v2 = v2->next_iv)
2916                         if (v2->same_insn == v)
2917                           v2->same_insn = 0;
2918
2919                       if (loop_dump_stream)
2920                         fprintf (loop_dump_stream,
2921                                  "Invalid address for giv at insn %d\n",
2922                                  INSN_UID (v->insn));
2923                       continue;
2924                     }
2925
2926                   v->new_reg = new_reg;
2927                   v->same = same;
2928
2929                   /* We set this after the address check, to guarantee that
2930                      the register will be initialized.  */
2931                   v->unrolled = 1;
2932
2933                   /* To initialize the new register, just move the value of
2934                      new_reg into it.  This is not guaranteed to give a valid
2935                      instruction on machines with complex addressing modes.
2936                      If we can't recognize it, then delete it and emit insns
2937                      to calculate the value from scratch.  */
2938                   loop_insn_hoist (loop, gen_rtx_SET (VOIDmode, tem,
2939                                                       copy_rtx (v->new_reg)));
2940                   if (recog_memoized (PREV_INSN (loop->start)) < 0)
2941                     {
2942                       rtx sequence, ret;
2943
2944                       /* We can't use bl->initial_value to compute the initial
2945                          value, because the loop may have been preconditioned.
2946                          We must calculate it from NEW_REG.  */
2947                       delete_related_insns (PREV_INSN (loop->start));
2948
2949                       start_sequence ();
2950                       ret = force_operand (v->new_reg, tem);
2951                       if (ret != tem)
2952                         emit_move_insn (tem, ret);
2953                       sequence = get_insns ();
2954                       end_sequence ();
2955                       loop_insn_hoist (loop, sequence);
2956
2957                       if (loop_dump_stream)
2958                         fprintf (loop_dump_stream,
2959                                  "Invalid init insn, rewritten.\n");
2960                     }
2961                 }
2962               else
2963                 {
2964                   v->dest_reg = value;
2965
2966                   /* Check the resulting address for validity, and fail
2967                      if the resulting address would be invalid.  */
2968                   if (! verify_addresses (v, giv_inc, unroll_number))
2969                     {
2970                       for (v2 = v->next_iv; v2; v2 = v2->next_iv)
2971                         if (v2->same_insn == v)
2972                           v2->same_insn = 0;
2973
2974                       if (loop_dump_stream)
2975                         fprintf (loop_dump_stream,
2976                                  "Invalid address for giv at insn %d\n",
2977                                  INSN_UID (v->insn));
2978                       continue;
2979                     }
2980                 }
2981
2982               /* Store the value of dest_reg into the insn.  This sharing
2983                  will not be a problem as this insn will always be copied
2984                  later.  */
2985
2986               *v->location = v->dest_reg;
2987
2988               /* If this address giv is combined with a dest reg giv, then
2989                  save the base giv's induction pointer so that we will be
2990                  able to handle this address giv properly.  The base giv
2991                  itself does not have to be splittable.  */
2992
2993               if (v->same && v->same->giv_type == DEST_REG)
2994                 addr_combined_regs[REGNO (v->same->new_reg)] = v->same;
2995
2996               if (GET_CODE (v->new_reg) == REG)
2997                 {
2998                   /* This giv maybe hasn't been combined with any others.
2999                      Make sure that it's giv is marked as splittable here.  */
3000
3001                   splittable_regs[REGNO (v->new_reg)] = value;
3002
3003                   /* Make it appear to depend upon itself, so that the
3004                      giv will be properly split in the main loop above.  */
3005                   if (! v->same)
3006                     {
3007                       v->same = v;
3008                       addr_combined_regs[REGNO (v->new_reg)] = v;
3009                     }
3010                 }
3011
3012               if (loop_dump_stream)
3013                 fprintf (loop_dump_stream, "DEST_ADDR giv being split.\n");
3014             }
3015         }
3016       else
3017         {
3018 #if 0
3019           /* Currently, unreduced giv's can't be split.  This is not too much
3020              of a problem since unreduced giv's are not live across loop
3021              iterations anyways.  When unrolling a loop completely though,
3022              it makes sense to reduce&split givs when possible, as this will
3023              result in simpler instructions, and will not require that a reg
3024              be live across loop iterations.  */
3025
3026           splittable_regs[REGNO (v->dest_reg)] = value;
3027           fprintf (stderr, "Giv %d at insn %d not reduced\n",
3028                    REGNO (v->dest_reg), INSN_UID (v->insn));
3029 #else
3030           continue;
3031 #endif
3032         }
3033
3034       /* Unreduced givs are only updated once by definition.  Reduced givs
3035          are updated as many times as their biv is.  Mark it so if this is
3036          a splittable register.  Don't need to do anything for address givs
3037          where this may not be a register.  */
3038
3039       if (GET_CODE (v->new_reg) == REG)
3040         {
3041           int count = 1;
3042           if (! v->ignore)
3043             count = REG_IV_CLASS (ivs, REGNO (v->src_reg))->biv_count;
3044
3045           splittable_regs_updates[REGNO (v->new_reg)] = count;
3046         }
3047
3048       result++;
3049
3050       if (loop_dump_stream)
3051         {
3052           int regnum;
3053
3054           if (GET_CODE (v->dest_reg) == CONST_INT)
3055             regnum = -1;
3056           else if (GET_CODE (v->dest_reg) != REG)
3057             regnum = REGNO (XEXP (v->dest_reg, 0));
3058           else
3059             regnum = REGNO (v->dest_reg);
3060           fprintf (loop_dump_stream, "Giv %d at insn %d safe to split.\n",
3061                    regnum, INSN_UID (v->insn));
3062         }
3063     }
3064
3065   return result;
3066 }
3067 \f
3068 /* Try to prove that the register is dead after the loop exits.  Trace every
3069    loop exit looking for an insn that will always be executed, which sets
3070    the register to some value, and appears before the first use of the register
3071    is found.  If successful, then return 1, otherwise return 0.  */
3072
3073 /* ?? Could be made more intelligent in the handling of jumps, so that
3074    it can search past if statements and other similar structures.  */
3075
3076 static int
3077 reg_dead_after_loop (loop, reg)
3078      const struct loop *loop;
3079      rtx reg;
3080 {
3081   rtx insn, label;
3082   enum rtx_code code;
3083   int jump_count = 0;
3084   int label_count = 0;
3085
3086   /* In addition to checking all exits of this loop, we must also check
3087      all exits of inner nested loops that would exit this loop.  We don't
3088      have any way to identify those, so we just give up if there are any
3089      such inner loop exits.  */
3090
3091   for (label = loop->exit_labels; label; label = LABEL_NEXTREF (label))
3092     label_count++;
3093
3094   if (label_count != loop->exit_count)
3095     return 0;
3096
3097   /* HACK: Must also search the loop fall through exit, create a label_ref
3098      here which points to the loop->end, and append the loop_number_exit_labels
3099      list to it.  */
3100   label = gen_rtx_LABEL_REF (VOIDmode, loop->end);
3101   LABEL_NEXTREF (label) = loop->exit_labels;
3102
3103   for (; label; label = LABEL_NEXTREF (label))
3104     {
3105       /* Succeed if find an insn which sets the biv or if reach end of
3106          function.  Fail if find an insn that uses the biv, or if come to
3107          a conditional jump.  */
3108
3109       insn = NEXT_INSN (XEXP (label, 0));
3110       while (insn)
3111         {
3112           code = GET_CODE (insn);
3113           if (GET_RTX_CLASS (code) == 'i')
3114             {
3115               rtx set;
3116
3117               if (reg_referenced_p (reg, PATTERN (insn)))
3118                 return 0;
3119
3120               set = single_set (insn);
3121               if (set && rtx_equal_p (SET_DEST (set), reg))
3122                 break;
3123             }
3124
3125           if (code == JUMP_INSN)
3126             {
3127               if (GET_CODE (PATTERN (insn)) == RETURN)
3128                 break;
3129               else if (!any_uncondjump_p (insn)
3130                        /* Prevent infinite loop following infinite loops.  */
3131                        || jump_count++ > 20)
3132                 return 0;
3133               else
3134                 insn = JUMP_LABEL (insn);
3135             }
3136
3137           insn = NEXT_INSN (insn);
3138         }
3139     }
3140
3141   /* Success, the register is dead on all loop exits.  */
3142   return 1;
3143 }
3144
3145 /* Try to calculate the final value of the biv, the value it will have at
3146    the end of the loop.  If we can do it, return that value.  */
3147
3148 rtx
3149 final_biv_value (loop, bl)
3150      const struct loop *loop;
3151      struct iv_class *bl;
3152 {
3153   unsigned HOST_WIDE_INT n_iterations = LOOP_INFO (loop)->n_iterations;
3154   rtx increment, tem;
3155
3156   /* ??? This only works for MODE_INT biv's.  Reject all others for now.  */
3157
3158   if (GET_MODE_CLASS (bl->biv->mode) != MODE_INT)
3159     return 0;
3160
3161   /* The final value for reversed bivs must be calculated differently than
3162      for ordinary bivs.  In this case, there is already an insn after the
3163      loop which sets this biv's final value (if necessary), and there are
3164      no other loop exits, so we can return any value.  */
3165   if (bl->reversed)
3166     {
3167       if (loop_dump_stream)
3168         fprintf (loop_dump_stream,
3169                  "Final biv value for %d, reversed biv.\n", bl->regno);
3170
3171       return const0_rtx;
3172     }
3173
3174   /* Try to calculate the final value as initial value + (number of iterations
3175      * increment).  For this to work, increment must be invariant, the only
3176      exit from the loop must be the fall through at the bottom (otherwise
3177      it may not have its final value when the loop exits), and the initial
3178      value of the biv must be invariant.  */
3179
3180   if (n_iterations != 0
3181       && ! loop->exit_count
3182       && loop_invariant_p (loop, bl->initial_value))
3183     {
3184       increment = biv_total_increment (bl);
3185
3186       if (increment && loop_invariant_p (loop, increment))
3187         {
3188           /* Can calculate the loop exit value, emit insns after loop
3189              end to calculate this value into a temporary register in
3190              case it is needed later.  */
3191
3192           tem = gen_reg_rtx (bl->biv->mode);
3193           record_base_value (REGNO (tem), bl->biv->add_val, 0);
3194           loop_iv_add_mult_sink (loop, increment, GEN_INT (n_iterations),
3195                                  bl->initial_value, tem);
3196
3197           if (loop_dump_stream)
3198             fprintf (loop_dump_stream,
3199                      "Final biv value for %d, calculated.\n", bl->regno);
3200
3201           return tem;
3202         }
3203     }
3204
3205   /* Check to see if the biv is dead at all loop exits.  */
3206   if (reg_dead_after_loop (loop, bl->biv->src_reg))
3207     {
3208       if (loop_dump_stream)
3209         fprintf (loop_dump_stream,
3210                  "Final biv value for %d, biv dead after loop exit.\n",
3211                  bl->regno);
3212
3213       return const0_rtx;
3214     }
3215
3216   return 0;
3217 }
3218
3219 /* Try to calculate the final value of the giv, the value it will have at
3220    the end of the loop.  If we can do it, return that value.  */
3221
3222 rtx
3223 final_giv_value (loop, v)
3224      const struct loop *loop;
3225      struct induction *v;
3226 {
3227   struct loop_ivs *ivs = LOOP_IVS (loop);
3228   struct iv_class *bl;
3229   rtx insn;
3230   rtx increment, tem;
3231   rtx seq;
3232   rtx loop_end = loop->end;
3233   unsigned HOST_WIDE_INT n_iterations = LOOP_INFO (loop)->n_iterations;
3234
3235   bl = REG_IV_CLASS (ivs, REGNO (v->src_reg));
3236
3237   /* The final value for givs which depend on reversed bivs must be calculated
3238      differently than for ordinary givs.  In this case, there is already an
3239      insn after the loop which sets this giv's final value (if necessary),
3240      and there are no other loop exits, so we can return any value.  */
3241   if (bl->reversed)
3242     {
3243       if (loop_dump_stream)
3244         fprintf (loop_dump_stream,
3245                  "Final giv value for %d, depends on reversed biv\n",
3246                  REGNO (v->dest_reg));
3247       return const0_rtx;
3248     }
3249
3250   /* Try to calculate the final value as a function of the biv it depends
3251      upon.  The only exit from the loop must be the fall through at the bottom
3252      and the insn that sets the giv must be executed on every iteration
3253      (otherwise the giv may not have its final value when the loop exits).  */
3254
3255   /* ??? Can calculate the final giv value by subtracting off the
3256      extra biv increments times the giv's mult_val.  The loop must have
3257      only one exit for this to work, but the loop iterations does not need
3258      to be known.  */
3259
3260   if (n_iterations != 0
3261       && ! loop->exit_count
3262       && v->always_executed)
3263     {
3264       /* ?? It is tempting to use the biv's value here since these insns will
3265          be put after the loop, and hence the biv will have its final value
3266          then.  However, this fails if the biv is subsequently eliminated.
3267          Perhaps determine whether biv's are eliminable before trying to
3268          determine whether giv's are replaceable so that we can use the
3269          biv value here if it is not eliminable.  */
3270
3271       /* We are emitting code after the end of the loop, so we must make
3272          sure that bl->initial_value is still valid then.  It will still
3273          be valid if it is invariant.  */
3274
3275       increment = biv_total_increment (bl);
3276
3277       if (increment && loop_invariant_p (loop, increment)
3278           && loop_invariant_p (loop, bl->initial_value))
3279         {
3280           /* Can calculate the loop exit value of its biv as
3281              (n_iterations * increment) + initial_value */
3282
3283           /* The loop exit value of the giv is then
3284              (final_biv_value - extra increments) * mult_val + add_val.
3285              The extra increments are any increments to the biv which
3286              occur in the loop after the giv's value is calculated.
3287              We must search from the insn that sets the giv to the end
3288              of the loop to calculate this value.  */
3289
3290           /* Put the final biv value in tem.  */
3291           tem = gen_reg_rtx (v->mode);
3292           record_base_value (REGNO (tem), bl->biv->add_val, 0);
3293           loop_iv_add_mult_sink (loop, extend_value_for_giv (v, increment),
3294                                  GEN_INT (n_iterations),
3295                                  extend_value_for_giv (v, bl->initial_value),
3296                                  tem);
3297
3298           /* Subtract off extra increments as we find them.  */
3299           for (insn = NEXT_INSN (v->insn); insn != loop_end;
3300                insn = NEXT_INSN (insn))
3301             {
3302               struct induction *biv;
3303
3304               for (biv = bl->biv; biv; biv = biv->next_iv)
3305                 if (biv->insn == insn)
3306                   {
3307                     start_sequence ();
3308                     tem = expand_simple_binop (GET_MODE (tem), MINUS, tem,
3309                                                biv->add_val, NULL_RTX, 0,
3310                                                OPTAB_LIB_WIDEN);
3311                     seq = get_insns ();
3312                     end_sequence ();
3313                     loop_insn_sink (loop, seq);
3314                   }
3315             }
3316
3317           /* Now calculate the giv's final value.  */
3318           loop_iv_add_mult_sink (loop, tem, v->mult_val, v->add_val, tem);
3319
3320           if (loop_dump_stream)
3321             fprintf (loop_dump_stream,
3322                      "Final giv value for %d, calc from biv's value.\n",
3323                      REGNO (v->dest_reg));
3324
3325           return tem;
3326         }
3327     }
3328
3329   /* Replaceable giv's should never reach here.  */
3330   if (v->replaceable)
3331     abort ();
3332
3333   /* Check to see if the biv is dead at all loop exits.  */
3334   if (reg_dead_after_loop (loop, v->dest_reg))
3335     {
3336       if (loop_dump_stream)
3337         fprintf (loop_dump_stream,
3338                  "Final giv value for %d, giv dead after loop exit.\n",
3339                  REGNO (v->dest_reg));
3340
3341       return const0_rtx;
3342     }
3343
3344   return 0;
3345 }
3346
3347 /* Look back before LOOP->START for the insn that sets REG and return
3348    the equivalent constant if there is a REG_EQUAL note otherwise just
3349    the SET_SRC of REG.  */
3350
3351 static rtx
3352 loop_find_equiv_value (loop, reg)
3353      const struct loop *loop;
3354      rtx reg;
3355 {
3356   rtx loop_start = loop->start;
3357   rtx insn, set;
3358   rtx ret;
3359
3360   ret = reg;
3361   for (insn = PREV_INSN (loop_start); insn; insn = PREV_INSN (insn))
3362     {
3363       if (GET_CODE (insn) == CODE_LABEL)
3364         break;
3365
3366       else if (INSN_P (insn) && reg_set_p (reg, insn))
3367         {
3368           /* We found the last insn before the loop that sets the register.
3369              If it sets the entire register, and has a REG_EQUAL note,
3370              then use the value of the REG_EQUAL note.  */
3371           if ((set = single_set (insn))
3372               && (SET_DEST (set) == reg))
3373             {
3374               rtx note = find_reg_note (insn, REG_EQUAL, NULL_RTX);
3375
3376               /* Only use the REG_EQUAL note if it is a constant.
3377                  Other things, divide in particular, will cause
3378                  problems later if we use them.  */
3379               if (note && GET_CODE (XEXP (note, 0)) != EXPR_LIST
3380                   && CONSTANT_P (XEXP (note, 0)))
3381                 ret = XEXP (note, 0);
3382               else
3383                 ret = SET_SRC (set);
3384
3385               /* We cannot do this if it changes between the
3386                  assignment and loop start though.  */
3387               if (modified_between_p (ret, insn, loop_start))
3388                 ret = reg;
3389             }
3390           break;
3391         }
3392     }
3393   return ret;
3394 }
3395
3396 /* Return a simplified rtx for the expression OP - REG.
3397
3398    REG must appear in OP, and OP must be a register or the sum of a register
3399    and a second term.
3400
3401    Thus, the return value must be const0_rtx or the second term.
3402
3403    The caller is responsible for verifying that REG appears in OP and OP has
3404    the proper form.  */
3405
3406 static rtx
3407 subtract_reg_term (op, reg)
3408      rtx op, reg;
3409 {
3410   if (op == reg)
3411     return const0_rtx;
3412   if (GET_CODE (op) == PLUS)
3413     {
3414       if (XEXP (op, 0) == reg)
3415         return XEXP (op, 1);
3416       else if (XEXP (op, 1) == reg)
3417         return XEXP (op, 0);
3418     }
3419   /* OP does not contain REG as a term.  */
3420   abort ();
3421 }
3422
3423 /* Find and return register term common to both expressions OP0 and
3424    OP1 or NULL_RTX if no such term exists.  Each expression must be a
3425    REG or a PLUS of a REG.  */
3426
3427 static rtx
3428 find_common_reg_term (op0, op1)
3429      rtx op0, op1;
3430 {
3431   if ((GET_CODE (op0) == REG || GET_CODE (op0) == PLUS)
3432       && (GET_CODE (op1) == REG || GET_CODE (op1) == PLUS))
3433     {
3434       rtx op00;
3435       rtx op01;
3436       rtx op10;
3437       rtx op11;
3438
3439       if (GET_CODE (op0) == PLUS)
3440         op01 = XEXP (op0, 1), op00 = XEXP (op0, 0);
3441       else
3442         op01 = const0_rtx, op00 = op0;
3443
3444       if (GET_CODE (op1) == PLUS)
3445         op11 = XEXP (op1, 1), op10 = XEXP (op1, 0);
3446       else
3447         op11 = const0_rtx, op10 = op1;
3448
3449       /* Find and return common register term if present.  */
3450       if (REG_P (op00) && (op00 == op10 || op00 == op11))
3451         return op00;
3452       else if (REG_P (op01) && (op01 == op10 || op01 == op11))
3453         return op01;
3454     }
3455
3456   /* No common register term found.  */
3457   return NULL_RTX;
3458 }
3459
3460 /* Determine the loop iterator and calculate the number of loop
3461    iterations.  Returns the exact number of loop iterations if it can
3462    be calculated, otherwise returns zero.  */
3463
3464 unsigned HOST_WIDE_INT
3465 loop_iterations (loop)
3466      struct loop *loop;
3467 {
3468   struct loop_info *loop_info = LOOP_INFO (loop);
3469   struct loop_ivs *ivs = LOOP_IVS (loop);
3470   rtx comparison, comparison_value;
3471   rtx iteration_var, initial_value, increment, final_value;
3472   enum rtx_code comparison_code;
3473   HOST_WIDE_INT inc;
3474   unsigned HOST_WIDE_INT abs_inc;
3475   unsigned HOST_WIDE_INT abs_diff;
3476   int off_by_one;
3477   int increment_dir;
3478   int unsigned_p, compare_dir, final_larger;
3479   rtx last_loop_insn;
3480   rtx reg_term;
3481   struct iv_class *bl;
3482
3483   loop_info->n_iterations = 0;
3484   loop_info->initial_value = 0;
3485   loop_info->initial_equiv_value = 0;
3486   loop_info->comparison_value = 0;
3487   loop_info->final_value = 0;
3488   loop_info->final_equiv_value = 0;
3489   loop_info->increment = 0;
3490   loop_info->iteration_var = 0;
3491   loop_info->unroll_number = 1;
3492   loop_info->iv = 0;
3493
3494   /* We used to use prev_nonnote_insn here, but that fails because it might
3495      accidentally get the branch for a contained loop if the branch for this
3496      loop was deleted.  We can only trust branches immediately before the
3497      loop_end.  */
3498   last_loop_insn = PREV_INSN (loop->end);
3499
3500   /* ??? We should probably try harder to find the jump insn
3501      at the end of the loop.  The following code assumes that
3502      the last loop insn is a jump to the top of the loop.  */
3503   if (GET_CODE (last_loop_insn) != JUMP_INSN)
3504     {
3505       if (loop_dump_stream)
3506         fprintf (loop_dump_stream,
3507                  "Loop iterations: No final conditional branch found.\n");
3508       return 0;
3509     }
3510
3511   /* If there is a more than a single jump to the top of the loop
3512      we cannot (easily) determine the iteration count.  */
3513   if (LABEL_NUSES (JUMP_LABEL (last_loop_insn)) > 1)
3514     {
3515       if (loop_dump_stream)
3516         fprintf (loop_dump_stream,
3517                  "Loop iterations: Loop has multiple back edges.\n");
3518       return 0;
3519     }
3520
3521   /* If there are multiple conditionalized loop exit tests, they may jump
3522      back to differing CODE_LABELs.  */
3523   if (loop->top && loop->cont)
3524     {
3525       rtx temp = PREV_INSN (last_loop_insn);
3526
3527       do
3528         {
3529           if (GET_CODE (temp) == JUMP_INSN)
3530             {
3531               /* There are some kinds of jumps we can't deal with easily.  */
3532               if (JUMP_LABEL (temp) == 0)
3533                 {
3534                   if (loop_dump_stream)
3535                     fprintf
3536                       (loop_dump_stream,
3537                        "Loop iterations: Jump insn has null JUMP_LABEL.\n");
3538                   return 0;
3539                 }
3540
3541               if (/* Previous unrolling may have generated new insns not
3542                      covered by the uid_luid array.  */
3543                   INSN_UID (JUMP_LABEL (temp)) < max_uid_for_loop
3544                   /* Check if we jump back into the loop body.  */
3545                   && INSN_LUID (JUMP_LABEL (temp)) > INSN_LUID (loop->top)
3546                   && INSN_LUID (JUMP_LABEL (temp)) < INSN_LUID (loop->cont))
3547                 {
3548                   if (loop_dump_stream)
3549                     fprintf
3550                       (loop_dump_stream,
3551                        "Loop iterations: Loop has multiple back edges.\n");
3552                   return 0;
3553                 }
3554             }
3555         }
3556       while ((temp = PREV_INSN (temp)) != loop->cont);
3557     }
3558
3559   /* Find the iteration variable.  If the last insn is a conditional
3560      branch, and the insn before tests a register value, make that the
3561      iteration variable.  */
3562
3563   comparison = get_condition_for_loop (loop, last_loop_insn);
3564   if (comparison == 0)
3565     {
3566       if (loop_dump_stream)
3567         fprintf (loop_dump_stream,
3568                  "Loop iterations: No final comparison found.\n");
3569       return 0;
3570     }
3571
3572   /* ??? Get_condition may switch position of induction variable and
3573      invariant register when it canonicalizes the comparison.  */
3574
3575   comparison_code = GET_CODE (comparison);
3576   iteration_var = XEXP (comparison, 0);
3577   comparison_value = XEXP (comparison, 1);
3578
3579   if (GET_CODE (iteration_var) != REG)
3580     {
3581       if (loop_dump_stream)
3582         fprintf (loop_dump_stream,
3583                  "Loop iterations: Comparison not against register.\n");
3584       return 0;
3585     }
3586
3587   /* The only new registers that are created before loop iterations
3588      are givs made from biv increments or registers created by
3589      load_mems.  In the latter case, it is possible that try_copy_prop
3590      will propagate a new pseudo into the old iteration register but
3591      this will be marked by having the REG_USERVAR_P bit set.  */
3592
3593   if ((unsigned) REGNO (iteration_var) >= ivs->n_regs
3594       && ! REG_USERVAR_P (iteration_var))
3595     abort ();
3596
3597   /* Determine the initial value of the iteration variable, and the amount
3598      that it is incremented each loop.  Use the tables constructed by
3599      the strength reduction pass to calculate these values.  */
3600
3601   /* Clear the result values, in case no answer can be found.  */
3602   initial_value = 0;
3603   increment = 0;
3604
3605   /* The iteration variable can be either a giv or a biv.  Check to see
3606      which it is, and compute the variable's initial value, and increment
3607      value if possible.  */
3608
3609   /* If this is a new register, can't handle it since we don't have any
3610      reg_iv_type entry for it.  */
3611   if ((unsigned) REGNO (iteration_var) >= ivs->n_regs)
3612     {
3613       if (loop_dump_stream)
3614         fprintf (loop_dump_stream,
3615                  "Loop iterations: No reg_iv_type entry for iteration var.\n");
3616       return 0;
3617     }
3618
3619   /* Reject iteration variables larger than the host wide int size, since they
3620      could result in a number of iterations greater than the range of our
3621      `unsigned HOST_WIDE_INT' variable loop_info->n_iterations.  */
3622   else if ((GET_MODE_BITSIZE (GET_MODE (iteration_var))
3623             > HOST_BITS_PER_WIDE_INT))
3624     {
3625       if (loop_dump_stream)
3626         fprintf (loop_dump_stream,
3627                  "Loop iterations: Iteration var rejected because mode too large.\n");
3628       return 0;
3629     }
3630   else if (GET_MODE_CLASS (GET_MODE (iteration_var)) != MODE_INT)
3631     {
3632       if (loop_dump_stream)
3633         fprintf (loop_dump_stream,
3634                  "Loop iterations: Iteration var not an integer.\n");
3635       return 0;
3636     }
3637   else if (REG_IV_TYPE (ivs, REGNO (iteration_var)) == BASIC_INDUCT)
3638     {
3639       if (REGNO (iteration_var) >= ivs->n_regs)
3640         abort ();
3641
3642       /* Grab initial value, only useful if it is a constant.  */
3643       bl = REG_IV_CLASS (ivs, REGNO (iteration_var));
3644       initial_value = bl->initial_value;
3645       if (!bl->biv->always_executed || bl->biv->maybe_multiple)
3646         {
3647           if (loop_dump_stream)
3648             fprintf (loop_dump_stream,
3649                      "Loop iterations: Basic induction var not set once in each iteration.\n");
3650           return 0;
3651         }
3652
3653       increment = biv_total_increment (bl);
3654     }
3655   else if (REG_IV_TYPE (ivs, REGNO (iteration_var)) == GENERAL_INDUCT)
3656     {
3657       HOST_WIDE_INT offset = 0;
3658       struct induction *v = REG_IV_INFO (ivs, REGNO (iteration_var));
3659       rtx biv_initial_value;
3660
3661       if (REGNO (v->src_reg) >= ivs->n_regs)
3662         abort ();
3663
3664       if (!v->always_executed || v->maybe_multiple)
3665         {
3666           if (loop_dump_stream)
3667             fprintf (loop_dump_stream,
3668                      "Loop iterations: General induction var not set once in each iteration.\n");
3669           return 0;
3670         }
3671
3672       bl = REG_IV_CLASS (ivs, REGNO (v->src_reg));
3673
3674       /* Increment value is mult_val times the increment value of the biv.  */
3675
3676       increment = biv_total_increment (bl);
3677       if (increment)
3678         {
3679           struct induction *biv_inc;
3680
3681           increment = fold_rtx_mult_add (v->mult_val,
3682                                          extend_value_for_giv (v, increment),
3683                                          const0_rtx, v->mode);
3684           /* The caller assumes that one full increment has occurred at the
3685              first loop test.  But that's not true when the biv is incremented
3686              after the giv is set (which is the usual case), e.g.:
3687              i = 6; do {;} while (i++ < 9) .
3688              Therefore, we bias the initial value by subtracting the amount of
3689              the increment that occurs between the giv set and the giv test.  */
3690           for (biv_inc = bl->biv; biv_inc; biv_inc = biv_inc->next_iv)
3691             {
3692               if (loop_insn_first_p (v->insn, biv_inc->insn))
3693                 {
3694                   if (REG_P (biv_inc->add_val))
3695                     {
3696                       if (loop_dump_stream)
3697                         fprintf (loop_dump_stream,
3698                                  "Loop iterations: Basic induction var add_val is REG %d.\n",
3699                                  REGNO (biv_inc->add_val));
3700                         return 0;
3701                     }
3702
3703                   offset -= INTVAL (biv_inc->add_val);
3704                 }
3705             }
3706         }
3707       if (loop_dump_stream)
3708         fprintf (loop_dump_stream,
3709                  "Loop iterations: Giv iterator, initial value bias %ld.\n",
3710                  (long) offset);
3711
3712       /* Initial value is mult_val times the biv's initial value plus
3713          add_val.  Only useful if it is a constant.  */
3714       biv_initial_value = extend_value_for_giv (v, bl->initial_value);
3715       initial_value
3716         = fold_rtx_mult_add (v->mult_val,
3717                              plus_constant (biv_initial_value, offset),
3718                              v->add_val, v->mode);
3719     }
3720   else
3721     {
3722       if (loop_dump_stream)
3723         fprintf (loop_dump_stream,
3724                  "Loop iterations: Not basic or general induction var.\n");
3725       return 0;
3726     }
3727
3728   if (initial_value == 0)
3729     return 0;
3730
3731   unsigned_p = 0;
3732   off_by_one = 0;
3733   switch (comparison_code)
3734     {
3735     case LEU:
3736       unsigned_p = 1;
3737     case LE:
3738       compare_dir = 1;
3739       off_by_one = 1;
3740       break;
3741     case GEU:
3742       unsigned_p = 1;
3743     case GE:
3744       compare_dir = -1;
3745       off_by_one = -1;
3746       break;
3747     case EQ:
3748       /* Cannot determine loop iterations with this case.  */
3749       compare_dir = 0;
3750       break;
3751     case LTU:
3752       unsigned_p = 1;
3753     case LT:
3754       compare_dir = 1;
3755       break;
3756     case GTU:
3757       unsigned_p = 1;
3758     case GT:
3759       compare_dir = -1;
3760     case NE:
3761       compare_dir = 0;
3762       break;
3763     default:
3764       abort ();
3765     }
3766
3767   /* If the comparison value is an invariant register, then try to find
3768      its value from the insns before the start of the loop.  */
3769
3770   final_value = comparison_value;
3771   if (GET_CODE (comparison_value) == REG
3772       && loop_invariant_p (loop, comparison_value))
3773     {
3774       final_value = loop_find_equiv_value (loop, comparison_value);
3775
3776       /* If we don't get an invariant final value, we are better
3777          off with the original register.  */
3778       if (! loop_invariant_p (loop, final_value))
3779         final_value = comparison_value;
3780     }
3781
3782   /* Calculate the approximate final value of the induction variable
3783      (on the last successful iteration).  The exact final value
3784      depends on the branch operator, and increment sign.  It will be
3785      wrong if the iteration variable is not incremented by one each
3786      time through the loop and (comparison_value + off_by_one -
3787      initial_value) % increment != 0.
3788      ??? Note that the final_value may overflow and thus final_larger
3789      will be bogus.  A potentially infinite loop will be classified
3790      as immediate, e.g. for (i = 0x7ffffff0; i <= 0x7fffffff; i++)  */
3791   if (off_by_one)
3792     final_value = plus_constant (final_value, off_by_one);
3793
3794   /* Save the calculated values describing this loop's bounds, in case
3795      precondition_loop_p will need them later.  These values can not be
3796      recalculated inside precondition_loop_p because strength reduction
3797      optimizations may obscure the loop's structure.
3798
3799      These values are only required by precondition_loop_p and insert_bct
3800      whenever the number of iterations cannot be computed at compile time.
3801      Only the difference between final_value and initial_value is
3802      important.  Note that final_value is only approximate.  */
3803   loop_info->initial_value = initial_value;
3804   loop_info->comparison_value = comparison_value;
3805   loop_info->final_value = plus_constant (comparison_value, off_by_one);
3806   loop_info->increment = increment;
3807   loop_info->iteration_var = iteration_var;
3808   loop_info->comparison_code = comparison_code;
3809   loop_info->iv = bl;
3810
3811   /* Try to determine the iteration count for loops such
3812      as (for i = init; i < init + const; i++).  When running the
3813      loop optimization twice, the first pass often converts simple
3814      loops into this form.  */
3815
3816   if (REG_P (initial_value))
3817     {
3818       rtx reg1;
3819       rtx reg2;
3820       rtx const2;
3821
3822       reg1 = initial_value;
3823       if (GET_CODE (final_value) == PLUS)
3824         reg2 = XEXP (final_value, 0), const2 = XEXP (final_value, 1);
3825       else
3826         reg2 = final_value, const2 = const0_rtx;
3827
3828       /* Check for initial_value = reg1, final_value = reg2 + const2,
3829          where reg1 != reg2.  */
3830       if (REG_P (reg2) && reg2 != reg1)
3831         {
3832           rtx temp;
3833
3834           /* Find what reg1 is equivalent to.  Hopefully it will
3835              either be reg2 or reg2 plus a constant.  */
3836           temp = loop_find_equiv_value (loop, reg1);
3837
3838           if (find_common_reg_term (temp, reg2))
3839             initial_value = temp;
3840           else
3841             {
3842               /* Find what reg2 is equivalent to.  Hopefully it will
3843                  either be reg1 or reg1 plus a constant.  Let's ignore
3844                  the latter case for now since it is not so common.  */
3845               temp = loop_find_equiv_value (loop, reg2);
3846
3847               if (temp == loop_info->iteration_var)
3848                 temp = initial_value;
3849               if (temp == reg1)
3850                 final_value = (const2 == const0_rtx)
3851                   ? reg1 : gen_rtx_PLUS (GET_MODE (reg1), reg1, const2);
3852             }
3853         }
3854       else if (loop->vtop && GET_CODE (reg2) == CONST_INT)
3855         {
3856           rtx temp;
3857
3858           /* When running the loop optimizer twice, check_dbra_loop
3859              further obfuscates reversible loops of the form:
3860              for (i = init; i < init + const; i++).  We often end up with
3861              final_value = 0, initial_value = temp, temp = temp2 - init,
3862              where temp2 = init + const.  If the loop has a vtop we
3863              can replace initial_value with const.  */
3864
3865           temp = loop_find_equiv_value (loop, reg1);
3866
3867           if (GET_CODE (temp) == MINUS && REG_P (XEXP (temp, 0)))
3868             {
3869               rtx temp2 = loop_find_equiv_value (loop, XEXP (temp, 0));
3870
3871               if (GET_CODE (temp2) == PLUS
3872                   && XEXP (temp2, 0) == XEXP (temp, 1))
3873                 initial_value = XEXP (temp2, 1);
3874             }
3875         }
3876     }
3877
3878   /* If have initial_value = reg + const1 and final_value = reg +
3879      const2, then replace initial_value with const1 and final_value
3880      with const2.  This should be safe since we are protected by the
3881      initial comparison before entering the loop if we have a vtop.
3882      For example, a + b < a + c is not equivalent to b < c for all a
3883      when using modulo arithmetic.
3884
3885      ??? Without a vtop we could still perform the optimization if we check
3886      the initial and final values carefully.  */
3887   if (loop->vtop
3888       && (reg_term = find_common_reg_term (initial_value, final_value)))
3889     {
3890       initial_value = subtract_reg_term (initial_value, reg_term);
3891       final_value = subtract_reg_term (final_value, reg_term);
3892     }
3893
3894   loop_info->initial_equiv_value = initial_value;
3895   loop_info->final_equiv_value = final_value;
3896
3897   /* For EQ comparison loops, we don't have a valid final value.
3898      Check this now so that we won't leave an invalid value if we
3899      return early for any other reason.  */
3900   if (comparison_code == EQ)
3901     loop_info->final_equiv_value = loop_info->final_value = 0;
3902
3903   if (increment == 0)
3904     {
3905       if (loop_dump_stream)
3906         fprintf (loop_dump_stream,
3907                  "Loop iterations: Increment value can't be calculated.\n");
3908       return 0;
3909     }
3910
3911   if (GET_CODE (increment) != CONST_INT)
3912     {
3913       /* If we have a REG, check to see if REG holds a constant value.  */
3914       /* ??? Other RTL, such as (neg (reg)) is possible here, but it isn't
3915          clear if it is worthwhile to try to handle such RTL.  */
3916       if (GET_CODE (increment) == REG || GET_CODE (increment) == SUBREG)
3917         increment = loop_find_equiv_value (loop, increment);
3918
3919       if (GET_CODE (increment) != CONST_INT)
3920         {
3921           if (loop_dump_stream)
3922             {
3923               fprintf (loop_dump_stream,
3924                        "Loop iterations: Increment value not constant ");
3925               print_simple_rtl (loop_dump_stream, increment);
3926               fprintf (loop_dump_stream, ".\n");
3927             }
3928           return 0;
3929         }
3930       loop_info->increment = increment;
3931     }
3932
3933   if (GET_CODE (initial_value) != CONST_INT)
3934     {
3935       if (loop_dump_stream)
3936         {
3937           fprintf (loop_dump_stream,
3938                    "Loop iterations: Initial value not constant ");
3939           print_simple_rtl (loop_dump_stream, initial_value);
3940           fprintf (loop_dump_stream, ".\n");
3941         }
3942       return 0;
3943     }
3944   else if (comparison_code == EQ)
3945     {
3946       if (loop_dump_stream)
3947         fprintf (loop_dump_stream, "Loop iterations: EQ comparison loop.\n");
3948       return 0;
3949     }
3950   else if (GET_CODE (final_value) != CONST_INT)
3951     {
3952       if (loop_dump_stream)
3953         {
3954           fprintf (loop_dump_stream,
3955                    "Loop iterations: Final value not constant ");
3956           print_simple_rtl (loop_dump_stream, final_value);
3957           fprintf (loop_dump_stream, ".\n");
3958         }
3959       return 0;
3960     }
3961
3962   /* Final_larger is 1 if final larger, 0 if they are equal, otherwise -1.  */
3963   if (unsigned_p)
3964     final_larger
3965       = ((unsigned HOST_WIDE_INT) INTVAL (final_value)
3966          > (unsigned HOST_WIDE_INT) INTVAL (initial_value))
3967         - ((unsigned HOST_WIDE_INT) INTVAL (final_value)
3968            < (unsigned HOST_WIDE_INT) INTVAL (initial_value));
3969   else
3970     final_larger = (INTVAL (final_value) > INTVAL (initial_value))
3971       - (INTVAL (final_value) < INTVAL (initial_value));
3972
3973   if (INTVAL (increment) > 0)
3974     increment_dir = 1;
3975   else if (INTVAL (increment) == 0)
3976     increment_dir = 0;
3977   else
3978     increment_dir = -1;
3979
3980   /* There are 27 different cases: compare_dir = -1, 0, 1;
3981      final_larger = -1, 0, 1; increment_dir = -1, 0, 1.
3982      There are 4 normal cases, 4 reverse cases (where the iteration variable
3983      will overflow before the loop exits), 4 infinite loop cases, and 15
3984      immediate exit (0 or 1 iteration depending on loop type) cases.
3985      Only try to optimize the normal cases.  */
3986
3987   /* (compare_dir/final_larger/increment_dir)
3988      Normal cases: (0/-1/-1), (0/1/1), (-1/-1/-1), (1/1/1)
3989      Reverse cases: (0/-1/1), (0/1/-1), (-1/-1/1), (1/1/-1)
3990      Infinite loops: (0/-1/0), (0/1/0), (-1/-1/0), (1/1/0)
3991      Immediate exit: (0/0/X), (-1/0/X), (-1/1/X), (1/0/X), (1/-1/X) */
3992
3993   /* ?? If the meaning of reverse loops (where the iteration variable
3994      will overflow before the loop exits) is undefined, then could
3995      eliminate all of these special checks, and just always assume
3996      the loops are normal/immediate/infinite.  Note that this means
3997      the sign of increment_dir does not have to be known.  Also,
3998      since it does not really hurt if immediate exit loops or infinite loops
3999      are optimized, then that case could be ignored also, and hence all
4000      loops can be optimized.
4001
4002      According to ANSI Spec, the reverse loop case result is undefined,
4003      because the action on overflow is undefined.
4004
4005      See also the special test for NE loops below.  */
4006
4007   if (final_larger == increment_dir && final_larger != 0
4008       && (final_larger == compare_dir || compare_dir == 0))
4009     /* Normal case.  */
4010     ;
4011   else
4012     {
4013       if (loop_dump_stream)
4014         fprintf (loop_dump_stream, "Loop iterations: Not normal loop.\n");
4015       return 0;
4016     }
4017
4018   /* Calculate the number of iterations, final_value is only an approximation,
4019      so correct for that.  Note that abs_diff and n_iterations are
4020      unsigned, because they can be as large as 2^n - 1.  */
4021
4022   inc = INTVAL (increment);
4023   if (inc > 0)
4024     {
4025       abs_diff = INTVAL (final_value) - INTVAL (initial_value);
4026       abs_inc = inc;
4027     }
4028   else if (inc < 0)
4029     {
4030       abs_diff = INTVAL (initial_value) - INTVAL (final_value);
4031       abs_inc = -inc;
4032     }
4033   else
4034     abort ();
4035
4036   /* Given that iteration_var is going to iterate over its own mode,
4037      not HOST_WIDE_INT, disregard higher bits that might have come
4038      into the picture due to sign extension of initial and final
4039      values.  */
4040   abs_diff &= ((unsigned HOST_WIDE_INT) 1
4041                << (GET_MODE_BITSIZE (GET_MODE (iteration_var)) - 1)
4042                << 1) - 1;
4043
4044   /* For NE tests, make sure that the iteration variable won't miss
4045      the final value.  If abs_diff mod abs_incr is not zero, then the
4046      iteration variable will overflow before the loop exits, and we
4047      can not calculate the number of iterations.  */
4048   if (compare_dir == 0 && (abs_diff % abs_inc) != 0)
4049     return 0;
4050
4051   /* Note that the number of iterations could be calculated using
4052      (abs_diff + abs_inc - 1) / abs_inc, provided care was taken to
4053      handle potential overflow of the summation.  */
4054   loop_info->n_iterations = abs_diff / abs_inc + ((abs_diff % abs_inc) != 0);
4055   return loop_info->n_iterations;
4056 }
4057
4058 /* Replace uses of split bivs with their split pseudo register.  This is
4059    for original instructions which remain after loop unrolling without
4060    copying.  */
4061
4062 static rtx
4063 remap_split_bivs (loop, x)
4064      struct loop *loop;
4065      rtx x;
4066 {
4067   struct loop_ivs *ivs = LOOP_IVS (loop);
4068   enum rtx_code code;
4069   int i;
4070   const char *fmt;
4071
4072   if (x == 0)
4073     return x;
4074
4075   code = GET_CODE (x);
4076   switch (code)
4077     {
4078     case SCRATCH:
4079     case PC:
4080     case CC0:
4081     case CONST_INT:
4082     case CONST_DOUBLE:
4083     case CONST:
4084     case SYMBOL_REF:
4085     case LABEL_REF:
4086       return x;
4087
4088     case REG:
4089 #if 0
4090       /* If non-reduced/final-value givs were split, then this would also
4091          have to remap those givs also.  */
4092 #endif
4093       if (REGNO (x) < ivs->n_regs
4094           && REG_IV_TYPE (ivs, REGNO (x)) == BASIC_INDUCT)
4095         return REG_IV_CLASS (ivs, REGNO (x))->biv->src_reg;
4096       break;
4097
4098     default:
4099       break;
4100     }
4101
4102   fmt = GET_RTX_FORMAT (code);
4103   for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
4104     {
4105       if (fmt[i] == 'e')
4106         XEXP (x, i) = remap_split_bivs (loop, XEXP (x, i));
4107       else if (fmt[i] == 'E')
4108         {
4109           int j;
4110           for (j = 0; j < XVECLEN (x, i); j++)
4111             XVECEXP (x, i, j) = remap_split_bivs (loop, XVECEXP (x, i, j));
4112         }
4113     }
4114   return x;
4115 }
4116
4117 /* If FIRST_UID is a set of REGNO, and FIRST_UID dominates LAST_UID (e.g.
4118    FIST_UID is always executed if LAST_UID is), then return 1.  Otherwise
4119    return 0.  COPY_START is where we can start looking for the insns
4120    FIRST_UID and LAST_UID.  COPY_END is where we stop looking for these
4121    insns.
4122
4123    If there is no JUMP_INSN between LOOP_START and FIRST_UID, then FIRST_UID
4124    must dominate LAST_UID.
4125
4126    If there is a CODE_LABEL between FIRST_UID and LAST_UID, then FIRST_UID
4127    may not dominate LAST_UID.
4128
4129    If there is no CODE_LABEL between FIRST_UID and LAST_UID, then FIRST_UID
4130    must dominate LAST_UID.  */
4131
4132 int
4133 set_dominates_use (regno, first_uid, last_uid, copy_start, copy_end)
4134      int regno;
4135      int first_uid;
4136      int last_uid;
4137      rtx copy_start;
4138      rtx copy_end;
4139 {
4140   int passed_jump = 0;
4141   rtx p = NEXT_INSN (copy_start);
4142
4143   while (INSN_UID (p) != first_uid)
4144     {
4145       if (GET_CODE (p) == JUMP_INSN)
4146         passed_jump = 1;
4147       /* Could not find FIRST_UID.  */
4148       if (p == copy_end)
4149         return 0;
4150       p = NEXT_INSN (p);
4151     }
4152
4153   /* Verify that FIRST_UID is an insn that entirely sets REGNO.  */
4154   if (! INSN_P (p) || ! dead_or_set_regno_p (p, regno))
4155     return 0;
4156
4157   /* FIRST_UID is always executed.  */
4158   if (passed_jump == 0)
4159     return 1;
4160
4161   while (INSN_UID (p) != last_uid)
4162     {
4163       /* If we see a CODE_LABEL between FIRST_UID and LAST_UID, then we
4164          can not be sure that FIRST_UID dominates LAST_UID.  */
4165       if (GET_CODE (p) == CODE_LABEL)
4166         return 0;
4167       /* Could not find LAST_UID, but we reached the end of the loop, so
4168          it must be safe.  */
4169       else if (p == copy_end)
4170         return 1;
4171       p = NEXT_INSN (p);
4172     }
4173
4174   /* FIRST_UID is always executed if LAST_UID is executed.  */
4175   return 1;
4176 }
4177
4178 /* This routine is called when the number of iterations for the unrolled
4179    loop is one.   The goal is to identify a loop that begins with an
4180    unconditional branch to the loop continuation note (or a label just after).
4181    In this case, the unconditional branch that starts the loop needs to be
4182    deleted so that we execute the single iteration.  */
4183
4184 static rtx
4185 ujump_to_loop_cont (loop_start, loop_cont)
4186      rtx loop_start;
4187      rtx loop_cont;
4188 {
4189   rtx x, label, label_ref;
4190
4191   /* See if loop start, or the next insn is an unconditional jump.  */
4192   loop_start = next_nonnote_insn (loop_start);
4193
4194   x = pc_set (loop_start);
4195   if (!x)
4196     return NULL_RTX;
4197
4198   label_ref = SET_SRC (x);
4199   if (!label_ref)
4200     return NULL_RTX;
4201
4202   /* Examine insn after loop continuation note.  Return if not a label.  */
4203   label = next_nonnote_insn (loop_cont);
4204   if (label == 0 || GET_CODE (label) != CODE_LABEL)
4205     return NULL_RTX;
4206
4207   /* Return the loop start if the branch label matches the code label.  */
4208   if (CODE_LABEL_NUMBER (label) == CODE_LABEL_NUMBER (XEXP (label_ref, 0)))
4209     return loop_start;
4210   else
4211     return NULL_RTX;
4212 }