gcc/gcse.c

   1 /* Global common subexpression elimination/Partial redundancy elimination
   2    and global constant/copy propagation for GNU compiler.
   3    Copyright (C) 1997, 1998, 1999 Free Software Foundation, Inc.
   4
   5 This file is part of GNU CC.
   6
   7 GNU CC is free software; you can redistribute it and/or modify
   8 it under the terms of the GNU General Public License as published by
   9 the Free Software Foundation; either version 2, or (at your option)
  10 any later version.
  11
  12 GNU CC is distributed in the hope that it will be useful,
  13 but WITHOUT ANY WARRANTY; without even the implied warranty of
  14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  15 GNU General Public License for more details.
  16
  17 You should have received a copy of the GNU General Public License
  18 along with GNU CC; see the file COPYING.  If not, write to
  19 the Free Software Foundation, 59 Temple Place - Suite 330,
  20 Boston, MA 02111-1307, USA.  */
  21
  22 /* TODO
  23    - reordering of memory allocation and freeing to be more space efficient
  24    - do rough calc of how many regs are needed in each block, and a rough
  25      calc of how many regs are available in each class and use that to
  26      throttle back the code in cases where RTX_COST is minimal.
  27    - dead store elimination
  28    - a store to the same address as a load does not kill the load if the
  29      source of the store is also the destination of the load.  Handling this
  30      allows more load motion, particularly out of loops.
  31    - ability to realloc sbitmap vectors would allow one initial computation
  32      of reg_set_in_block with only subsequent additions, rather than
  33      recomputing it for each pass
  34
  35 */
  36
  37 /* References searched while implementing this.
  38
  39    Compilers Principles, Techniques and Tools
  40    Aho, Sethi, Ullman
  41    Addison-Wesley, 1988
  42
  43    Global Optimization by Suppression of Partial Redundancies
  44    E. Morel, C. Renvoise
  45    communications of the acm, Vol. 22, Num. 2, Feb. 1979
  46
  47    A Portable Machine-Independent Global Optimizer - Design and Measurements
  48    Frederick Chow
  49    Stanford Ph.D. thesis, Dec. 1983
  50
  51    A Fast Algorithm for Code Movement Optimization
  52    D.M. Dhamdhere
  53    SIGPLAN Notices, Vol. 23, Num. 10, Oct. 1988
  54
  55    A Solution to a Problem with Morel and Renvoise's
  56    Global Optimization by Suppression of Partial Redundancies
  57    K-H Drechsler, M.P. Stadel
  58    ACM TOPLAS, Vol. 10, Num. 4, Oct. 1988
  59
  60    Practical Adaptation of the Global Optimization
  61    Algorithm of Morel and Renvoise
  62    D.M. Dhamdhere
  63    ACM TOPLAS, Vol. 13, Num. 2. Apr. 1991
  64
  65    Efficiently Computing Static Single Assignment Form and the Control
  66    Dependence Graph
  67    R. Cytron, J. Ferrante, B.K. Rosen, M.N. Wegman, and F.K. Zadeck
  68    ACM TOPLAS, Vol. 13, Num. 4, Oct. 1991
  69
  70    Lazy Code Motion
  71    J. Knoop, O. Ruthing, B. Steffen
  72    ACM SIGPLAN Notices Vol. 27, Num. 7, Jul. 1992, '92 Conference on PLDI
  73
  74    What's In a Region?  Or Computing Control Dependence Regions in Near-Linear
  75    Time for Reducible Flow Control
  76    Thomas Ball
  77    ACM Letters on Programming Languages and Systems,
  78    Vol. 2, Num. 1-4, Mar-Dec 1993
  79
  80    An Efficient Representation for Sparse Sets
  81    Preston Briggs, Linda Torczon
  82    ACM Letters on Programming Languages and Systems,
  83    Vol. 2, Num. 1-4, Mar-Dec 1993
  84
  85    A Variation of Knoop, Ruthing, and Steffen's Lazy Code Motion
  86    K-H Drechsler, M.P. Stadel
  87    ACM SIGPLAN Notices, Vol. 28, Num. 5, May 1993
  88
  89    Partial Dead Code Elimination
  90    J. Knoop, O. Ruthing, B. Steffen
  91    ACM SIGPLAN Notices, Vol. 29, Num. 6, Jun. 1994
  92
  93    Effective Partial Redundancy Elimination
  94    P. Briggs, K.D. Cooper
  95    ACM SIGPLAN Notices, Vol. 29, Num. 6, Jun. 1994
  96
  97    The Program Structure Tree: Computing Control Regions in Linear Time
  98    R. Johnson, D. Pearson, K. Pingali
  99    ACM SIGPLAN Notices, Vol. 29, Num. 6, Jun. 1994
 100
 101    Optimal Code Motion: Theory and Practice
 102    J. Knoop, O. Ruthing, B. Steffen
 103    ACM TOPLAS, Vol. 16, Num. 4, Jul. 1994
 104
 105    The power of assignment motion
 106    J. Knoop, O. Ruthing, B. Steffen
 107    ACM SIGPLAN Notices Vol. 30, Num. 6, Jun. 1995, '95 Conference on PLDI
 108
 109    Global code motion / global value numbering
 110    C. Click
 111    ACM SIGPLAN Notices Vol. 30, Num. 6, Jun. 1995, '95 Conference on PLDI
 112
 113    Value Driven Redundancy Elimination
 114    L.T. Simpson
 115    Rice University Ph.D. thesis, Apr. 1996
 116
 117    Value Numbering
 118    L.T. Simpson
 119    Massively Scalar Compiler Project, Rice University, Sep. 1996
 120
 121    High Performance Compilers for Parallel Computing
 122    Michael Wolfe
 123    Addison-Wesley, 1996
 124
 125    Advanced Compiler Design and Implementation
 126    Steven Muchnick
 127    Morgan Kaufmann, 1997
 128
 129    Building an Optimizing Compiler
 130    Robert Morgan
 131    Digital Press, 1998
 132
 133    People wishing to speed up the code here should read:
 134      Elimination Algorithms for Data Flow Analysis
 135      B.G. Ryder, M.C. Paull
 136      ACM Computing Surveys, Vol. 18, Num. 3, Sep. 1986
 137
 138      How to Analyze Large Programs Efficiently and Informatively
 139      D.M. Dhamdhere, B.K. Rosen, F.K. Zadeck
 140      ACM SIGPLAN Notices Vol. 27, Num. 7, Jul. 1992, '92 Conference on PLDI
 141
 142    People wishing to do something different can find various possibilities
 143    in the above papers and elsewhere.
 144 */
 145
 146 #include "config.h"
 147 #include "system.h"
 148 #include "toplev.h"
 149
 150 #include "rtl.h"
 151 #include "tm_p.h"
 152 #include "regs.h"
 153 #include "hard-reg-set.h"
 154 #include "flags.h"
 155 #include "real.h"
 156 #include "insn-config.h"
 157 #include "recog.h"
 158 #include "basic-block.h"
 159 #include "output.h"
 160 #include "function.h"
 161 #include "expr.h"
 162
 163 #include "obstack.h"
 164 #define obstack_chunk_alloc gmalloc
 165 #define obstack_chunk_free free
 166
 167 /* Maximum number of passes to perform.  */
 168 #define MAX_PASSES 1
 169
 170 /* Propagate flow information through back edges and thus enable PRE's
 171    moving loop invariant calculations out of loops.
 172
 173    Originally this tended to create worse overall code, but several
 174    improvements during the development of PRE seem to have made following
 175    back edges generally a win.
 176
 177    Note much of the loop invariant code motion done here would normally
 178    be done by loop.c, which has more heuristics for when to move invariants
 179    out of loops.  At some point we might need to move some of those
 180    heuristics into gcse.c.  */
 181 #define FOLLOW_BACK_EDGES 1
 182
 183 /* We support GCSE via Partial Redundancy Elimination.  PRE optimizations
 184    are a superset of those done by GCSE.
 185
 186    We perform the following steps:
 187
 188    1) Compute basic block information.
 189
 190    2) Compute table of places where registers are set.
 191
 192    3) Perform copy/constant propagation.
 193
 194    4) Perform global cse.
 195
 196    5) Perform another pass of copy/constant propagation.
 197
 198    Two passes of copy/constant propagation are done because the first one
 199    enables more GCSE and the second one helps to clean up the copies that
 200    GCSE creates.  This is needed more for PRE than for Classic because Classic
 201    GCSE will try to use an existing register containing the common
 202    subexpression rather than create a new one.  This is harder to do for PRE
 203    because of the code motion (which Classic GCSE doesn't do).
 204
 205    Expressions we are interested in GCSE-ing are of the form
 206    (set (pseudo-reg) (expression)).
 207    Function want_to_gcse_p says what these are.
 208
 209    PRE handles moving invariant expressions out of loops (by treating them as
 210    partially redundant).
 211
 212    Eventually it would be nice to replace cse.c/gcse.c with SSA (static single
 213    assignment) based GVN (global value numbering).  L. T. Simpson's paper
 214    (Rice University) on value numbering is a useful reference for this.
 215
 216    **********************
 217
 218    We used to support multiple passes but there are diminishing returns in
 219    doing so.  The first pass usually makes 90% of the changes that are doable.
 220    A second pass can make a few more changes made possible by the first pass.
 221    Experiments show any further passes don't make enough changes to justify
 222    the expense.
 223
 224    A study of spec92 using an unlimited number of passes:
 225    [1 pass] = 1208 substitutions, [2] = 577, [3] = 202, [4] = 192, [5] = 83,
 226    [6] = 34, [7] = 17, [8] = 9, [9] = 4, [10] = 4, [11] = 2,
 227    [12] = 2, [13] = 1, [15] = 1, [16] = 2, [41] = 1
 228
 229    It was found doing copy propagation between each pass enables further
 230    substitutions.
 231
 232    PRE is quite expensive in complicated functions because the DFA can take
 233    awhile to converge.  Hence we only perform one pass.  Macro MAX_PASSES can
 234    be modified if one wants to experiment.
 235
 236    **********************
 237
 238    The steps for PRE are:
 239
 240    1) Build the hash table of expressions we wish to GCSE (expr_hash_table).
 241
 242    2) Perform the data flow analysis for PRE.
 243
 244    3) Delete the redundant instructions
 245
 246    4) Insert the required copies [if any] that make the partially
 247       redundant instructions fully redundant.
 248
 249    5) For other reaching expressions, insert an instruction to copy the value
 250       to a newly created pseudo that will reach the redundant instruction.
 251
 252    The deletion is done first so that when we do insertions we
 253    know which pseudo reg to use.
 254
 255    Various papers have argued that PRE DFA is expensive (O(n^2)) and others
 256    argue it is not.  The number of iterations for the algorithm to converge
 257    is typically 2-4 so I don't view it as that expensive (relatively speaking).
 258
 259    PRE GCSE depends heavily on the second CSE pass to clean up the copies
 260    we create.  To make an expression reach the place where it's redundant,
 261    the result of the expression is copied to a new register, and the redundant
 262    expression is deleted by replacing it with this new register.  Classic GCSE
 263    doesn't have this problem as much as it computes the reaching defs of
 264    each register in each block and thus can try to use an existing register.
 265
 266    **********************
 267
 268    A fair bit of simplicity is created by creating small functions for simple
 269    tasks, even when the function is only called in one place.  This may
 270    measurably slow things down [or may not] by creating more function call
 271    overhead than is necessary.  The source is laid out so that it's trivial
 272    to make the affected functions inline so that one can measure what speed
 273    up, if any, can be achieved, and maybe later when things settle things can
 274    be rearranged.
 275
 276    Help stamp out big monolithic functions!  */
 277 \f
 278 /* GCSE global vars.  */
 279
 280 /* -dG dump file.  */
 281 static FILE *gcse_file;
 282
 283 /* Note whether or not we should run jump optimization after gcse.  We
 284    want to do this for two cases.
 285
 286     * If we changed any jumps via cprop.
 287
 288     * If we added any labels via edge splitting.  */
 289
 290 static int run_jump_opt_after_gcse;
 291
 292 /* Bitmaps are normally not included in debugging dumps.
 293    However it's useful to be able to print them from GDB.
 294    We could create special functions for this, but it's simpler to
 295    just allow passing stderr to the dump_foo fns.  Since stderr can
 296    be a macro, we store a copy here.  */
 297 static FILE *debug_stderr;
 298
 299 /* An obstack for our working variables.  */
 300 static struct obstack gcse_obstack;
 301
 302 /* Non-zero for each mode that supports (set (reg) (reg)).
 303    This is trivially true for integer and floating point values.
 304    It may or may not be true for condition codes.  */
 305 static char can_copy_p[(int) NUM_MACHINE_MODES];
 306
 307 /* Non-zero if can_copy_p has been initialized.  */
 308 static int can_copy_init_p;
 309
 310 struct reg_use {
 311   rtx reg_rtx;
 312 };
 313
 314 /* Hash table of expressions.  */
 315
 316 struct expr
 317 {
 318   /* The expression (SET_SRC for expressions, PATTERN for assignments).  */
 319   rtx expr;
 320   /* Index in the available expression bitmaps.  */
 321   int bitmap_index;
 322   /* Next entry with the same hash.  */
 323   struct expr *next_same_hash;
 324   /* List of anticipatable occurrences in basic blocks in the function.
 325      An "anticipatable occurrence" is one that is the first occurrence in the
 326      basic block, the operands are not modified in the basic block prior
 327      to the occurrence and the output is not used between the start of
 328      the block and the occurrence.  */
 329   struct occr *antic_occr;
 330   /* List of available occurrence in basic blocks in the function.
 331      An "available occurrence" is one that is the last occurrence in the
 332      basic block and the operands are not modified by following statements in
 333      the basic block [including this insn].  */
 334   struct occr *avail_occr;
 335   /* Non-null if the computation is PRE redundant.
 336      The value is the newly created pseudo-reg to record a copy of the
 337      expression in all the places that reach the redundant copy.  */
 338   rtx reaching_reg;
 339 };
 340
 341 /* Occurrence of an expression.
 342    There is one per basic block.  If a pattern appears more than once the
 343    last appearance is used [or first for anticipatable expressions].  */
 344
 345 struct occr
 346 {
 347   /* Next occurrence of this expression.  */
 348   struct occr *next;
 349   /* The insn that computes the expression.  */
 350   rtx insn;
 351   /* Non-zero if this [anticipatable] occurrence has been deleted.  */
 352   char deleted_p;
 353   /* Non-zero if this [available] occurrence has been copied to
 354      reaching_reg.  */
 355   /* ??? This is mutually exclusive with deleted_p, so they could share
 356      the same byte.  */
 357   char copied_p;
 358 };
 359
 360 /* Expression and copy propagation hash tables.
 361    Each hash table is an array of buckets.
 362    ??? It is known that if it were an array of entries, structure elements
 363    `next_same_hash' and `bitmap_index' wouldn't be necessary.  However, it is
 364    not clear whether in the final analysis a sufficient amount of memory would
 365    be saved as the size of the available expression bitmaps would be larger
 366    [one could build a mapping table without holes afterwards though].
 367    Someday I'll perform the computation and figure it out.
 368 */
 369
 370 /* Total size of the expression hash table, in elements.  */
 371 static int expr_hash_table_size;
 372 /* The table itself.
 373    This is an array of `expr_hash_table_size' elements.  */
 374 static struct expr **expr_hash_table;
 375
 376 /* Total size of the copy propagation hash table, in elements.  */
 377 static int set_hash_table_size;
 378 /* The table itself.
 379    This is an array of `set_hash_table_size' elements.  */
 380 static struct expr **set_hash_table;
 381
 382 /* Mapping of uids to cuids.
 383    Only real insns get cuids.  */
 384 static int *uid_cuid;
 385
 386 /* Highest UID in UID_CUID.  */
 387 static int max_uid;
 388
 389 /* Get the cuid of an insn.  */
 390 #define INSN_CUID(INSN) (uid_cuid[INSN_UID (INSN)])
 391
 392 /* Number of cuids.  */
 393 static int max_cuid;
 394
 395 /* Mapping of cuids to insns.  */
 396 static rtx *cuid_insn;
 397
 398 /* Get insn from cuid.  */
 399 #define CUID_INSN(CUID) (cuid_insn[CUID])
 400
 401 /* Maximum register number in function prior to doing gcse + 1.
 402    Registers created during this pass have regno >= max_gcse_regno.
 403    This is named with "gcse" to not collide with global of same name.  */
 404 static int max_gcse_regno;
 405
 406 /* Maximum number of cse-able expressions found.  */
 407 static int n_exprs;
 408 /* Maximum number of assignments for copy propagation found.  */
 409 static int n_sets;
 410
 411 /* Table of registers that are modified.
 412    For each register, each element is a list of places where the pseudo-reg
 413    is set.
 414
 415    For simplicity, GCSE is done on sets of pseudo-regs only.  PRE GCSE only
 416    requires knowledge of which blocks kill which regs [and thus could use
 417    a bitmap instead of the lists `reg_set_table' uses].
 418
 419    `reg_set_table' and could be turned into an array of bitmaps
 420    (num-bbs x num-regs)
 421    [however perhaps it may be useful to keep the data as is].
 422    One advantage of recording things this way is that `reg_set_table' is
 423    fairly sparse with respect to pseudo regs but for hard regs could be
 424    fairly dense [relatively speaking].
 425    And recording sets of pseudo-regs in lists speeds
 426    up functions like compute_transp since in the case of pseudo-regs we only
 427    need to iterate over the number of times a pseudo-reg is set, not over the
 428    number of basic blocks [clearly there is a bit of a slow down in the cases
 429    where a pseudo is set more than once in a block, however it is believed
 430    that the net effect is to speed things up].  This isn't done for hard-regs
 431    because recording call-clobbered hard-regs in `reg_set_table' at each
 432    function call can consume a fair bit of memory, and iterating over hard-regs
 433    stored this way in compute_transp will be more expensive.  */
 434
 435 typedef struct reg_set {
 436   /* The next setting of this register.  */
 437   struct reg_set *next;
 438   /* The insn where it was set.  */
 439   rtx insn;
 440 } reg_set;
 441 static reg_set **reg_set_table;
 442 /* Size of `reg_set_table'.
 443    The table starts out at max_gcse_regno + slop, and is enlarged as
 444    necessary.  */
 445 static int reg_set_table_size;
 446 /* Amount to grow `reg_set_table' by when it's full.  */
 447 #define REG_SET_TABLE_SLOP 100
 448
 449 /* Bitmap containing one bit for each register in the program.
 450    Used when performing GCSE to track which registers have been set since
 451    the start of the basic block.  */
 452 static sbitmap reg_set_bitmap;
 453
 454 /* For each block, a bitmap of registers set in the block.
 455    This is used by expr_killed_p and compute_transp.
 456    It is computed during hash table computation and not by compute_sets
 457    as it includes registers added since the last pass (or between cprop and
 458    gcse) and it's currently not easy to realloc sbitmap vectors.  */
 459 static sbitmap *reg_set_in_block;
 460
 461 /* For each block, non-zero if memory is set in that block.
 462    This is computed during hash table computation and is used by
 463    expr_killed_p and compute_transp.
 464    ??? Handling of memory is very simple, we don't make any attempt
 465    to optimize things (later).
 466    ??? This can be computed by compute_sets since the information
 467    doesn't change.  */
 468 static char *mem_set_in_block;
 469
 470 /* Various variables for statistics gathering.  */
 471
 472 /* Memory used in a pass.
 473    This isn't intended to be absolutely precise.  Its intent is only
 474    to keep an eye on memory usage.  */
 475 static int bytes_used;
 476 /* GCSE substitutions made.  */
 477 static int gcse_subst_count;
 478 /* Number of copy instructions created.  */
 479 static int gcse_create_count;
 480 /* Number of constants propagated.  */
 481 static int const_prop_count;
 482 /* Number of copys propagated.  */
 483 static int copy_prop_count;
 484 \f
 485 /* These variables are used by classic GCSE.
 486    Normally they'd be defined a bit later, but `rd_gen' needs to
 487    be declared sooner.  */
 488
 489 /* A bitmap of all ones for implementing the algorithm for available
 490    expressions and reaching definitions.  */
 491 /* ??? Available expression bitmaps have a different size than reaching
 492    definition bitmaps.  This should be the larger of the two, however, it
 493    is not currently used for reaching definitions.  */
 494 static sbitmap u_bitmap;
 495
 496 /* Each block has a bitmap of each type.
 497    The length of each blocks bitmap is:
 498
 499        max_cuid  - for reaching definitions
 500        n_exprs - for available expressions
 501
 502    Thus we view the bitmaps as 2 dimensional arrays.  i.e.
 503    rd_kill[block_num][cuid_num]
 504    ae_kill[block_num][expr_num]
 505 */
 506
 507 /* For reaching defs */
 508 static sbitmap *rd_kill, *rd_gen, *reaching_defs, *rd_out;
 509
 510 /* for available exprs */
 511 static sbitmap *ae_kill, *ae_gen, *ae_in, *ae_out;
 512
 513 \f
 514 static void compute_can_copy      PROTO ((void));
 515
 516 static char *gmalloc              PROTO ((unsigned int));
 517 static char *grealloc            PROTO ((char *, unsigned int));
 518 static char *gcse_alloc        PROTO ((unsigned long));
 519 static void alloc_gcse_mem          PROTO ((rtx));
 520 static void free_gcse_mem            PROTO ((void));
 521 static void alloc_reg_set_mem    PROTO ((int));
 522 static void free_reg_set_mem      PROTO ((void));
 523 static void record_one_set          PROTO ((int, rtx));
 524 static void record_set_info        PROTO ((rtx, rtx));
 525 static void compute_sets              PROTO ((rtx));
 526
 527 static void hash_scan_insn          PROTO ((rtx, int, int));
 528 static void hash_scan_set            PROTO ((rtx, rtx, int));
 529 static void hash_scan_clobber    PROTO ((rtx, rtx));
 530 static void hash_scan_call          PROTO ((rtx, rtx));
 531 static int want_to_gcse_p            PROTO ((rtx));
 532 static int oprs_unchanged_p        PROTO ((rtx, rtx, int));
 533 static int oprs_anticipatable_p       PROTO ((rtx, rtx));
 534 static int oprs_available_p        PROTO ((rtx, rtx));
 535 static void insert_expr_in_table      PROTO ((rtx, enum machine_mode,
 536                                               rtx, int, int));
 537 static void insert_set_in_table       PROTO ((rtx, rtx));
 538 static unsigned int hash_expr    PROTO ((rtx, enum machine_mode,
 539                                          int *, int));
 540 static unsigned int hash_expr_1       PROTO ((rtx, enum machine_mode, int *));
 541 static unsigned int hash_set      PROTO ((int, int));
 542 static int expr_equiv_p        PROTO ((rtx, rtx));
 543 static void record_last_reg_set_info  PROTO ((rtx, int));
 544 static void record_last_mem_set_info  PROTO ((rtx));
 545 static void record_last_set_info      PROTO ((rtx, rtx));
 546 static void compute_hash_table  PROTO ((int));
 547 static void alloc_set_hash_table      PROTO ((int));
 548 static void free_set_hash_table       PROTO ((void));
 549 static void compute_set_hash_table    PROTO ((void));
 550 static void alloc_expr_hash_table     PROTO ((int));
 551 static void free_expr_hash_table      PROTO ((void));
 552 static void compute_expr_hash_table   PROTO ((void));
 553 static void dump_hash_table        PROTO ((FILE *, const char *, struct expr **,
 554                                            int, int));
 555 static struct expr *lookup_expr       PROTO ((rtx));
 556 static struct expr *lookup_set  PROTO ((int, rtx));
 557 static struct expr *next_set      PROTO ((int, struct expr *));
 558 static void reset_opr_set_tables      PROTO ((void));
 559 static int oprs_not_set_p            PROTO ((rtx, rtx));
 560 static void mark_call            PROTO ((rtx));
 561 static void mark_set              PROTO ((rtx, rtx));
 562 static void mark_clobber              PROTO ((rtx, rtx));
 563 static void mark_oprs_set            PROTO ((rtx));
 564
 565 static void alloc_cprop_mem        PROTO ((int, int));
 566 static void free_cprop_mem          PROTO ((void));
 567 static void compute_transp          PROTO ((rtx, int, sbitmap *, int));
 568 static void compute_transpout       PROTO ((void));
 569 static void compute_local_properties  PROTO ((sbitmap *, sbitmap *,
 570                                               sbitmap *, int));
 571 static void compute_cprop_avinout     PROTO ((void));
 572 static void compute_cprop_data  PROTO ((void));
 573 static void find_used_regs          PROTO ((rtx));
 574 static int try_replace_reg          PROTO ((rtx, rtx, rtx));
 575 static struct expr *find_avail_set    PROTO ((int, rtx));
 576 static int cprop_jump                   PROTO((rtx, rtx, struct reg_use *, rtx));
 577 #ifdef HAVE_cc0
 578 static int cprop_cc0_jump               PROTO((rtx, struct reg_use *, rtx));
 579 #endif
 580 static int cprop_insn            PROTO ((rtx, int));
 581 static int cprop                      PROTO ((int));
 582 static int one_cprop_pass            PROTO ((int, int));
 583
 584 static void alloc_pre_mem            PROTO ((int, int));
 585 static void free_pre_mem              PROTO ((void));
 586 static void compute_pre_data      PROTO ((void));
 587 static int pre_expr_reaches_here_p    PROTO ((int, struct expr *,
 588                                               int, int, char *));
 589 static void insert_insn_end_bb  PROTO ((struct expr *, int, int));
 590 static void pre_insert_copy_insn      PROTO ((struct expr *, rtx));
 591 static void pre_insert_copies    PROTO ((void));
 592 static int pre_delete            PROTO ((void));
 593 static int pre_gcse                PROTO ((void));
 594 static int one_pre_gcse_pass      PROTO ((int));
 595
 596 static void add_label_notes           PROTO ((rtx, rtx));
 597
 598 static void alloc_code_hoist_mem        PROTO ((int, int));
 599 static void free_code_hoist_mem         PROTO ((void));
 600 static void compute_code_hoist_vbeinout PROTO ((void));
 601 static void compute_code_hoist_data     PROTO ((void));
 602 static int hoist_expr_reaches_here_p    PROTO ((int, int, int, char *));
 603 static void hoist_code                  PROTO ((void));
 604 static int one_code_hoisting_pass       PROTO ((void));
 605
 606 static void alloc_rd_mem              PROTO ((int, int));
 607 static void free_rd_mem        PROTO ((void));
 608 static void handle_rd_kill_set  PROTO ((rtx, int, int));
 609 static void compute_kill_rd        PROTO ((void));
 610 static void compute_rd          PROTO ((void));
 611 static void alloc_avail_expr_mem      PROTO ((int, int));
 612 static void free_avail_expr_mem       PROTO ((void));
 613 static void compute_ae_gen          PROTO ((void));
 614 static int expr_killed_p              PROTO ((rtx, int));
 615 static void compute_ae_kill        PROTO ((sbitmap *, sbitmap *));
 616 static int expr_reaches_here_p  PROTO ((struct occr *, struct expr *,
 617                                               int, int, char *));
 618 static rtx computing_insn            PROTO ((struct expr *, rtx));
 619 static int def_reaches_here_p    PROTO ((rtx, rtx));
 620 static int can_disregard_other_sets   PROTO ((struct reg_set **, rtx, int));
 621 static int handle_avail_expr      PROTO ((rtx, struct expr *));
 622 static int classic_gcse        PROTO ((void));
 623 static int one_classic_gcse_pass      PROTO ((int));
 624
 625 static void invalidate_nonnull_info     PROTO ((rtx, rtx));
 626
 627 \f
 628 /* Entry point for global common subexpression elimination.
 629    F is the first instruction in the function.  */
 630
 631 int
 632 gcse_main (f, file)
 633      rtx f;
 634      FILE *file;
 635 {
 636   int changed, pass;
 637   /* Bytes used at start of pass.  */
 638   int initial_bytes_used;
 639   /* Maximum number of bytes used by a pass.  */
 640   int max_pass_bytes;
 641   /* Point to release obstack data from for each pass.  */
 642   char *gcse_obstack_bottom;
 643
 644   /* We do not construct an accurate cfg in functions which call
 645      setjmp, so just punt to be safe.  */
 646   if (current_function_calls_setjmp)
 647     return 0;
 648
 649   /* Assume that we do not need to run jump optimizations after gcse.  */
 650   run_jump_opt_after_gcse = 0;
 651
 652   /* For calling dump_foo fns from gdb.  */
 653   debug_stderr = stderr;
 654   gcse_file = file;
 655
 656   /* Identify the basic block information for this function, including
 657      successors and predecessors.  */
 658   max_gcse_regno = max_reg_num ();
 659   find_basic_blocks (f, max_gcse_regno, file, 1);
 660
 661   if (file)
 662     dump_flow_info (file);
 663
 664   /* Return if there's nothing to do.  */
 665   if (n_basic_blocks <= 1)
 666     {
 667       /* Free storage allocated by find_basic_blocks.  */
 668       free_basic_block_vars (0);
 669       return 0;
 670     }
 671
 672   /* Trying to perform global optimizations on flow graphs which have
 673      a high connectivity will take a long time and is unlikely to be
 674      particularly useful.
 675
 676      In normal circumstances a cfg should have about twice has many edges
 677      as blocks.  But we do not want to punish small functions which have
 678      a couple switch statements.  So we require a relatively large number
 679      of basic blocks and the ratio of edges to blocks to be high.  */
 680   if (n_basic_blocks > 1000 && n_edges / n_basic_blocks >= 20)
 681     {
 682       /* Free storage allocated by find_basic_blocks.  */
 683       free_basic_block_vars (0);
 684       return 0;
 685     }
 686
 687   /* See what modes support reg/reg copy operations.  */
 688   if (! can_copy_init_p)
 689     {
 690       compute_can_copy ();
 691       can_copy_init_p = 1;
 692     }
 693
 694   gcc_obstack_init (&gcse_obstack);
 695   bytes_used = 0;
 696
 697   /* Record where pseudo-registers are set.
 698      This data is kept accurate during each pass.
 699      ??? We could also record hard-reg information here
 700      [since it's unchanging], however it is currently done during
 701      hash table computation.
 702
 703      It may be tempting to compute MEM set information here too, but MEM
 704      sets will be subject to code motion one day and thus we need to compute
 705      information about memory sets when we build the hash tables.  */
 706
 707   alloc_reg_set_mem (max_gcse_regno);
 708   compute_sets (f);
 709
 710   pass = 0;
 711   initial_bytes_used = bytes_used;
 712   max_pass_bytes = 0;
 713   gcse_obstack_bottom = gcse_alloc (1);
 714   changed = 1;
 715   while (changed && pass < MAX_PASSES)
 716     {
 717       changed = 0;
 718       if (file)
 719         fprintf (file, "GCSE pass %d\n\n", pass + 1);
 720
 721       /* Initialize bytes_used to the space for the pred/succ lists,
 722          and the reg_set_table data.  */
 723       bytes_used = initial_bytes_used;
 724
 725       /* Each pass may create new registers, so recalculate each time.  */
 726       max_gcse_regno = max_reg_num ();
 727
 728       alloc_gcse_mem (f);
 729
 730       /* Don't allow constant propagation to modify jumps
 731          during this pass.  */
 732       changed = one_cprop_pass (pass + 1, 0);
 733
 734       if (optimize_size)
 735         changed |= one_classic_gcse_pass (pass + 1);
 736       else
 737         {
 738           changed |= one_pre_gcse_pass (pass + 1);
 739           free_reg_set_mem ();
 740           alloc_reg_set_mem (max_reg_num ());
 741           compute_sets (f);
 742           run_jump_opt_after_gcse = 1;
 743         }
 744
 745       if (max_pass_bytes < bytes_used)
 746         max_pass_bytes = bytes_used;
 747
 748       /* Free up memory, then reallocate for code hoisting.  We can
 749          not re-use the existing allocated memory because the tables
 750          will not have info for the insns or registers created by
 751          partial redundancy elimination.  */
 752       free_gcse_mem ();
 753
 754       /* It does not make sense to run code hoisting unless we optimizing
 755          for code size -- it rarely makes programs faster, and can make
 756          them bigger if we did partial redundancy elimination (when optimizing
 757          for space, we use a classic gcse algorithm instead of partial
 758          redundancy algorithms).  */
 759       if (optimize_size)
 760         {
 761           max_gcse_regno = max_reg_num ();
 762           alloc_gcse_mem (f);
 763           changed |= one_code_hoisting_pass ();
 764           free_gcse_mem ();
 765
 766           if (max_pass_bytes < bytes_used)
 767             max_pass_bytes = bytes_used;
 768         }
 769
 770       if (file)
 771         {
 772           fprintf (file, "\n");
 773           fflush (file);
 774         }
 775       obstack_free (&gcse_obstack, gcse_obstack_bottom);
 776       pass++;
 777     }
 778
 779   /* Do one last pass of copy propagation, including cprop into
 780      conditional jumps.  */
 781
 782   max_gcse_regno = max_reg_num ();
 783   alloc_gcse_mem (f);
 784   /* This time, go ahead and allow cprop to alter jumps.  */
 785   one_cprop_pass (pass + 1, 1);
 786   free_gcse_mem ();
 787
 788   if (file)
 789     {
 790       fprintf (file, "GCSE of %s: %d basic blocks, ",
 791                current_function_name, n_basic_blocks);
 792       fprintf (file, "%d pass%s, %d bytes\n\n",
 793                pass, pass > 1 ? "es" : "", max_pass_bytes);
 794     }
 795
 796   /* Free our obstack.  */
 797   obstack_free (&gcse_obstack, NULL_PTR);
 798   /* Free reg_set_table.  */
 799   free_reg_set_mem ();
 800   /* Free storage used to record predecessor/successor data.  */
 801   free_bb_mem ();
 802   /* Free storage allocated by find_basic_blocks.  */
 803   free_basic_block_vars (0);
 804   return run_jump_opt_after_gcse;
 805 }
 806 \f
 807 /* Misc. utilities.  */
 808
 809 /* Compute which modes support reg/reg copy operations.  */
 810
 811 static void
 812 compute_can_copy ()
 813 {
 814   int i;
 815 #ifndef AVOID_CCMODE_COPIES
 816   rtx reg,insn;
 817 #endif
 818   char *free_point = (char *) oballoc (1);
 819
 820   bzero (can_copy_p, NUM_MACHINE_MODES);
 821
 822   start_sequence ();
 823   for (i = 0; i < NUM_MACHINE_MODES; i++)
 824     {
 825       switch (GET_MODE_CLASS (i))
 826         {
 827         case MODE_CC :
 828 #ifdef AVOID_CCMODE_COPIES
 829           can_copy_p[i] = 0;
 830 #else
 831           reg = gen_rtx_REG ((enum machine_mode) i, LAST_VIRTUAL_REGISTER + 1);
 832           insn = emit_insn (gen_rtx_SET (VOIDmode, reg, reg));
 833           if (recog (PATTERN (insn), insn, NULL_PTR) >= 0)
 834             can_copy_p[i] = 1;
 835 #endif
 836           break;
 837         default :
 838           can_copy_p[i] = 1;
 839           break;
 840         }
 841     }
 842   end_sequence ();
 843
 844   /* Free the objects we just allocated.  */
 845   obfree (free_point);
 846 }
 847 \f
 848 /* Cover function to xmalloc to record bytes allocated.  */
 849
 850 static char *
 851 gmalloc (size)
 852      unsigned int size;
 853 {
 854   bytes_used += size;
 855   return xmalloc (size);
 856 }
 857
 858 /* Cover function to xrealloc.
 859    We don't record the additional size since we don't know it.
 860    It won't affect memory usage stats much anyway.  */
 861
 862 static char *
 863 grealloc (ptr, size)
 864      char *ptr;
 865      unsigned int size;
 866 {
 867   return xrealloc (ptr, size);
 868 }
 869
 870 /* Cover function to obstack_alloc.
 871    We don't need to record the bytes allocated here since
 872    obstack_chunk_alloc is set to gmalloc.  */
 873
 874 static char *
 875 gcse_alloc (size)
 876      unsigned long size;
 877 {
 878   return (char *) obstack_alloc (&gcse_obstack, size);
 879 }
 880
 881 /* Allocate memory for the cuid mapping array,
 882    and reg/memory set tracking tables.
 883
 884    This is called at the start of each pass.  */
 885
 886 static void
 887 alloc_gcse_mem (f)
 888      rtx f;
 889 {
 890   int i,n;
 891   rtx insn;
 892
 893   /* Find the largest UID and create a mapping from UIDs to CUIDs.
 894      CUIDs are like UIDs except they increase monotonically, have no gaps,
 895      and only apply to real insns.  */
 896
 897   max_uid = get_max_uid ();
 898   n = (max_uid + 1) * sizeof (int);
 899   uid_cuid = (int *) gmalloc (n);
 900   bzero ((char *) uid_cuid, n);
 901   for (insn = f, i = 0; insn; insn = NEXT_INSN (insn))
 902     {
 903       if (GET_RTX_CLASS (GET_CODE (insn)) == 'i')
 904         INSN_CUID (insn) = i++;
 905       else
 906         INSN_CUID (insn) = i;
 907     }
 908
 909   /* Create a table mapping cuids to insns.  */
 910
 911   max_cuid = i;
 912   n = (max_cuid + 1) * sizeof (rtx);
 913   cuid_insn = (rtx *) gmalloc (n);
 914   bzero ((char *) cuid_insn, n);
 915   for (insn = f, i = 0; insn; insn = NEXT_INSN (insn))
 916     {
 917       if (GET_RTX_CLASS (GET_CODE (insn)) == 'i')
 918         {
 919           CUID_INSN (i) = insn;
 920           i++;
 921         }
 922     }
 923
 924   /* Allocate vars to track sets of regs.  */
 925
 926   reg_set_bitmap = (sbitmap) sbitmap_alloc (max_gcse_regno);
 927
 928   /* Allocate vars to track sets of regs, memory per block.  */
 929
 930   reg_set_in_block = (sbitmap *) sbitmap_vector_alloc (n_basic_blocks,
 931                                                        max_gcse_regno);
 932   mem_set_in_block = (char *) gmalloc (n_basic_blocks);
 933 }
 934
 935 /* Free memory allocated by alloc_gcse_mem.  */
 936
 937 static void
 938 free_gcse_mem ()
 939 {
 940   free (uid_cuid);
 941   free (cuid_insn);
 942
 943   free (reg_set_bitmap);
 944
 945   free (reg_set_in_block);
 946   free (mem_set_in_block);
 947 }
 948
 949 \f
 950 /* Compute the local properties of each recorded expression.
 951    Local properties are those that are defined by the block, irrespective
 952    of other blocks.
 953
 954    An expression is transparent in a block if its operands are not modified
 955    in the block.
 956
 957    An expression is computed (locally available) in a block if it is computed
 958    at least once and expression would contain the same value if the
 959    computation was moved to the end of the block.
 960
 961    An expression is locally anticipatable in a block if it is computed at
 962    least once and expression would contain the same value if the computation
 963    was moved to the beginning of the block.
 964
 965    We call this routine for cprop, pre and code hoisting.  They all
 966    compute basically the same information and thus can easily share
 967    this code.
 968
 969    TRANSP, COMP, and ANTLOC are destination sbitmaps for recording
 970    local properties.  If NULL, then it is not necessary to compute
 971    or record that particular property.
 972
 973    SETP controls which hash table to look at.  If zero, this routine
 974    looks at the expr hash table; if nonzero this routine looks at
 975    the set hash table.  Additionally, TRANSP is computed as ~TRANSP,
 976    since this is really cprop's ABSALTERED.  */
 977
 978 static void
 979 compute_local_properties (transp, comp, antloc, setp)
 980      sbitmap *transp;
 981      sbitmap *comp;
 982      sbitmap *antloc;
 983      int setp;
 984 {
 985   int i, hash_table_size;
 986   struct expr **hash_table;
 987
 988   /* Initialize any bitmaps that were passed in.  */
 989   if (transp)
 990     {
 991       if (setp)
 992         sbitmap_vector_zero (transp, n_basic_blocks);
 993       else
 994         sbitmap_vector_ones (transp, n_basic_blocks);
 995     }
 996   if (comp)
 997     sbitmap_vector_zero (comp, n_basic_blocks);
 998   if (antloc)
 999     sbitmap_vector_zero (antloc, n_basic_blocks);
1000
1001   /* We use the same code for cprop, pre and hoisting.  For cprop
1002      we care about the set hash table, for pre and hoisting we
1003      care about the expr hash table.  */
1004   hash_table_size = setp ? set_hash_table_size : expr_hash_table_size;
1005   hash_table = setp ? set_hash_table : expr_hash_table;
1006
1007   for (i = 0; i < hash_table_size; i++)
1008     {
1009       struct expr *expr;
1010
1011       for (expr = hash_table[i]; expr != NULL; expr = expr->next_same_hash)
1012         {
1013           struct occr *occr;
1014           int indx = expr->bitmap_index;
1015
1016           /* The expression is transparent in this block if it is not killed.
1017              We start by assuming all are transparent [none are killed], and
1018              then reset the bits for those that are.  */
1019
1020           if (transp)
1021             compute_transp (expr->expr, indx, transp, setp);
1022
1023           /* The occurrences recorded in antic_occr are exactly those that
1024              we want to set to non-zero in ANTLOC.  */
1025
1026           if (antloc)
1027             {
1028               for (occr = expr->antic_occr; occr != NULL; occr = occr->next)
1029                 {
1030                   int bb = BLOCK_NUM (occr->insn);
1031                   SET_BIT (antloc[bb], indx);
1032
1033                   /* While we're scanning the table, this is a good place to
1034                      initialize this.  */
1035                   occr->deleted_p = 0;
1036                 }
1037             }
1038
1039           /* The occurrences recorded in avail_occr are exactly those that
1040              we want to set to non-zero in COMP.  */
1041           if (comp)
1042             {
1043
1044               for (occr = expr->avail_occr; occr != NULL; occr = occr->next)
1045                 {
1046                   int bb = BLOCK_NUM (occr->insn);
1047                   SET_BIT (comp[bb], indx);
1048
1049                   /* While we're scanning the table, this is a good place to
1050                      initialize this.  */
1051                   occr->copied_p = 0;
1052                 }
1053             }
1054
1055           /* While we're scanning the table, this is a good place to
1056              initialize this.  */
1057           expr->reaching_reg = 0;
1058         }
1059     }
1060 }
1061
1062 \f
1063 /* Register set information.
1064
1065    `reg_set_table' records where each register is set or otherwise
1066    modified.  */
1067
1068 static struct obstack reg_set_obstack;
1069
1070 static void
1071 alloc_reg_set_mem (n_regs)
1072      int n_regs;
1073 {
1074   int n;
1075
1076   reg_set_table_size = n_regs + REG_SET_TABLE_SLOP;
1077   n = reg_set_table_size * sizeof (struct reg_set *);
1078   reg_set_table = (struct reg_set **) gmalloc (n);
1079   bzero ((char *) reg_set_table, n);
1080
1081   gcc_obstack_init (&reg_set_obstack);
1082 }
1083
1084 static void
1085 free_reg_set_mem ()
1086 {
1087   free (reg_set_table);
1088   obstack_free (&reg_set_obstack, NULL_PTR);
1089 }
1090
1091 /* Record REGNO in the reg_set table.  */
1092
1093 static void
1094 record_one_set (regno, insn)
1095      int regno;
1096      rtx insn;
1097 {
1098   /* allocate a new reg_set element and link it onto the list */
1099   struct reg_set *new_reg_info, *reg_info_ptr1, *reg_info_ptr2;
1100
1101   /* If the table isn't big enough, enlarge it.  */
1102   if (regno >= reg_set_table_size)
1103     {
1104       int new_size = regno + REG_SET_TABLE_SLOP;
1105       reg_set_table = (struct reg_set **)
1106         grealloc ((char *) reg_set_table,
1107                   new_size * sizeof (struct reg_set *));
1108       bzero ((char *) (reg_set_table + reg_set_table_size),
1109              (new_size - reg_set_table_size) * sizeof (struct reg_set *));
1110       reg_set_table_size = new_size;
1111     }
1112
1113   new_reg_info = (struct reg_set *) obstack_alloc (&reg_set_obstack,
1114                                                    sizeof (struct reg_set));
1115   bytes_used += sizeof (struct reg_set);
1116   new_reg_info->insn = insn;
1117   new_reg_info->next = NULL;
1118   if (reg_set_table[regno] == NULL)
1119     reg_set_table[regno] = new_reg_info;
1120   else
1121     {
1122       reg_info_ptr1 = reg_info_ptr2 = reg_set_table[regno];
1123       /* ??? One could keep a "last" pointer to speed this up.  */
1124       while (reg_info_ptr1 != NULL)
1125         {
1126           reg_info_ptr2 = reg_info_ptr1;
1127           reg_info_ptr1 = reg_info_ptr1->next;
1128         }
1129       reg_info_ptr2->next = new_reg_info;
1130     }
1131 }
1132
1133 /* For communication between next two functions (via note_stores).  */
1134 static rtx record_set_insn;
1135
1136 /* Called from compute_sets via note_stores to handle one
1137    SET or CLOBBER in an insn.  */
1138
1139 static void
1140 record_set_info (dest, setter)
1141      rtx dest, setter ATTRIBUTE_UNUSED;
1142 {
1143   if (GET_CODE (dest) == SUBREG)
1144     dest = SUBREG_REG (dest);
1145
1146   if (GET_CODE (dest) == REG)
1147     {
1148       if (REGNO (dest) >= FIRST_PSEUDO_REGISTER)
1149         record_one_set (REGNO (dest), record_set_insn);
1150     }
1151 }
1152
1153 /* Scan the function and record each set of each pseudo-register.
1154
1155    This is called once, at the start of the gcse pass.
1156    See the comments for `reg_set_table' for further docs.  */
1157
1158 static void
1159 compute_sets (f)
1160      rtx f;
1161 {
1162   rtx insn = f;
1163
1164   while (insn)
1165     {
1166       if (GET_RTX_CLASS (GET_CODE (insn)) == 'i')
1167         {
1168           record_set_insn = insn;
1169           note_stores (PATTERN (insn), record_set_info);
1170         }
1171       insn = NEXT_INSN (insn);
1172     }
1173 }
1174 \f
1175 /* Hash table support.  */
1176
1177 #define NEVER_SET -1
1178
1179 /* For each register, the cuid of the first/last insn in the block to set it,
1180    or -1 if not set.  */
1181 static int *reg_first_set;
1182 static int *reg_last_set;
1183
1184 /* While computing "first/last set" info, this is the CUID of first/last insn
1185    to set memory or -1 if not set.  `mem_last_set' is also used when
1186    performing GCSE to record whether memory has been set since the beginning
1187    of the block.
1188    Note that handling of memory is very simple, we don't make any attempt
1189    to optimize things (later).  */
1190 static int mem_first_set;
1191 static int mem_last_set;
1192
1193 /* Perform a quick check whether X, the source of a set, is something
1194    we want to consider for GCSE.  */
1195
1196 static int
1197 want_to_gcse_p (x)
1198      rtx x;
1199 {
1200   enum rtx_code code = GET_CODE (x);
1201
1202   switch (code)
1203     {
1204     case REG:
1205     case SUBREG:
1206     case CONST_INT:
1207     case CONST_DOUBLE:
1208     case CALL:
1209       return 0;
1210
1211     default:
1212       break;
1213     }
1214
1215   return 1;
1216 }
1217
1218 /* Return non-zero if the operands of expression X are unchanged from the
1219    start of INSN's basic block up to but not including INSN (if AVAIL_P == 0),
1220    or from INSN to the end of INSN's basic block (if AVAIL_P != 0).  */
1221
1222 static int
1223 oprs_unchanged_p (x, insn, avail_p)
1224      rtx x, insn;
1225      int avail_p;
1226 {
1227   int i;
1228   enum rtx_code code;
1229   const char *fmt;
1230
1231   /* repeat is used to turn tail-recursion into iteration.  */
1232  repeat:
1233
1234   if (x == 0)
1235     return 1;
1236
1237   code = GET_CODE (x);
1238   switch (code)
1239     {
1240     case REG:
1241       if (avail_p)
1242         return (reg_last_set[REGNO (x)] == NEVER_SET
1243                 || reg_last_set[REGNO (x)] < INSN_CUID (insn));
1244       else
1245         return (reg_first_set[REGNO (x)] == NEVER_SET
1246                 || reg_first_set[REGNO (x)] >= INSN_CUID (insn));
1247
1248     case MEM:
1249       if (avail_p)
1250         {
1251           if (mem_last_set != NEVER_SET
1252               && mem_last_set >= INSN_CUID (insn))
1253             return 0;
1254         }
1255       else
1256         {
1257           if (mem_first_set != NEVER_SET
1258               && mem_first_set < INSN_CUID (insn))
1259             return 0;
1260         }
1261       x = XEXP (x, 0);
1262       goto repeat;
1263
1264     case PRE_DEC:
1265     case PRE_INC:
1266     case POST_DEC:
1267     case POST_INC:
1268       return 0;
1269
1270     case PC:
1271     case CC0: /*FIXME*/
1272     case CONST:
1273     case CONST_INT:
1274     case CONST_DOUBLE:
1275     case SYMBOL_REF:
1276     case LABEL_REF:
1277     case ADDR_VEC:
1278     case ADDR_DIFF_VEC:
1279       return 1;
1280
1281     default:
1282       break;
1283     }
1284
1285   i = GET_RTX_LENGTH (code) - 1;
1286   fmt = GET_RTX_FORMAT (code);
1287   for (; i >= 0; i--)
1288     {
1289       if (fmt[i] == 'e')
1290         {
1291           rtx tem = XEXP (x, i);
1292
1293           /* If we are about to do the last recursive call
1294              needed at this level, change it into iteration.
1295              This function is called enough to be worth it.  */
1296           if (i == 0)
1297             {
1298               x = tem;
1299               goto repeat;
1300             }
1301           if (! oprs_unchanged_p (tem, insn, avail_p))
1302             return 0;
1303         }
1304       else if (fmt[i] == 'E')
1305         {
1306           int j;
1307           for (j = 0; j < XVECLEN (x, i); j++)
1308             {
1309               if (! oprs_unchanged_p (XVECEXP (x, i, j), insn, avail_p))
1310                 return 0;
1311             }
1312         }
1313     }
1314
1315   return 1;
1316 }
1317
1318 /* Return non-zero if the operands of expression X are unchanged from
1319    the start of INSN's basic block up to but not including INSN.  */
1320
1321 static int
1322 oprs_anticipatable_p (x, insn)
1323      rtx x, insn;
1324 {
1325   return oprs_unchanged_p (x, insn, 0);
1326 }
1327
1328 /* Return non-zero if the operands of expression X are unchanged from
1329    INSN to the end of INSN's basic block.  */
1330
1331 static int
1332 oprs_available_p (x, insn)
1333      rtx x, insn;
1334 {
1335   return oprs_unchanged_p (x, insn, 1);
1336 }
1337
1338 /* Hash expression X.
1339    MODE is only used if X is a CONST_INT.
1340    A boolean indicating if a volatile operand is found or if the expression
1341    contains something we don't want to insert in the table is stored in
1342    DO_NOT_RECORD_P.
1343
1344    ??? One might want to merge this with canon_hash.  Later.  */
1345
1346 static unsigned int
1347 hash_expr (x, mode, do_not_record_p, hash_table_size)
1348      rtx x;
1349      enum machine_mode mode;
1350      int *do_not_record_p;
1351      int hash_table_size;
1352 {
1353   unsigned int hash;
1354
1355   *do_not_record_p = 0;
1356
1357   hash = hash_expr_1 (x, mode, do_not_record_p);
1358   return hash % hash_table_size;
1359 }
1360
1361 /* Subroutine of hash_expr to do the actual work.  */
1362
1363 static unsigned int
1364 hash_expr_1 (x, mode, do_not_record_p)
1365      rtx x;
1366      enum machine_mode mode;
1367      int *do_not_record_p;
1368 {
1369   int i, j;
1370   unsigned hash = 0;
1371   enum rtx_code code;
1372   const char *fmt;
1373
1374   /* repeat is used to turn tail-recursion into iteration.  */
1375  repeat:
1376
1377   if (x == 0)
1378     return hash;
1379
1380   code = GET_CODE (x);
1381   switch (code)
1382     {
1383     case REG:
1384       {
1385         register int regno = REGNO (x);
1386         hash += ((unsigned) REG << 7) + regno;
1387         return hash;
1388       }
1389
1390     case CONST_INT:
1391       {
1392         unsigned HOST_WIDE_INT tem = INTVAL (x);
1393         hash += ((unsigned) CONST_INT << 7) + (unsigned) mode + tem;
1394         return hash;
1395       }
1396
1397     case CONST_DOUBLE:
1398       /* This is like the general case, except that it only counts
1399          the integers representing the constant.  */
1400       hash += (unsigned) code + (unsigned) GET_MODE (x);
1401       if (GET_MODE (x) != VOIDmode)
1402         for (i = 2; i < GET_RTX_LENGTH (CONST_DOUBLE); i++)
1403           {
1404             unsigned tem = XWINT (x, i);
1405             hash += tem;
1406           }
1407       else
1408         hash += ((unsigned) CONST_DOUBLE_LOW (x)
1409                  + (unsigned) CONST_DOUBLE_HIGH (x));
1410       return hash;
1411
1412       /* Assume there is only one rtx object for any given label.  */
1413     case LABEL_REF:
1414       /* We don't hash on the address of the CODE_LABEL to avoid bootstrap
1415          differences and differences between each stage's debugging dumps.  */
1416       hash += ((unsigned) LABEL_REF << 7) + CODE_LABEL_NUMBER (XEXP (x, 0));
1417       return hash;
1418
1419     case SYMBOL_REF:
1420       {
1421         /* Don't hash on the symbol's address to avoid bootstrap differences.
1422            Different hash values may cause expressions to be recorded in
1423            different orders and thus different registers to be used in the
1424            final assembler.  This also avoids differences in the dump files
1425            between various stages.  */
1426         unsigned int h = 0;
1427         unsigned char *p = (unsigned char *) XSTR (x, 0);
1428         while (*p)
1429           h += (h << 7) + *p++; /* ??? revisit */
1430         hash += ((unsigned) SYMBOL_REF << 7) + h;
1431         return hash;
1432       }
1433
1434     case MEM:
1435       if (MEM_VOLATILE_P (x))
1436         {
1437           *do_not_record_p = 1;
1438           return 0;
1439         }
1440       hash += (unsigned) MEM;
1441       hash += MEM_ALIAS_SET (x);
1442       x = XEXP (x, 0);
1443       goto repeat;
1444
1445     case PRE_DEC:
1446     case PRE_INC:
1447     case POST_DEC:
1448     case POST_INC:
1449     case PC:
1450     case CC0:
1451     case CALL:
1452     case UNSPEC_VOLATILE:
1453       *do_not_record_p = 1;
1454       return 0;
1455
1456     case ASM_OPERANDS:
1457       if (MEM_VOLATILE_P (x))
1458         {
1459           *do_not_record_p = 1;
1460           return 0;
1461         }
1462
1463     default:
1464       break;
1465     }
1466
1467   i = GET_RTX_LENGTH (code) - 1;
1468   hash += (unsigned) code + (unsigned) GET_MODE (x);
1469   fmt = GET_RTX_FORMAT (code);
1470   for (; i >= 0; i--)
1471     {
1472       if (fmt[i] == 'e')
1473         {
1474           rtx tem = XEXP (x, i);
1475
1476           /* If we are about to do the last recursive call
1477              needed at this level, change it into iteration.
1478              This function is called enough to be worth it.  */
1479           if (i == 0)
1480             {
1481               x = tem;
1482               goto repeat;
1483             }
1484           hash += hash_expr_1 (tem, 0, do_not_record_p);
1485           if (*do_not_record_p)
1486             return 0;
1487         }
1488       else if (fmt[i] == 'E')
1489         for (j = 0; j < XVECLEN (x, i); j++)
1490           {
1491             hash += hash_expr_1 (XVECEXP (x, i, j), 0, do_not_record_p);
1492             if (*do_not_record_p)
1493               return 0;
1494           }
1495       else if (fmt[i] == 's')
1496         {
1497           register unsigned char *p = (unsigned char *) XSTR (x, i);
1498           if (p)
1499             while (*p)
1500               hash += *p++;
1501         }
1502       else if (fmt[i] == 'i')
1503         {
1504           register unsigned tem = XINT (x, i);
1505           hash += tem;
1506         }
1507       else
1508         abort ();
1509     }
1510
1511   return hash;
1512 }
1513
1514 /* Hash a set of register REGNO.
1515
1516    Sets are hashed on the register that is set.
1517    This simplifies the PRE copy propagation code.
1518
1519    ??? May need to make things more elaborate.  Later, as necessary.  */
1520
1521 static unsigned int
1522 hash_set (regno, hash_table_size)
1523      int regno;
1524      int hash_table_size;
1525 {
1526   unsigned int hash;
1527
1528   hash = regno;
1529   return hash % hash_table_size;
1530 }
1531
1532 /* Return non-zero if exp1 is equivalent to exp2.
1533    ??? Borrowed from cse.c.  Might want to remerge with cse.c.  Later.  */
1534
1535 static int
1536 expr_equiv_p (x, y)
1537      rtx x, y;
1538 {
1539   register int i, j;
1540   register enum rtx_code code;
1541   register const char *fmt;
1542
1543   if (x == y)
1544     return 1;
1545   if (x == 0 || y == 0)
1546     return x == y;
1547
1548   code = GET_CODE (x);
1549   if (code != GET_CODE (y))
1550     return 0;
1551
1552   /* (MULT:SI x y) and (MULT:HI x y) are NOT equivalent.  */
1553   if (GET_MODE (x) != GET_MODE (y))
1554     return 0;
1555
1556   switch (code)
1557     {
1558     case PC:
1559     case CC0:
1560       return x == y;
1561
1562     case CONST_INT:
1563       return INTVAL (x) == INTVAL (y);
1564
1565     case LABEL_REF:
1566       return XEXP (x, 0) == XEXP (y, 0);
1567
1568     case SYMBOL_REF:
1569       return XSTR (x, 0) == XSTR (y, 0);
1570
1571     case REG:
1572       return REGNO (x) == REGNO (y);
1573
1574     case MEM:
1575       /* Can't merge two expressions in different alias sets, since we can
1576          decide that the expression is transparent in a block when it isn't,
1577          due to it being set with the different alias set.  */
1578       if (MEM_ALIAS_SET (x) != MEM_ALIAS_SET (y))
1579         return 0;
1580       break;
1581
1582     /*  For commutative operations, check both orders.  */
1583     case PLUS:
1584     case MULT:
1585     case AND:
1586     case IOR:
1587     case XOR:
1588     case NE:
1589     case EQ:
1590       return ((expr_equiv_p (XEXP (x, 0), XEXP (y, 0))
1591                && expr_equiv_p (XEXP (x, 1), XEXP (y, 1)))
1592               || (expr_equiv_p (XEXP (x, 0), XEXP (y, 1))
1593                   && expr_equiv_p (XEXP (x, 1), XEXP (y, 0))));
1594
1595     default:
1596       break;
1597     }
1598
1599   /* Compare the elements.  If any pair of corresponding elements
1600      fail to match, return 0 for the whole thing.  */
1601
1602   fmt = GET_RTX_FORMAT (code);
1603   for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
1604     {
1605       switch (fmt[i])
1606         {
1607         case 'e':
1608           if (! expr_equiv_p (XEXP (x, i), XEXP (y, i)))
1609             return 0;
1610           break;
1611
1612         case 'E':
1613           if (XVECLEN (x, i) != XVECLEN (y, i))
1614             return 0;
1615           for (j = 0; j < XVECLEN (x, i); j++)
1616             if (! expr_equiv_p (XVECEXP (x, i, j), XVECEXP (y, i, j)))
1617               return 0;
1618           break;
1619
1620         case 's':
1621           if (strcmp (XSTR (x, i), XSTR (y, i)))
1622             return 0;
1623           break;
1624
1625         case 'i':
1626           if (XINT (x, i) != XINT (y, i))
1627             return 0;
1628           break;
1629
1630         case 'w':
1631           if (XWINT (x, i) != XWINT (y, i))
1632             return 0;
1633         break;
1634
1635         case '0':
1636           break;
1637
1638         default:
1639           abort ();
1640         }
1641       }
1642
1643   return 1;
1644 }
1645
1646 /* Insert expression X in INSN in the hash table.
1647    If it is already present, record it as the last occurrence in INSN's
1648    basic block.
1649
1650    MODE is the mode of the value X is being stored into.
1651    It is only used if X is a CONST_INT.
1652
1653    ANTIC_P is non-zero if X is an anticipatable expression.
1654    AVAIL_P is non-zero if X is an available expression.  */
1655
1656 static void
1657 insert_expr_in_table (x, mode, insn, antic_p, avail_p)
1658      rtx x;
1659      enum machine_mode mode;
1660      rtx insn;
1661      int antic_p, avail_p;
1662 {
1663   int found, do_not_record_p;
1664   unsigned int hash;
1665   struct expr *cur_expr, *last_expr = NULL;
1666   struct occr *antic_occr, *avail_occr;
1667   struct occr *last_occr = NULL;
1668
1669   hash = hash_expr (x, mode, &do_not_record_p, expr_hash_table_size);
1670
1671   /* Do not insert expression in table if it contains volatile operands,
1672      or if hash_expr determines the expression is something we don't want
1673      to or can't handle.  */
1674   if (do_not_record_p)
1675     return;
1676
1677   cur_expr = expr_hash_table[hash];
1678   found = 0;
1679
1680   while (cur_expr && ! (found = expr_equiv_p (cur_expr->expr, x)))
1681     {
1682       /* If the expression isn't found, save a pointer to the end of
1683          the list.  */
1684       last_expr = cur_expr;
1685       cur_expr = cur_expr->next_same_hash;
1686     }
1687
1688   if (! found)
1689     {
1690       cur_expr = (struct expr *) gcse_alloc (sizeof (struct expr));
1691       bytes_used += sizeof (struct expr);
1692       if (expr_hash_table[hash] == NULL)
1693         {
1694           /* This is the first pattern that hashed to this index.  */
1695           expr_hash_table[hash] = cur_expr;
1696         }
1697       else
1698         {
1699           /* Add EXPR to end of this hash chain.  */
1700           last_expr->next_same_hash = cur_expr;
1701         }
1702       /* Set the fields of the expr element.  */
1703       cur_expr->expr = x;
1704       cur_expr->bitmap_index = n_exprs++;
1705       cur_expr->next_same_hash = NULL;
1706       cur_expr->antic_occr = NULL;
1707       cur_expr->avail_occr = NULL;
1708     }
1709
1710   /* Now record the occurrence(s).  */
1711
1712   if (antic_p)
1713     {
1714       antic_occr = cur_expr->antic_occr;
1715
1716       /* Search for another occurrence in the same basic block.  */
1717       while (antic_occr && BLOCK_NUM (antic_occr->insn) != BLOCK_NUM (insn))
1718         {
1719           /* If an occurrence isn't found, save a pointer to the end of
1720              the list.  */
1721           last_occr = antic_occr;
1722           antic_occr = antic_occr->next;
1723         }
1724
1725       if (antic_occr)
1726         {
1727           /* Found another instance of the expression in the same basic block.
1728              Prefer the currently recorded one.  We want the first one in the
1729              block and the block is scanned from start to end.  */
1730           ; /* nothing to do */
1731         }
1732       else
1733         {
1734           /* First occurrence of this expression in this basic block.  */
1735           antic_occr = (struct occr *) gcse_alloc (sizeof (struct occr));
1736           bytes_used += sizeof (struct occr);
1737           /* First occurrence of this expression in any block?  */
1738           if (cur_expr->antic_occr == NULL)
1739             cur_expr->antic_occr = antic_occr;
1740           else
1741             last_occr->next = antic_occr;
1742           antic_occr->insn = insn;
1743           antic_occr->next = NULL;
1744         }
1745     }
1746
1747   if (avail_p)
1748     {
1749       avail_occr = cur_expr->avail_occr;
1750
1751       /* Search for another occurrence in the same basic block.  */
1752       while (avail_occr && BLOCK_NUM (avail_occr->insn) != BLOCK_NUM (insn))
1753         {
1754           /* If an occurrence isn't found, save a pointer to the end of
1755              the list.  */
1756           last_occr = avail_occr;
1757           avail_occr = avail_occr->next;
1758         }
1759
1760       if (avail_occr)
1761         {
1762           /* Found another instance of the expression in the same basic block.
1763              Prefer this occurrence to the currently recorded one.  We want
1764              the last one in the block and the block is scanned from start
1765              to end.  */
1766           avail_occr->insn = insn;
1767         }
1768       else
1769         {
1770           /* First occurrence of this expression in this basic block.  */
1771           avail_occr = (struct occr *) gcse_alloc (sizeof (struct occr));
1772           bytes_used += sizeof (struct occr);
1773           /* First occurrence of this expression in any block?  */
1774           if (cur_expr->avail_occr == NULL)
1775             cur_expr->avail_occr = avail_occr;
1776           else
1777             last_occr->next = avail_occr;
1778           avail_occr->insn = insn;
1779           avail_occr->next = NULL;
1780         }
1781     }
1782 }
1783
1784 /* Insert pattern X in INSN in the hash table.
1785    X is a SET of a reg to either another reg or a constant.
1786    If it is already present, record it as the last occurrence in INSN's
1787    basic block.  */
1788
1789 static void
1790 insert_set_in_table (x, insn)
1791      rtx x;
1792      rtx insn;
1793 {
1794   int found;
1795   unsigned int hash;
1796   struct expr *cur_expr, *last_expr = NULL;
1797   struct occr *cur_occr, *last_occr = NULL;
1798
1799   if (GET_CODE (x) != SET
1800       || GET_CODE (SET_DEST (x)) != REG)
1801     abort ();
1802
1803   hash = hash_set (REGNO (SET_DEST (x)), set_hash_table_size);
1804
1805   cur_expr = set_hash_table[hash];
1806   found = 0;
1807
1808   while (cur_expr && ! (found = expr_equiv_p (cur_expr->expr, x)))
1809     {
1810       /* If the expression isn't found, save a pointer to the end of
1811          the list.  */
1812       last_expr = cur_expr;
1813       cur_expr = cur_expr->next_same_hash;
1814     }
1815
1816   if (! found)
1817     {
1818       cur_expr = (struct expr *) gcse_alloc (sizeof (struct expr));
1819       bytes_used += sizeof (struct expr);
1820       if (set_hash_table[hash] == NULL)
1821         {
1822           /* This is the first pattern that hashed to this index.  */
1823           set_hash_table[hash] = cur_expr;
1824         }
1825       else
1826         {
1827           /* Add EXPR to end of this hash chain.  */
1828           last_expr->next_same_hash = cur_expr;
1829         }
1830       /* Set the fields of the expr element.
1831          We must copy X because it can be modified when copy propagation is
1832          performed on its operands.  */
1833       /* ??? Should this go in a different obstack?  */
1834       cur_expr->expr = copy_rtx (x);
1835       cur_expr->bitmap_index = n_sets++;
1836       cur_expr->next_same_hash = NULL;
1837       cur_expr->antic_occr = NULL;
1838       cur_expr->avail_occr = NULL;
1839     }
1840
1841   /* Now record the occurrence.  */
1842
1843   cur_occr = cur_expr->avail_occr;
1844
1845   /* Search for another occurrence in the same basic block.  */
1846   while (cur_occr && BLOCK_NUM (cur_occr->insn) != BLOCK_NUM (insn))
1847     {
1848       /* If an occurrence isn't found, save a pointer to the end of
1849          the list.  */
1850       last_occr = cur_occr;
1851       cur_occr = cur_occr->next;
1852     }
1853
1854   if (cur_occr)
1855     {
1856       /* Found another instance of the expression in the same basic block.
1857          Prefer this occurrence to the currently recorded one.  We want
1858          the last one in the block and the block is scanned from start
1859          to end.  */
1860       cur_occr->insn = insn;
1861     }
1862   else
1863     {
1864       /* First occurrence of this expression in this basic block.  */
1865       cur_occr = (struct occr *) gcse_alloc (sizeof (struct occr));
1866       bytes_used += sizeof (struct occr);
1867       /* First occurrence of this expression in any block?  */
1868       if (cur_expr->avail_occr == NULL)
1869         cur_expr->avail_occr = cur_occr;
1870       else
1871         last_occr->next = cur_occr;
1872       cur_occr->insn = insn;
1873       cur_occr->next = NULL;
1874     }
1875 }
1876
1877 /* Scan pattern PAT of INSN and add an entry to the hash table.
1878    If SET_P is non-zero, this is for the assignment hash table,
1879    otherwise it is for the expression hash table.  */
1880
1881 static void
1882 hash_scan_set (pat, insn, set_p)
1883      rtx pat, insn;
1884      int set_p;
1885 {
1886   rtx src = SET_SRC (pat);
1887   rtx dest = SET_DEST (pat);
1888
1889   if (GET_CODE (src) == CALL)
1890     hash_scan_call (src, insn);
1891
1892   if (GET_CODE (dest) == REG)
1893     {
1894       int regno = REGNO (dest);
1895       rtx tmp;
1896
1897       /* Only record sets of pseudo-regs in the hash table.  */
1898       if (! set_p
1899           && regno >= FIRST_PSEUDO_REGISTER
1900           /* Don't GCSE something if we can't do a reg/reg copy.  */
1901           && can_copy_p [GET_MODE (dest)]
1902           /* Is SET_SRC something we want to gcse?  */
1903           && want_to_gcse_p (src))
1904         {
1905           /* An expression is not anticipatable if its operands are
1906              modified before this insn.  */
1907           int antic_p = oprs_anticipatable_p (src, insn);
1908           /* An expression is not available if its operands are
1909              subsequently modified, including this insn.  */
1910           int avail_p = oprs_available_p (src, insn);
1911           insert_expr_in_table (src, GET_MODE (dest), insn, antic_p, avail_p);
1912         }
1913       /* Record sets for constant/copy propagation.  */
1914       else if (set_p
1915                && regno >= FIRST_PSEUDO_REGISTER
1916                && ((GET_CODE (src) == REG
1917                     && REGNO (src) >= FIRST_PSEUDO_REGISTER
1918                     && can_copy_p [GET_MODE (dest)])
1919                    || GET_CODE (src) == CONST_INT
1920                    || GET_CODE (src) == SYMBOL_REF
1921                    || GET_CODE (src) == CONST_DOUBLE)
1922                /* A copy is not available if its src or dest is subsequently
1923                   modified.  Here we want to search from INSN+1 on, but
1924                   oprs_available_p searches from INSN on.  */
1925                && (insn == BLOCK_END (BLOCK_NUM (insn))
1926                    || ((tmp = next_nonnote_insn (insn)) != NULL_RTX
1927                        && oprs_available_p (pat, tmp))))
1928         insert_set_in_table (pat, insn);
1929     }
1930 }
1931
1932 static void
1933 hash_scan_clobber (x, insn)
1934      rtx x ATTRIBUTE_UNUSED, insn ATTRIBUTE_UNUSED;
1935 {
1936   /* Currently nothing to do.  */
1937 }
1938
1939 static void
1940 hash_scan_call (x, insn)
1941      rtx x ATTRIBUTE_UNUSED, insn ATTRIBUTE_UNUSED;
1942 {
1943   /* Currently nothing to do.  */
1944 }
1945
1946 /* Process INSN and add hash table entries as appropriate.
1947
1948    Only available expressions that set a single pseudo-reg are recorded.
1949
1950    Single sets in a PARALLEL could be handled, but it's an extra complication
1951    that isn't dealt with right now.  The trick is handling the CLOBBERs that
1952    are also in the PARALLEL.  Later.
1953
1954    If SET_P is non-zero, this is for the assignment hash table,
1955    otherwise it is for the expression hash table.
1956    If IN_LIBCALL_BLOCK nonzero, we are in a libcall block, and should
1957    not record any expressions.  */
1958
1959 static void
1960 hash_scan_insn (insn, set_p, in_libcall_block)
1961      rtx insn;
1962      int set_p;
1963      int in_libcall_block;
1964 {
1965   rtx pat = PATTERN (insn);
1966
1967   /* Pick out the sets of INSN and for other forms of instructions record
1968      what's been modified.  */
1969
1970   if (GET_CODE (pat) == SET && ! in_libcall_block)
1971     {
1972       /* Ignore obvious no-ops.  */
1973       if (SET_SRC (pat) != SET_DEST (pat))
1974         hash_scan_set (pat, insn, set_p);
1975     }
1976   else if (GET_CODE (pat) == PARALLEL)
1977     {
1978       int i;
1979
1980       for (i = 0; i < XVECLEN (pat, 0); i++)
1981         {
1982           rtx x = XVECEXP (pat, 0, i);
1983
1984           if (GET_CODE (x) == SET)
1985             {
1986               if (GET_CODE (SET_SRC (x)) == CALL)
1987                 hash_scan_call (SET_SRC (x), insn);
1988             }
1989           else if (GET_CODE (x) == CLOBBER)
1990             hash_scan_clobber (x, insn);
1991           else if (GET_CODE (x) == CALL)
1992             hash_scan_call (x, insn);
1993         }
1994     }
1995   else if (GET_CODE (pat) == CLOBBER)
1996     hash_scan_clobber (pat, insn);
1997   else if (GET_CODE (pat) == CALL)
1998     hash_scan_call (pat, insn);
1999 }
2000
2001 static void
2002 dump_hash_table (file, name, table, table_size, total_size)
2003      FILE *file;
2004      const char *name;
2005      struct expr **table;
2006      int table_size, total_size;
2007 {
2008   int i;
2009   /* Flattened out table, so it's printed in proper order.  */
2010   struct expr **flat_table = (struct expr **) alloca (total_size * sizeof (struct expr *));
2011   unsigned int *hash_val = (unsigned int *) alloca (total_size * sizeof (unsigned int));
2012
2013   bzero ((char *) flat_table, total_size * sizeof (struct expr *));
2014   for (i = 0; i < table_size; i++)
2015     {
2016       struct expr *expr;
2017
2018       for (expr = table[i]; expr != NULL; expr = expr->next_same_hash)
2019         {
2020           flat_table[expr->bitmap_index] = expr;
2021           hash_val[expr->bitmap_index] = i;
2022         }
2023     }
2024
2025   fprintf (file, "%s hash table (%d buckets, %d entries)\n",
2026            name, table_size, total_size);
2027
2028   for (i = 0; i < total_size; i++)
2029     {
2030       struct expr *expr = flat_table[i];
2031
2032       fprintf (file, "Index %d (hash value %d)\n  ",
2033                expr->bitmap_index, hash_val[i]);
2034       print_rtl (file, expr->expr);
2035       fprintf (file, "\n");
2036     }
2037
2038   fprintf (file, "\n");
2039 }
2040
2041 /* Record register first/last/block set information for REGNO in INSN.
2042    reg_first_set records the first place in the block where the register
2043    is set and is used to compute "anticipatability".
2044    reg_last_set records the last place in the block where the register
2045    is set and is used to compute "availability".
2046    reg_set_in_block records whether the register is set in the block
2047    and is used to compute "transparency".  */
2048
2049 static void
2050 record_last_reg_set_info (insn, regno)
2051      rtx insn;
2052      int regno;
2053 {
2054   if (reg_first_set[regno] == NEVER_SET)
2055     reg_first_set[regno] = INSN_CUID (insn);
2056   reg_last_set[regno] = INSN_CUID (insn);
2057   SET_BIT (reg_set_in_block[BLOCK_NUM (insn)], regno);
2058 }
2059
2060 /* Record memory first/last/block set information for INSN.  */
2061
2062 static void
2063 record_last_mem_set_info (insn)
2064      rtx insn;
2065 {
2066   if (mem_first_set == NEVER_SET)
2067     mem_first_set = INSN_CUID (insn);
2068   mem_last_set = INSN_CUID (insn);
2069   mem_set_in_block[BLOCK_NUM (insn)] = 1;
2070 }
2071
2072 /* Used for communicating between next two routines.  */
2073 static rtx last_set_insn;
2074
2075 /* Called from compute_hash_table via note_stores to handle one
2076    SET or CLOBBER in an insn.  */
2077
2078 static void
2079 record_last_set_info (dest, setter)
2080      rtx dest, setter ATTRIBUTE_UNUSED;
2081 {
2082   if (GET_CODE (dest) == SUBREG)
2083     dest = SUBREG_REG (dest);
2084
2085   if (GET_CODE (dest) == REG)
2086     record_last_reg_set_info (last_set_insn, REGNO (dest));
2087   else if (GET_CODE (dest) == MEM
2088            /* Ignore pushes, they clobber nothing.  */
2089            && ! push_operand (dest, GET_MODE (dest)))
2090     record_last_mem_set_info (last_set_insn);
2091 }
2092
2093 /* Top level function to create an expression or assignment hash table.
2094
2095    Expression entries are placed in the hash table if
2096    - they are of the form (set (pseudo-reg) src),
2097    - src is something we want to perform GCSE on,
2098    - none of the operands are subsequently modified in the block
2099
2100    Assignment entries are placed in the hash table if
2101    - they are of the form (set (pseudo-reg) src),
2102    - src is something we want to perform const/copy propagation on,
2103    - none of the operands or target are subsequently modified in the block
2104    Currently src must be a pseudo-reg or a const_int.
2105
2106    F is the first insn.
2107    SET_P is non-zero for computing the assignment hash table.  */
2108
2109 static void
2110 compute_hash_table (set_p)
2111      int set_p;
2112 {
2113   int bb;
2114
2115   /* While we compute the hash table we also compute a bit array of which
2116      registers are set in which blocks.
2117      We also compute which blocks set memory, in the absence of aliasing
2118      support [which is TODO].
2119      ??? This isn't needed during const/copy propagation, but it's cheap to
2120      compute.  Later.  */
2121   sbitmap_vector_zero (reg_set_in_block, n_basic_blocks);
2122   bzero ((char *) mem_set_in_block, n_basic_blocks);
2123
2124   /* Some working arrays used to track first and last set in each block.  */
2125   /* ??? One could use alloca here, but at some size a threshold is crossed
2126      beyond which one should use malloc.  Are we at that threshold here?  */
2127   reg_first_set = (int *) gmalloc (max_gcse_regno * sizeof (int));
2128   reg_last_set = (int *) gmalloc (max_gcse_regno * sizeof (int));
2129
2130   for (bb = 0; bb < n_basic_blocks; bb++)
2131     {
2132       rtx insn;
2133       int regno;
2134       int in_libcall_block;
2135       int i;
2136
2137       /* First pass over the instructions records information used to
2138          determine when registers and memory are first and last set.
2139          ??? The mem_set_in_block and hard-reg reg_set_in_block computation
2140          could be moved to compute_sets since they currently don't change.  */
2141
2142       for (i = 0; i < max_gcse_regno; i++)
2143         reg_first_set[i] = reg_last_set[i] = NEVER_SET;
2144       mem_first_set = NEVER_SET;
2145       mem_last_set = NEVER_SET;
2146
2147       for (insn = BLOCK_HEAD (bb);
2148            insn && insn != NEXT_INSN (BLOCK_END (bb));
2149            insn = NEXT_INSN (insn))
2150         {
2151 #ifdef NON_SAVING_SETJMP
2152           if (NON_SAVING_SETJMP && GET_CODE (insn) == NOTE
2153               && NOTE_LINE_NUMBER (insn) == NOTE_INSN_SETJMP)
2154             {
2155               for (regno = 0; regno < FIRST_PSEUDO_REGISTER; regno++)
2156                 record_last_reg_set_info (insn, regno);
2157               continue;
2158             }
2159 #endif
2160
2161           if (GET_RTX_CLASS (GET_CODE (insn)) != 'i')
2162             continue;
2163
2164           if (GET_CODE (insn) == CALL_INSN)
2165             {
2166               for (regno = 0; regno < FIRST_PSEUDO_REGISTER; regno++)
2167                 if ((call_used_regs[regno]
2168                      && regno != STACK_POINTER_REGNUM
2169 #if HARD_FRAME_POINTER_REGNUM != FRAME_POINTER_REGNUM
2170                      && regno != HARD_FRAME_POINTER_REGNUM
2171 #endif
2172 #if ARG_POINTER_REGNUM != FRAME_POINTER_REGNUM
2173                      && ! (regno == ARG_POINTER_REGNUM && fixed_regs[regno])
2174 #endif
2175 #if defined (PIC_OFFSET_TABLE_REGNUM) && !defined (PIC_OFFSET_TABLE_REG_CALL_CLOBBERED)
2176                      && ! (regno == PIC_OFFSET_TABLE_REGNUM && flag_pic)
2177 #endif
2178
2179                      && regno != FRAME_POINTER_REGNUM)
2180                     || global_regs[regno])
2181                   record_last_reg_set_info (insn, regno);
2182               if (! CONST_CALL_P (insn))
2183                 record_last_mem_set_info (insn);
2184             }
2185
2186           last_set_insn = insn;
2187           note_stores (PATTERN (insn), record_last_set_info);
2188         }
2189
2190       /* The next pass builds the hash table.  */
2191
2192       for (insn = BLOCK_HEAD (bb), in_libcall_block = 0;
2193            insn && insn != NEXT_INSN (BLOCK_END (bb));
2194            insn = NEXT_INSN (insn))
2195         {
2196           if (GET_RTX_CLASS (GET_CODE (insn)) == 'i')
2197             {
2198               if (find_reg_note (insn, REG_LIBCALL, NULL_RTX))
2199                 in_libcall_block = 1;
2200               else if (find_reg_note (insn, REG_RETVAL, NULL_RTX))
2201                 in_libcall_block = 0;
2202               hash_scan_insn (insn, set_p, in_libcall_block);
2203             }
2204         }
2205     }
2206
2207   free (reg_first_set);
2208   free (reg_last_set);
2209   /* Catch bugs early.  */
2210   reg_first_set = reg_last_set = 0;
2211 }
2212
2213 /* Allocate space for the set hash table.
2214    N_INSNS is the number of instructions in the function.
2215    It is used to determine the number of buckets to use.  */
2216
2217 static void
2218 alloc_set_hash_table (n_insns)
2219      int n_insns;
2220 {
2221   int n;
2222
2223   set_hash_table_size = n_insns / 4;
2224   if (set_hash_table_size < 11)
2225     set_hash_table_size = 11;
2226   /* Attempt to maintain efficient use of hash table.
2227      Making it an odd number is simplest for now.
2228      ??? Later take some measurements.  */
2229   set_hash_table_size |= 1;
2230   n = set_hash_table_size * sizeof (struct expr *);
2231   set_hash_table = (struct expr **) gmalloc (n);
2232 }
2233
2234 /* Free things allocated by alloc_set_hash_table.  */
2235
2236 static void
2237 free_set_hash_table ()
2238 {
2239   free (set_hash_table);
2240 }
2241
2242 /* Compute the hash table for doing copy/const propagation.  */
2243
2244 static void
2245 compute_set_hash_table ()
2246 {
2247   /* Initialize count of number of entries in hash table.  */
2248   n_sets = 0;
2249   bzero ((char *) set_hash_table, set_hash_table_size * sizeof (struct expr *));
2250
2251   compute_hash_table (1);
2252 }
2253
2254 /* Allocate space for the expression hash table.
2255    N_INSNS is the number of instructions in the function.
2256    It is used to determine the number of buckets to use.  */
2257
2258 static void
2259 alloc_expr_hash_table (n_insns)
2260      int n_insns;
2261 {
2262   int n;
2263
2264   expr_hash_table_size = n_insns / 2;
2265   /* Make sure the amount is usable.  */
2266   if (expr_hash_table_size < 11)
2267     expr_hash_table_size = 11;
2268   /* Attempt to maintain efficient use of hash table.
2269      Making it an odd number is simplest for now.
2270      ??? Later take some measurements.  */
2271   expr_hash_table_size |= 1;
2272   n = expr_hash_table_size * sizeof (struct expr *);
2273   expr_hash_table = (struct expr **) gmalloc (n);
2274 }
2275
2276 /* Free things allocated by alloc_expr_hash_table.  */
2277
2278 static void
2279 free_expr_hash_table ()
2280 {
2281   free (expr_hash_table);
2282 }
2283
2284 /* Compute the hash table for doing GCSE.  */
2285
2286 static void
2287 compute_expr_hash_table ()
2288 {
2289   /* Initialize count of number of entries in hash table.  */
2290   n_exprs = 0;
2291   bzero ((char *) expr_hash_table, expr_hash_table_size * sizeof (struct expr *));
2292
2293   compute_hash_table (0);
2294 }
2295 \f
2296 /* Expression tracking support.  */
2297
2298 /* Lookup pattern PAT in the expression table.
2299    The result is a pointer to the table entry, or NULL if not found.  */
2300
2301 static struct expr *
2302 lookup_expr (pat)
2303      rtx pat;
2304 {
2305   int do_not_record_p;
2306   unsigned int hash = hash_expr (pat, GET_MODE (pat), &do_not_record_p,
2307                                  expr_hash_table_size);
2308   struct expr *expr;
2309
2310   if (do_not_record_p)
2311     return NULL;
2312
2313   expr = expr_hash_table[hash];
2314
2315   while (expr && ! expr_equiv_p (expr->expr, pat))
2316     expr = expr->next_same_hash;
2317
2318   return expr;
2319 }
2320
2321 /* Lookup REGNO in the set table.
2322    If PAT is non-NULL look for the entry that matches it, otherwise return
2323    the first entry for REGNO.
2324    The result is a pointer to the table entry, or NULL if not found.  */
2325
2326 static struct expr *
2327 lookup_set (regno, pat)
2328      int regno;
2329      rtx pat;
2330 {
2331   unsigned int hash = hash_set (regno, set_hash_table_size);
2332   struct expr *expr;
2333
2334   expr = set_hash_table[hash];
2335
2336   if (pat)
2337     {
2338       while (expr && ! expr_equiv_p (expr->expr, pat))
2339         expr = expr->next_same_hash;
2340     }
2341   else
2342     {
2343       while (expr && REGNO (SET_DEST (expr->expr)) != regno)
2344         expr = expr->next_same_hash;
2345     }
2346
2347   return expr;
2348 }
2349
2350 /* Return the next entry for REGNO in list EXPR.  */
2351
2352 static struct expr *
2353 next_set (regno, expr)
2354      int regno;
2355      struct expr *expr;
2356 {
2357   do
2358     expr = expr->next_same_hash;
2359   while (expr && REGNO (SET_DEST (expr->expr)) != regno);
2360   return expr;
2361 }
2362
2363 /* Reset tables used to keep track of what's still available [since the
2364    start of the block].  */
2365
2366 static void
2367 reset_opr_set_tables ()
2368 {
2369   /* Maintain a bitmap of which regs have been set since beginning of
2370      the block.  */
2371   sbitmap_zero (reg_set_bitmap);
2372   /* Also keep a record of the last instruction to modify memory.
2373      For now this is very trivial, we only record whether any memory
2374      location has been modified.  */
2375   mem_last_set = 0;
2376 }
2377
2378 /* Return non-zero if the operands of X are not set before INSN in
2379    INSN's basic block.  */
2380
2381 static int
2382 oprs_not_set_p (x, insn)
2383      rtx x, insn;
2384 {
2385   int i;
2386   enum rtx_code code;
2387   const char *fmt;
2388
2389   /* repeat is used to turn tail-recursion into iteration.  */
2390 repeat:
2391
2392   if (x == 0)
2393     return 1;
2394
2395   code = GET_CODE (x);
2396   switch (code)
2397     {
2398     case PC:
2399     case CC0:
2400     case CONST:
2401     case CONST_INT:
2402     case CONST_DOUBLE:
2403     case SYMBOL_REF:
2404     case LABEL_REF:
2405     case ADDR_VEC:
2406     case ADDR_DIFF_VEC:
2407       return 1;
2408
2409     case MEM:
2410       if (mem_last_set != 0)
2411         return 0;
2412       x = XEXP (x, 0);
2413       goto repeat;
2414
2415     case REG:
2416       return ! TEST_BIT (reg_set_bitmap, REGNO (x));
2417
2418     default:
2419       break;
2420     }
2421
2422   fmt = GET_RTX_FORMAT (code);
2423   for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
2424     {
2425       if (fmt[i] == 'e')
2426         {
2427           int not_set_p;
2428           /* If we are about to do the last recursive call
2429              needed at this level, change it into iteration.
2430              This function is called enough to be worth it.  */
2431           if (i == 0)
2432             {
2433               x = XEXP (x, 0);
2434               goto repeat;
2435             }
2436           not_set_p = oprs_not_set_p (XEXP (x, i), insn);
2437           if (! not_set_p)
2438             return 0;
2439         }
2440       else if (fmt[i] == 'E')
2441         {
2442           int j;
2443           for (j = 0; j < XVECLEN (x, i); j++)
2444             {
2445               int not_set_p = oprs_not_set_p (XVECEXP (x, i, j), insn);
2446               if (! not_set_p)
2447                 return 0;
2448             }
2449         }
2450     }
2451
2452   return 1;
2453 }
2454
2455 /* Mark things set by a CALL.  */
2456
2457 static void
2458 mark_call (insn)
2459      rtx insn;
2460 {
2461   mem_last_set = INSN_CUID (insn);
2462 }
2463
2464 /* Mark things set by a SET.  */
2465
2466 static void
2467 mark_set (pat, insn)
2468      rtx pat, insn;
2469 {
2470   rtx dest = SET_DEST (pat);
2471
2472   while (GET_CODE (dest) == SUBREG
2473          || GET_CODE (dest) == ZERO_EXTRACT
2474          || GET_CODE (dest) == SIGN_EXTRACT
2475          || GET_CODE (dest) == STRICT_LOW_PART)
2476     dest = XEXP (dest, 0);
2477
2478   if (GET_CODE (dest) == REG)
2479     SET_BIT (reg_set_bitmap, REGNO (dest));
2480   else if (GET_CODE (dest) == MEM)
2481     mem_last_set = INSN_CUID (insn);
2482
2483   if (GET_CODE (SET_SRC (pat)) == CALL)
2484     mark_call (insn);
2485 }
2486
2487 /* Record things set by a CLOBBER.  */
2488
2489 static void
2490 mark_clobber (pat, insn)
2491      rtx pat, insn;
2492 {
2493   rtx clob = XEXP (pat, 0);
2494
2495   while (GET_CODE (clob) == SUBREG || GET_CODE (clob) == STRICT_LOW_PART)
2496     clob = XEXP (clob, 0);
2497
2498   if (GET_CODE (clob) == REG)
2499     SET_BIT (reg_set_bitmap, REGNO (clob));
2500   else
2501     mem_last_set = INSN_CUID (insn);
2502 }
2503
2504 /* Record things set by INSN.
2505    This data is used by oprs_not_set_p.  */
2506
2507 static void
2508 mark_oprs_set (insn)
2509      rtx insn;
2510 {
2511   rtx pat = PATTERN (insn);
2512
2513   if (GET_CODE (pat) == SET)
2514     mark_set (pat, insn);
2515   else if (GET_CODE (pat) == PARALLEL)
2516     {
2517       int i;
2518
2519       for (i = 0; i < XVECLEN (pat, 0); i++)
2520         {
2521           rtx x = XVECEXP (pat, 0, i);
2522
2523           if (GET_CODE (x) == SET)
2524             mark_set (x, insn);
2525           else if (GET_CODE (x) == CLOBBER)
2526             mark_clobber (x, insn);
2527           else if (GET_CODE (x) == CALL)
2528             mark_call (insn);
2529         }
2530     }
2531   else if (GET_CODE (pat) == CLOBBER)
2532     mark_clobber (pat, insn);
2533   else if (GET_CODE (pat) == CALL)
2534     mark_call (insn);
2535 }
2536
2537 \f
2538 /* Classic GCSE reaching definition support.  */
2539
2540 /* Allocate reaching def variables.  */
2541
2542 static void
2543 alloc_rd_mem (n_blocks, n_insns)
2544      int n_blocks, n_insns;
2545 {
2546   rd_kill = (sbitmap *) sbitmap_vector_alloc (n_blocks, n_insns);
2547   sbitmap_vector_zero (rd_kill, n_basic_blocks);
2548
2549   rd_gen = (sbitmap *) sbitmap_vector_alloc (n_blocks, n_insns);
2550   sbitmap_vector_zero (rd_gen, n_basic_blocks);
2551
2552   reaching_defs = (sbitmap *) sbitmap_vector_alloc (n_blocks, n_insns);
2553   sbitmap_vector_zero (reaching_defs, n_basic_blocks);
2554
2555   rd_out = (sbitmap *) sbitmap_vector_alloc (n_blocks, n_insns);
2556   sbitmap_vector_zero (rd_out, n_basic_blocks);
2557 }
2558
2559 /* Free reaching def variables.  */
2560
2561 static void
2562 free_rd_mem ()
2563 {
2564   free (rd_kill);
2565   free (rd_gen);
2566   free (reaching_defs);
2567   free (rd_out);
2568 }
2569
2570 /* Add INSN to the kills of BB.
2571    REGNO, set in BB, is killed by INSN.  */
2572
2573 static void
2574 handle_rd_kill_set (insn, regno, bb)
2575      rtx insn;
2576      int regno, bb;
2577 {
2578   struct reg_set *this_reg = reg_set_table[regno];
2579
2580   while (this_reg)
2581     {
2582       if (BLOCK_NUM (this_reg->insn) != BLOCK_NUM (insn))
2583         SET_BIT (rd_kill[bb], INSN_CUID (this_reg->insn));
2584       this_reg = this_reg->next;
2585     }
2586 }
2587
2588 /* Compute the set of kill's for reaching definitions.  */
2589
2590 static void
2591 compute_kill_rd ()
2592 {
2593   int bb,cuid;
2594
2595   /* For each block
2596        For each set bit in `gen' of the block (i.e each insn which
2597            generates a definition in the block)
2598          Call the reg set by the insn corresponding to that bit regx
2599          Look at the linked list starting at reg_set_table[regx]
2600          For each setting of regx in the linked list, which is not in
2601              this block
2602            Set the bit in `kill' corresponding to that insn
2603     */
2604
2605   for (bb = 0; bb < n_basic_blocks; bb++)
2606     {
2607       for (cuid = 0; cuid < max_cuid; cuid++)
2608         {
2609           if (TEST_BIT (rd_gen[bb], cuid))
2610             {
2611               rtx insn = CUID_INSN (cuid);
2612               rtx pat = PATTERN (insn);
2613
2614               if (GET_CODE (insn) == CALL_INSN)
2615                 {
2616                   int regno;
2617
2618                   for (regno = 0; regno < FIRST_PSEUDO_REGISTER; regno++)
2619                     {
2620                       if ((call_used_regs[regno]
2621                            && regno != STACK_POINTER_REGNUM
2622 #if HARD_FRAME_POINTER_REGNUM != FRAME_POINTER_REGNUM
2623                            && regno != HARD_FRAME_POINTER_REGNUM
2624 #endif
2625 #if ARG_POINTER_REGNUM != FRAME_POINTER_REGNUM
2626                            && ! (regno == ARG_POINTER_REGNUM
2627                                  && fixed_regs[regno])
2628 #endif
2629 #if defined (PIC_OFFSET_TABLE_REGNUM) && !defined (PIC_OFFSET_TABLE_REG_CALL_CLOBBERED)
2630                            && ! (regno == PIC_OFFSET_TABLE_REGNUM && flag_pic)
2631 #endif
2632                            && regno != FRAME_POINTER_REGNUM)
2633                           || global_regs[regno])
2634                         handle_rd_kill_set (insn, regno, bb);
2635                     }
2636                 }
2637
2638               if (GET_CODE (pat) == PARALLEL)
2639                 {
2640                   int i;
2641
2642                   /* We work backwards because ... */
2643                   for (i = XVECLEN (pat, 0) - 1; i >= 0; i--)
2644                     {
2645                       enum rtx_code code = GET_CODE (XVECEXP (pat, 0, i));
2646                       if ((code == SET || code == CLOBBER)
2647                           && GET_CODE (XEXP (XVECEXP (pat, 0, i), 0)) == REG)
2648                         handle_rd_kill_set (insn,
2649                                             REGNO (XEXP (XVECEXP (pat, 0, i), 0)),
2650                                             bb);
2651                     }
2652                 }
2653               else if (GET_CODE (pat) == SET)
2654                 {
2655                   if (GET_CODE (SET_DEST (pat)) == REG)
2656                     {
2657                       /* Each setting of this register outside of this block
2658                          must be marked in the set of kills in this block.  */
2659                       handle_rd_kill_set (insn, REGNO (SET_DEST (pat)), bb);
2660                     }
2661                 }
2662               /* FIXME: CLOBBER? */
2663             }
2664         }
2665     }
2666 }
2667
2668 /* Compute the reaching definitions as in
2669    Compilers Principles, Techniques, and Tools. Aho, Sethi, Ullman,
2670    Chapter 10.  It is the same algorithm as used for computing available
2671    expressions but applied to the gens and kills of reaching definitions.  */
2672
2673 static void
2674 compute_rd ()
2675 {
2676   int bb, changed, passes;
2677
2678   for (bb = 0; bb < n_basic_blocks; bb++)
2679     sbitmap_copy (rd_out[bb] /*dst*/, rd_gen[bb] /*src*/);
2680
2681   passes = 0;
2682   changed = 1;
2683   while (changed)
2684     {
2685       changed = 0;
2686       for (bb = 0; bb < n_basic_blocks; bb++)
2687         {
2688           sbitmap_union_of_preds (reaching_defs[bb], rd_out, bb);
2689           changed |= sbitmap_union_of_diff (rd_out[bb], rd_gen[bb],
2690                                             reaching_defs[bb], rd_kill[bb]);
2691         }
2692       passes++;
2693     }
2694
2695   if (gcse_file)
2696     fprintf (gcse_file, "reaching def computation: %d passes\n", passes);
2697 }
2698 \f
2699 /* Classic GCSE available expression support.  */
2700
2701 /* Allocate memory for available expression computation.  */
2702
2703 static void
2704 alloc_avail_expr_mem (n_blocks, n_exprs)
2705      int n_blocks, n_exprs;
2706 {
2707   ae_kill = (sbitmap *) sbitmap_vector_alloc (n_blocks, n_exprs);
2708   sbitmap_vector_zero (ae_kill, n_basic_blocks);
2709
2710   ae_gen = (sbitmap *) sbitmap_vector_alloc (n_blocks, n_exprs);
2711   sbitmap_vector_zero (ae_gen, n_basic_blocks);
2712
2713   ae_in = (sbitmap *) sbitmap_vector_alloc (n_blocks, n_exprs);
2714   sbitmap_vector_zero (ae_in, n_basic_blocks);
2715
2716   ae_out = (sbitmap *) sbitmap_vector_alloc (n_blocks, n_exprs);
2717   sbitmap_vector_zero (ae_out, n_basic_blocks);
2718
2719   u_bitmap = (sbitmap) sbitmap_alloc (n_exprs);
2720   sbitmap_ones (u_bitmap);
2721 }
2722
2723 static void
2724 free_avail_expr_mem ()
2725 {
2726   free (ae_kill);
2727   free (ae_gen);
2728   free (ae_in);
2729   free (ae_out);
2730   free (u_bitmap);
2731 }
2732
2733 /* Compute the set of available expressions generated in each basic block.  */
2734
2735 static void
2736 compute_ae_gen ()
2737 {
2738   int i;
2739
2740   /* For each recorded occurrence of each expression, set ae_gen[bb][expr].
2741      This is all we have to do because an expression is not recorded if it
2742      is not available, and the only expressions we want to work with are the
2743      ones that are recorded.  */
2744
2745   for (i = 0; i < expr_hash_table_size; i++)
2746     {
2747       struct expr *expr = expr_hash_table[i];
2748       while (expr != NULL)
2749         {
2750           struct occr *occr = expr->avail_occr;
2751           while (occr != NULL)
2752             {
2753               SET_BIT (ae_gen[BLOCK_NUM (occr->insn)], expr->bitmap_index);
2754               occr = occr->next;
2755             }
2756           expr = expr->next_same_hash;
2757         }
2758     }
2759 }
2760
2761 /* Return non-zero if expression X is killed in BB.  */
2762
2763 static int
2764 expr_killed_p (x, bb)
2765      rtx x;
2766      int bb;
2767 {
2768   int i;
2769   enum rtx_code code;
2770   const char *fmt;
2771
2772   /* repeat is used to turn tail-recursion into iteration.  */
2773  repeat:
2774
2775   if (x == 0)
2776     return 1;
2777
2778   code = GET_CODE (x);
2779   switch (code)
2780     {
2781     case REG:
2782       return TEST_BIT (reg_set_in_block[bb], REGNO (x));
2783
2784     case MEM:
2785       if (mem_set_in_block[bb])
2786         return 1;
2787       x = XEXP (x, 0);
2788       goto repeat;
2789
2790     case PC:
2791     case CC0: /*FIXME*/
2792     case CONST:
2793     case CONST_INT:
2794     case CONST_DOUBLE:
2795     case SYMBOL_REF:
2796     case LABEL_REF:
2797     case ADDR_VEC:
2798     case ADDR_DIFF_VEC:
2799       return 0;
2800
2801     default:
2802       break;
2803     }
2804
2805   i = GET_RTX_LENGTH (code) - 1;
2806   fmt = GET_RTX_FORMAT (code);
2807   for (; i >= 0; i--)
2808     {
2809       if (fmt[i] == 'e')
2810         {
2811           rtx tem = XEXP (x, i);
2812
2813           /* If we are about to do the last recursive call
2814              needed at this level, change it into iteration.
2815              This function is called enough to be worth it.  */
2816           if (i == 0)
2817             {
2818               x = tem;
2819               goto repeat;
2820             }
2821           if (expr_killed_p (tem, bb))
2822             return 1;
2823         }
2824       else if (fmt[i] == 'E')
2825         {
2826           int j;
2827           for (j = 0; j < XVECLEN (x, i); j++)
2828             {
2829               if (expr_killed_p (XVECEXP (x, i, j), bb))
2830                 return 1;
2831             }
2832         }
2833     }
2834
2835   return 0;
2836 }
2837
2838 /* Compute the set of available expressions killed in each basic block.  */
2839
2840 static void
2841 compute_ae_kill (ae_gen, ae_kill)
2842      sbitmap *ae_gen, *ae_kill;
2843 {
2844   int bb,i;
2845
2846   for (bb = 0; bb < n_basic_blocks; bb++)
2847     {
2848       for (i = 0; i < expr_hash_table_size; i++)
2849         {
2850           struct expr *expr = expr_hash_table[i];
2851
2852           for ( ; expr != NULL; expr = expr->next_same_hash)
2853             {
2854               /* Skip EXPR if generated in this block.  */
2855               if (TEST_BIT (ae_gen[bb], expr->bitmap_index))
2856                 continue;
2857
2858               if (expr_killed_p (expr->expr, bb))
2859                 SET_BIT (ae_kill[bb], expr->bitmap_index);
2860             }
2861         }
2862     }
2863 }
2864 \f
2865 /* Actually perform the Classic GCSE optimizations.  */
2866
2867 /* Return non-zero if occurrence OCCR of expression EXPR reaches block BB.
2868
2869    CHECK_SELF_LOOP is non-zero if we should consider a block reaching itself
2870    as a positive reach.  We want to do this when there are two computations
2871    of the expression in the block.
2872
2873    VISITED is a pointer to a working buffer for tracking which BB's have
2874    been visited.  It is NULL for the top-level call.
2875
2876    We treat reaching expressions that go through blocks containing the same
2877    reaching expression as "not reaching".  E.g. if EXPR is generated in blocks
2878    2 and 3, INSN is in block 4, and 2->3->4, we treat the expression in block
2879    2 as not reaching.  The intent is to improve the probability of finding
2880    only one reaching expression and to reduce register lifetimes by picking
2881    the closest such expression.  */
2882
2883 static int
2884 expr_reaches_here_p (occr, expr, bb, check_self_loop, visited)
2885      struct occr *occr;
2886      struct expr *expr;
2887      int bb;
2888      int check_self_loop;
2889      char *visited;
2890 {
2891   edge pred;
2892
2893   if (visited == NULL)
2894     {
2895       visited = (char *) alloca (n_basic_blocks);
2896       bzero (visited, n_basic_blocks);
2897     }
2898
2899   for (pred = BASIC_BLOCK(bb)->pred; pred != NULL; pred = pred->pred_next)
2900     {
2901       int pred_bb = pred->src->index;
2902
2903       if (visited[pred_bb])
2904         {
2905           /* This predecessor has already been visited.
2906              Nothing to do.  */
2907           ;
2908         }
2909       else if (pred_bb == bb)
2910         {
2911           /* BB loops on itself.  */
2912           if (check_self_loop
2913               && TEST_BIT (ae_gen[pred_bb], expr->bitmap_index)
2914               && BLOCK_NUM (occr->insn) == pred_bb)
2915             return 1;
2916           visited[pred_bb] = 1;
2917         }
2918       /* Ignore this predecessor if it kills the expression.  */
2919       else if (TEST_BIT (ae_kill[pred_bb], expr->bitmap_index))
2920         visited[pred_bb] = 1;
2921       /* Does this predecessor generate this expression?  */
2922       else if (TEST_BIT (ae_gen[pred_bb], expr->bitmap_index))
2923         {
2924           /* Is this the occurrence we're looking for?
2925              Note that there's only one generating occurrence per block
2926              so we just need to check the block number.  */
2927           if (BLOCK_NUM (occr->insn) == pred_bb)
2928             return 1;
2929           visited[pred_bb] = 1;
2930         }
2931       /* Neither gen nor kill.  */
2932       else
2933         {
2934           visited[pred_bb] = 1;
2935           if (expr_reaches_here_p (occr, expr, pred_bb, check_self_loop, visited))
2936             return 1;
2937         }
2938     }
2939
2940   /* All paths have been checked.  */
2941   return 0;
2942 }
2943
2944 /* Return the instruction that computes EXPR that reaches INSN's basic block.
2945    If there is more than one such instruction, return NULL.
2946
2947    Called only by handle_avail_expr.  */
2948
2949 static rtx
2950 computing_insn (expr, insn)
2951      struct expr *expr;
2952      rtx insn;
2953 {
2954   int bb = BLOCK_NUM (insn);
2955
2956   if (expr->avail_occr->next == NULL)
2957     {
2958       if (BLOCK_NUM (expr->avail_occr->insn) == bb)
2959         {
2960           /* The available expression is actually itself
2961              (i.e. a loop in the flow graph) so do nothing.  */
2962           return NULL;
2963         }
2964       /* (FIXME) Case that we found a pattern that was created by
2965          a substitution that took place.  */
2966       return expr->avail_occr->insn;
2967     }
2968   else
2969     {
2970       /* Pattern is computed more than once.
2971          Search backwards from this insn to see how many of these
2972          computations actually reach this insn.  */
2973       struct occr *occr;
2974       rtx insn_computes_expr = NULL;
2975       int can_reach = 0;
2976
2977       for (occr = expr->avail_occr; occr != NULL; occr = occr->next)
2978         {
2979           if (BLOCK_NUM (occr->insn) == bb)
2980             {
2981               /* The expression is generated in this block.
2982                  The only time we care about this is when the expression
2983                  is generated later in the block [and thus there's a loop].
2984                  We let the normal cse pass handle the other cases.  */
2985               if (INSN_CUID (insn) < INSN_CUID (occr->insn))
2986                 {
2987                   if (expr_reaches_here_p (occr, expr, bb, 1, NULL))
2988                     {
2989                       can_reach++;
2990                       if (can_reach > 1)
2991                         return NULL;
2992                       insn_computes_expr = occr->insn;
2993                     }
2994                 }
2995             }
2996           else /* Computation of the pattern outside this block.  */
2997             {
2998               if (expr_reaches_here_p (occr, expr, bb, 0, NULL))
2999                 {
3000                   can_reach++;
3001                   if (can_reach > 1)
3002                     return NULL;
3003                   insn_computes_expr = occr->insn;
3004                 }
3005             }
3006         }
3007
3008       if (insn_computes_expr == NULL)
3009         abort ();
3010       return insn_computes_expr;
3011     }
3012 }
3013
3014 /* Return non-zero if the definition in DEF_INSN can reach INSN.
3015    Only called by can_disregard_other_sets.  */
3016
3017 static int
3018 def_reaches_here_p (insn, def_insn)
3019      rtx insn, def_insn;
3020 {
3021   rtx reg;
3022
3023   if (TEST_BIT (reaching_defs[BLOCK_NUM (insn)], INSN_CUID (def_insn)))
3024     return 1;
3025
3026   if (BLOCK_NUM (insn) == BLOCK_NUM (def_insn))
3027     {
3028       if (INSN_CUID (def_insn) < INSN_CUID (insn))
3029         {
3030           if (GET_CODE (PATTERN (def_insn)) == PARALLEL)
3031             return 1;
3032           if (GET_CODE (PATTERN (def_insn)) == CLOBBER)
3033             reg = XEXP (PATTERN (def_insn), 0);
3034           else if (GET_CODE (PATTERN (def_insn)) == SET)
3035             reg = SET_DEST (PATTERN (def_insn));
3036           else
3037             abort ();
3038           return ! reg_set_between_p (reg, NEXT_INSN (def_insn), insn);
3039         }
3040       else
3041         return 0;
3042     }
3043
3044   return 0;
3045 }
3046
3047 /* Return non-zero if *ADDR_THIS_REG can only have one value at INSN.
3048    The value returned is the number of definitions that reach INSN.
3049    Returning a value of zero means that [maybe] more than one definition
3050    reaches INSN and the caller can't perform whatever optimization it is
3051    trying.  i.e. it is always safe to return zero.  */
3052
3053 static int
3054 can_disregard_other_sets (addr_this_reg, insn, for_combine)
3055      struct reg_set **addr_this_reg;
3056      rtx insn;
3057      int for_combine;
3058 {
3059   int number_of_reaching_defs = 0;
3060   struct reg_set *this_reg = *addr_this_reg;
3061
3062   while (this_reg)
3063     {
3064       if (def_reaches_here_p (insn, this_reg->insn))
3065         {
3066           number_of_reaching_defs++;
3067           /* Ignore parallels for now.  */
3068           if (GET_CODE (PATTERN (this_reg->insn)) == PARALLEL)
3069             return 0;
3070           if (!for_combine
3071               && (GET_CODE (PATTERN (this_reg->insn)) == CLOBBER
3072                   || ! rtx_equal_p (SET_SRC (PATTERN (this_reg->insn)),
3073                                     SET_SRC (PATTERN (insn)))))
3074             {
3075               /* A setting of the reg to a different value reaches INSN.  */
3076               return 0;
3077             }
3078           if (number_of_reaching_defs > 1)
3079             {
3080               /* If in this setting the value the register is being
3081                  set to is equal to the previous value the register
3082                  was set to and this setting reaches the insn we are
3083                  trying to do the substitution on then we are ok.  */
3084
3085               if (GET_CODE (PATTERN (this_reg->insn)) == CLOBBER)
3086                 return 0;
3087               if (! rtx_equal_p (SET_SRC (PATTERN (this_reg->insn)),
3088                                  SET_SRC (PATTERN (insn))))
3089                 return 0;
3090             }
3091           *addr_this_reg = this_reg;
3092         }
3093
3094       /* prev_this_reg = this_reg; */
3095       this_reg = this_reg->next;
3096     }
3097
3098   return number_of_reaching_defs;
3099 }
3100
3101 /* Expression computed by insn is available and the substitution is legal,
3102    so try to perform the substitution.
3103
3104    The result is non-zero if any changes were made.  */
3105
3106 static int
3107 handle_avail_expr (insn, expr)
3108      rtx insn;
3109      struct expr *expr;
3110 {
3111   rtx pat, insn_computes_expr;
3112   rtx to;
3113   struct reg_set *this_reg;
3114   int found_setting, use_src;
3115   int changed = 0;
3116
3117   /* We only handle the case where one computation of the expression
3118      reaches this instruction.  */
3119   insn_computes_expr = computing_insn (expr, insn);
3120   if (insn_computes_expr == NULL)
3121     return 0;
3122
3123   found_setting = 0;
3124   use_src = 0;
3125
3126   /* At this point we know only one computation of EXPR outside of this
3127      block reaches this insn.  Now try to find a register that the
3128      expression is computed into.  */
3129
3130   if (GET_CODE (SET_SRC (PATTERN (insn_computes_expr))) == REG)
3131     {
3132       /* This is the case when the available expression that reaches
3133          here has already been handled as an available expression.  */
3134       int regnum_for_replacing = REGNO (SET_SRC (PATTERN (insn_computes_expr)));
3135       /* If the register was created by GCSE we can't use `reg_set_table',
3136          however we know it's set only once.  */
3137       if (regnum_for_replacing >= max_gcse_regno
3138           /* If the register the expression is computed into is set only once,
3139              or only one set reaches this insn, we can use it.  */
3140           || (((this_reg = reg_set_table[regnum_for_replacing]),
3141                this_reg->next == NULL)
3142               || can_disregard_other_sets (&this_reg, insn, 0)))
3143        {
3144          use_src = 1;
3145          found_setting = 1;
3146        }
3147     }
3148
3149   if (!found_setting)
3150     {
3151       int regnum_for_replacing = REGNO (SET_DEST (PATTERN (insn_computes_expr)));
3152       /* This shouldn't happen.  */
3153       if (regnum_for_replacing >= max_gcse_regno)
3154         abort ();
3155       this_reg = reg_set_table[regnum_for_replacing];
3156       /* If the register the expression is computed into is set only once,
3157          or only one set reaches this insn, use it.  */
3158       if (this_reg->next == NULL
3159           || can_disregard_other_sets (&this_reg, insn, 0))
3160         found_setting = 1;
3161     }
3162
3163   if (found_setting)
3164     {
3165       pat = PATTERN (insn);
3166       if (use_src)
3167         to = SET_SRC (PATTERN (insn_computes_expr));
3168       else
3169         to = SET_DEST (PATTERN (insn_computes_expr));
3170       changed = validate_change (insn, &SET_SRC (pat), to, 0);
3171
3172       /* We should be able to ignore the return code from validate_change but
3173          to play it safe we check.  */
3174       if (changed)
3175         {
3176           gcse_subst_count++;
3177           if (gcse_file != NULL)
3178             {
3179               fprintf (gcse_file, "GCSE: Replacing the source in insn %d with reg %d %s insn %d\n",
3180                        INSN_UID (insn), REGNO (to),
3181                        use_src ? "from" : "set in",
3182                        INSN_UID (insn_computes_expr));
3183             }
3184
3185         }
3186     }
3187   /* The register that the expr is computed into is set more than once.  */
3188   else if (1 /*expensive_op(this_pattrn->op) && do_expensive_gcse)*/)
3189     {
3190       /* Insert an insn after insnx that copies the reg set in insnx
3191          into a new pseudo register call this new register REGN.
3192          From insnb until end of basic block or until REGB is set
3193          replace all uses of REGB with REGN.  */
3194       rtx new_insn;
3195
3196       to = gen_reg_rtx (GET_MODE (SET_DEST (PATTERN (insn_computes_expr))));
3197
3198       /* Generate the new insn.  */
3199       /* ??? If the change fails, we return 0, even though we created
3200          an insn.  I think this is ok.  */
3201       new_insn
3202         = emit_insn_after (gen_rtx_SET (VOIDmode, to,
3203                                         SET_DEST (PATTERN (insn_computes_expr))),
3204                                   insn_computes_expr);
3205       /* Keep block number table up to date.  */
3206       set_block_num (new_insn, BLOCK_NUM (insn_computes_expr));
3207       /* Keep register set table up to date.  */
3208       record_one_set (REGNO (to), new_insn);
3209
3210       gcse_create_count++;
3211       if (gcse_file != NULL)
3212         {
3213           fprintf (gcse_file, "GCSE: Creating insn %d to copy value of reg %d, computed in insn %d,\n",
3214                    INSN_UID (NEXT_INSN (insn_computes_expr)),
3215                    REGNO (SET_SRC (PATTERN (NEXT_INSN (insn_computes_expr)))),
3216                    INSN_UID (insn_computes_expr));
3217           fprintf (gcse_file, "      into newly allocated reg %d\n", REGNO (to));
3218         }
3219
3220       pat = PATTERN (insn);
3221
3222       /* Do register replacement for INSN.  */
3223       changed = validate_change (insn, &SET_SRC (pat),
3224                                  SET_DEST (PATTERN (NEXT_INSN (insn_computes_expr))),
3225                                  0);
3226
3227       /* We should be able to ignore the return code from validate_change but
3228          to play it safe we check.  */
3229       if (changed)
3230         {
3231           gcse_subst_count++;
3232           if (gcse_file != NULL)
3233             {
3234               fprintf (gcse_file, "GCSE: Replacing the source in insn %d with reg %d set in insn %d\n",
3235                        INSN_UID (insn),
3236                        REGNO (SET_DEST (PATTERN (NEXT_INSN (insn_computes_expr)))),
3237                        INSN_UID (insn_computes_expr));
3238             }
3239
3240         }
3241     }
3242
3243   return changed;
3244 }
3245
3246 /* Perform classic GCSE.
3247    This is called by one_classic_gcse_pass after all the dataflow analysis
3248    has been done.
3249
3250    The result is non-zero if a change was made.  */
3251
3252 static int
3253 classic_gcse ()
3254 {
3255   int bb, changed;
3256   rtx insn;
3257
3258   /* Note we start at block 1.  */
3259
3260   changed = 0;
3261   for (bb = 1; bb < n_basic_blocks; bb++)
3262     {
3263       /* Reset tables used to keep track of what's still valid [since the
3264          start of the block].  */
3265       reset_opr_set_tables ();
3266
3267       for (insn = BLOCK_HEAD (bb);
3268            insn != NULL && insn != NEXT_INSN (BLOCK_END (bb));
3269            insn = NEXT_INSN (insn))
3270         {
3271           /* Is insn of form (set (pseudo-reg) ...)?  */
3272
3273           if (GET_CODE (insn) == INSN
3274               && GET_CODE (PATTERN (insn)) == SET
3275               && GET_CODE (SET_DEST (PATTERN (insn))) == REG
3276               && REGNO (SET_DEST (PATTERN (insn))) >= FIRST_PSEUDO_REGISTER)
3277             {
3278               rtx pat = PATTERN (insn);
3279               rtx src = SET_SRC (pat);
3280               struct expr *expr;
3281
3282               if (want_to_gcse_p (src)
3283                   /* Is the expression recorded?  */
3284                   && ((expr = lookup_expr (src)) != NULL)
3285                   /* Is the expression available [at the start of the
3286                      block]?  */
3287                   && TEST_BIT (ae_in[bb], expr->bitmap_index)
3288                   /* Are the operands unchanged since the start of the
3289                      block?  */
3290                   && oprs_not_set_p (src, insn))
3291                 changed |= handle_avail_expr (insn, expr);
3292             }
3293
3294           /* Keep track of everything modified by this insn.  */
3295           /* ??? Need to be careful w.r.t. mods done to INSN.  */
3296           if (GET_RTX_CLASS (GET_CODE (insn)) == 'i')
3297             mark_oprs_set (insn);
3298         }
3299     }
3300
3301   return changed;
3302 }
3303
3304 /* Top level routine to perform one classic GCSE pass.
3305
3306    Return non-zero if a change was made.  */
3307
3308 static int
3309 one_classic_gcse_pass (pass)
3310      int pass;
3311 {
3312   int changed = 0;
3313
3314   gcse_subst_count = 0;
3315   gcse_create_count = 0;
3316
3317   alloc_expr_hash_table (max_cuid);
3318   alloc_rd_mem (n_basic_blocks, max_cuid);
3319   compute_expr_hash_table ();
3320   if (gcse_file)
3321     dump_hash_table (gcse_file, "Expression", expr_hash_table,
3322                      expr_hash_table_size, n_exprs);
3323   if (n_exprs > 0)
3324     {
3325       int passes;
3326       compute_kill_rd ();
3327       compute_rd ();
3328       alloc_avail_expr_mem (n_basic_blocks, n_exprs);
3329       compute_ae_gen ();
3330       compute_ae_kill (ae_gen, ae_kill);
3331       passes = compute_available (ae_gen, ae_kill, ae_out, ae_in);
3332       if (gcse_file)
3333         fprintf (gcse_file, "avail expr computation: %d passes\n", passes);
3334       changed = classic_gcse ();
3335       free_avail_expr_mem ();
3336     }
3337   free_rd_mem ();
3338   free_expr_hash_table ();
3339
3340   if (gcse_file)
3341     {
3342       fprintf (gcse_file, "\n");
3343       fprintf (gcse_file, "GCSE of %s, pass %d: %d bytes needed, %d substs, %d insns created\n",
3344                current_function_name, pass,
3345                bytes_used, gcse_subst_count, gcse_create_count);
3346     }
3347
3348   return changed;
3349 }
3350 \f
3351 /* Compute copy/constant propagation working variables.  */
3352
3353 /* Local properties of assignments.  */
3354
3355 static sbitmap *cprop_pavloc;
3356 static sbitmap *cprop_absaltered;
3357
3358 /* Global properties of assignments (computed from the local properties).  */
3359
3360 static sbitmap *cprop_avin;
3361 static sbitmap *cprop_avout;
3362
3363 /* Allocate vars used for copy/const propagation.
3364    N_BLOCKS is the number of basic blocks.
3365    N_SETS is the number of sets.  */
3366
3367 static void
3368 alloc_cprop_mem (n_blocks, n_sets)
3369      int n_blocks, n_sets;
3370 {
3371   cprop_pavloc = sbitmap_vector_alloc (n_blocks, n_sets);
3372   cprop_absaltered = sbitmap_vector_alloc (n_blocks, n_sets);
3373
3374   cprop_avin = sbitmap_vector_alloc (n_blocks, n_sets);
3375   cprop_avout = sbitmap_vector_alloc (n_blocks, n_sets);
3376 }
3377
3378 /* Free vars used by copy/const propagation.  */
3379
3380 static void
3381 free_cprop_mem ()
3382 {
3383   free (cprop_pavloc);
3384   free (cprop_absaltered);
3385   free (cprop_avin);
3386   free (cprop_avout);
3387 }
3388
3389 /* For each block, compute whether X is transparent.
3390    X is either an expression or an assignment [though we don't care which,
3391    for this context an assignment is treated as an expression].
3392    For each block where an element of X is modified, set (SET_P == 1) or reset
3393    (SET_P == 0) the INDX bit in BMAP.  */
3394
3395 static void
3396 compute_transp (x, indx, bmap, set_p)
3397      rtx x;
3398      int indx;
3399      sbitmap *bmap;
3400      int set_p;
3401 {
3402   int bb,i;
3403   enum rtx_code code;
3404   const char *fmt;
3405
3406   /* repeat is used to turn tail-recursion into iteration.  */
3407  repeat:
3408
3409   if (x == 0)
3410     return;
3411
3412   code = GET_CODE (x);
3413   switch (code)
3414     {
3415     case REG:
3416       {
3417         reg_set *r;
3418         int regno = REGNO (x);
3419
3420         if (set_p)
3421           {
3422             if (regno < FIRST_PSEUDO_REGISTER)
3423               {
3424                 for (bb = 0; bb < n_basic_blocks; bb++)
3425                   if (TEST_BIT (reg_set_in_block[bb], regno))
3426                     SET_BIT (bmap[bb], indx);
3427               }
3428             else
3429               {
3430                 for (r = reg_set_table[regno]; r != NULL; r = r->next)
3431                   {
3432                     bb = BLOCK_NUM (r->insn);
3433                     SET_BIT (bmap[bb], indx);
3434                   }
3435               }
3436           }
3437         else
3438           {
3439             if (regno < FIRST_PSEUDO_REGISTER)
3440               {
3441                 for (bb = 0; bb < n_basic_blocks; bb++)
3442                   if (TEST_BIT (reg_set_in_block[bb], regno))
3443                     RESET_BIT (bmap[bb], indx);
3444               }
3445             else
3446               {
3447                 for (r = reg_set_table[regno]; r != NULL; r = r->next)
3448                   {
3449                     bb = BLOCK_NUM (r->insn);
3450                     RESET_BIT (bmap[bb], indx);
3451                   }
3452               }
3453           }
3454         return;
3455       }
3456
3457     case MEM:
3458       if (set_p)
3459         {
3460           for (bb = 0; bb < n_basic_blocks; bb++)
3461             if (mem_set_in_block[bb])
3462               SET_BIT (bmap[bb], indx);
3463         }
3464       else
3465         {
3466           for (bb = 0; bb < n_basic_blocks; bb++)
3467             if (mem_set_in_block[bb])
3468               RESET_BIT (bmap[bb], indx);
3469         }
3470       x = XEXP (x, 0);
3471       goto repeat;
3472
3473     case PC:
3474     case CC0: /*FIXME*/
3475     case CONST:
3476     case CONST_INT:
3477     case CONST_DOUBLE:
3478     case SYMBOL_REF:
3479     case LABEL_REF:
3480     case ADDR_VEC:
3481     case ADDR_DIFF_VEC:
3482       return;
3483
3484     default:
3485       break;
3486     }
3487
3488   i = GET_RTX_LENGTH (code) - 1;
3489   fmt = GET_RTX_FORMAT (code);
3490   for (; i >= 0; i--)
3491     {
3492       if (fmt[i] == 'e')
3493         {
3494           rtx tem = XEXP (x, i);
3495
3496           /* If we are about to do the last recursive call
3497              needed at this level, change it into iteration.
3498              This function is called enough to be worth it.  */
3499           if (i == 0)
3500             {
3501               x = tem;
3502               goto repeat;
3503             }
3504           compute_transp (tem, indx, bmap, set_p);
3505         }
3506       else if (fmt[i] == 'E')
3507         {
3508           int j;
3509           for (j = 0; j < XVECLEN (x, i); j++)
3510             compute_transp (XVECEXP (x, i, j), indx, bmap, set_p);
3511         }
3512     }
3513 }
3514
3515 /* Compute the available expressions at the start and end of each
3516    basic block for cprop.  This particular dataflow equation is
3517    used often enough that we might want to generalize it and make
3518    as a subroutine for other global optimizations that need available
3519    in/out information.  */
3520 static void
3521 compute_cprop_avinout ()
3522 {
3523   int bb, changed, passes;
3524
3525   sbitmap_zero (cprop_avin[0]);
3526   sbitmap_vector_ones (cprop_avout, n_basic_blocks);
3527
3528   passes = 0;
3529   changed = 1;
3530   while (changed)
3531     {
3532       changed = 0;
3533       for (bb = 0; bb < n_basic_blocks; bb++)
3534         {
3535           if (bb != 0)
3536             sbitmap_intersection_of_preds (cprop_avin[bb], cprop_avout, bb);
3537           changed |= sbitmap_union_of_diff (cprop_avout[bb],
3538                                             cprop_pavloc[bb],
3539                                             cprop_avin[bb],
3540                                             cprop_absaltered[bb]);
3541         }
3542       passes++;
3543     }
3544
3545   if (gcse_file)
3546     fprintf (gcse_file, "cprop avail expr computation: %d passes\n", passes);
3547 }
3548
3549 /* Top level routine to do the dataflow analysis needed by copy/const
3550    propagation.  */
3551
3552 static void
3553 compute_cprop_data ()
3554 {
3555   compute_local_properties (cprop_absaltered, cprop_pavloc, NULL, 1);
3556   compute_cprop_avinout ();
3557 }
3558 \f
3559 /* Copy/constant propagation.  */
3560
3561 /* Maximum number of register uses in an insn that we handle.  */
3562 #define MAX_USES 8
3563
3564 /* Table of uses found in an insn.
3565    Allocated statically to avoid alloc/free complexity and overhead.  */
3566 static struct reg_use reg_use_table[MAX_USES];
3567
3568 /* Index into `reg_use_table' while building it.  */
3569 static int reg_use_count;
3570
3571 /* Set up a list of register numbers used in INSN.
3572    The found uses are stored in `reg_use_table'.
3573    `reg_use_count' is initialized to zero before entry, and
3574    contains the number of uses in the table upon exit.
3575
3576    ??? If a register appears multiple times we will record it multiple
3577    times.  This doesn't hurt anything but it will slow things down.  */
3578
3579 static void
3580 find_used_regs (x)
3581      rtx x;
3582 {
3583   int i;
3584   enum rtx_code code;
3585   const char *fmt;
3586
3587   /* repeat is used to turn tail-recursion into iteration.  */
3588  repeat:
3589
3590   if (x == 0)
3591     return;
3592
3593   code = GET_CODE (x);
3594   switch (code)
3595     {
3596     case REG:
3597       if (reg_use_count == MAX_USES)
3598         return;
3599       reg_use_table[reg_use_count].reg_rtx = x;
3600       reg_use_count++;
3601       return;
3602
3603     case MEM:
3604       x = XEXP (x, 0);
3605       goto repeat;
3606
3607     case PC:
3608     case CC0:
3609     case CONST:
3610     case CONST_INT:
3611     case CONST_DOUBLE:
3612     case SYMBOL_REF:
3613     case LABEL_REF:
3614     case CLOBBER:
3615     case ADDR_VEC:
3616     case ADDR_DIFF_VEC:
3617     case ASM_INPUT: /*FIXME*/
3618       return;
3619
3620     case SET:
3621       if (GET_CODE (SET_DEST (x)) == MEM)
3622         find_used_regs (SET_DEST (x));
3623       x = SET_SRC (x);
3624       goto repeat;
3625
3626     default:
3627       break;
3628     }
3629
3630   /* Recursively scan the operands of this expression.  */
3631
3632   fmt = GET_RTX_FORMAT (code);
3633   for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
3634     {
3635       if (fmt[i] == 'e')
3636         {
3637           /* If we are about to do the last recursive call
3638              needed at this level, change it into iteration.
3639              This function is called enough to be worth it.  */
3640           if (i == 0)
3641             {
3642               x = XEXP (x, 0);
3643               goto repeat;
3644             }
3645           find_used_regs (XEXP (x, i));
3646         }
3647       else if (fmt[i] == 'E')
3648         {
3649           int j;
3650           for (j = 0; j < XVECLEN (x, i); j++)
3651             find_used_regs (XVECEXP (x, i, j));
3652         }
3653     }
3654 }
3655
3656 /* Try to replace all non-SET_DEST occurrences of FROM in INSN with TO.
3657    Returns non-zero is successful.  */
3658
3659 static int
3660 try_replace_reg (from, to, insn)
3661      rtx from, to, insn;
3662 {
3663   /* If this fails we could try to simplify the result of the
3664      replacement and attempt to recognize the simplified insn.
3665
3666      But we need a general simplify_rtx that doesn't have pass
3667      specific state variables.  I'm not aware of one at the moment.  */
3668   return validate_replace_src (from, to, insn);
3669 }
3670
3671 /* Find a set of REGNO that is available on entry to INSN's block.
3672    Returns NULL if not found.  */
3673
3674 static struct expr *
3675 find_avail_set (regno, insn)
3676      int regno;
3677      rtx insn;
3678 {
3679   /* SET1 contains the last set found that can be returned to the caller for
3680      use in a substitution.  */
3681   struct expr *set1 = 0;
3682
3683   /* Loops are not possible here.  To get a loop we would need two sets
3684      available at the start of the block containing INSN.  ie we would
3685      need two sets like this available at the start of the block:
3686
3687        (set (reg X) (reg Y))
3688        (set (reg Y) (reg X))
3689
3690      This can not happen since the set of (reg Y) would have killed the
3691      set of (reg X) making it unavailable at the start of this block.  */
3692   while (1)
3693      {
3694       rtx src;
3695       struct expr *set = lookup_set (regno, NULL_RTX);
3696
3697       /* Find a set that is available at the start of the block
3698          which contains INSN.  */
3699       while (set)
3700         {
3701           if (TEST_BIT (cprop_avin[BLOCK_NUM (insn)], set->bitmap_index))
3702             break;
3703           set = next_set (regno, set);
3704         }
3705
3706       /* If no available set was found we've reached the end of the
3707          (possibly empty) copy chain.  */
3708       if (set == 0)
3709         break;
3710
3711       if (GET_CODE (set->expr) != SET)
3712         abort ();
3713
3714       src = SET_SRC (set->expr);
3715
3716       /* We know the set is available.
3717          Now check that SRC is ANTLOC (i.e. none of the source operands
3718          have changed since the start of the block).
3719
3720          If the source operand changed, we may still use it for the next
3721          iteration of this loop, but we may not use it for substitutions.  */
3722       if (CONSTANT_P (src) || oprs_not_set_p (src, insn))
3723         set1 = set;
3724
3725       /* If the source of the set is anything except a register, then
3726          we have reached the end of the copy chain.  */
3727       if (GET_CODE (src) != REG)
3728         break;
3729
3730       /* Follow the copy chain, ie start another iteration of the loop
3731          and see if we have an available copy into SRC.  */
3732       regno = REGNO (src);
3733      }
3734
3735   /* SET1 holds the last set that was available and anticipatable at
3736      INSN.  */
3737   return set1;
3738 }
3739
3740 /* Subroutine of cprop_insn that tries to propagate constants into
3741    JUMP_INSNS.  INSN must be a conditional jump; COPY is a copy of it
3742    that we can use for substitutions.
3743    REG_USED is the use we will try to replace, SRC is the constant we
3744    will try to substitute for it.
3745    Returns nonzero if a change was made.  */
3746 static int
3747 cprop_jump (insn, copy, reg_used, src)
3748      rtx insn, copy;
3749      struct reg_use *reg_used;
3750      rtx src;
3751 {
3752   rtx set = PATTERN (copy);
3753   rtx temp;
3754
3755   /* Replace the register with the appropriate constant.  */
3756   replace_rtx (SET_SRC (set), reg_used->reg_rtx, src);
3757
3758   temp = simplify_ternary_operation (GET_CODE (SET_SRC (set)),
3759                                      GET_MODE (SET_SRC (set)),
3760                                      GET_MODE (XEXP (SET_SRC (set), 0)),
3761                                      XEXP (SET_SRC (set), 0),
3762                                      XEXP (SET_SRC (set), 1),
3763                                      XEXP (SET_SRC (set), 2));
3764
3765   /* If no simplification can be made, then try the next
3766      register.  */
3767   if (temp == 0)
3768     return 0;
3769
3770   SET_SRC (set) = temp;
3771
3772   /* That may have changed the structure of TEMP, so
3773      force it to be rerecognized if it has not turned
3774      into a nop or unconditional jump.  */
3775
3776   INSN_CODE (copy) = -1;
3777   if ((SET_DEST (set) == pc_rtx
3778        && (SET_SRC (set) == pc_rtx
3779            || GET_CODE (SET_SRC (set)) == LABEL_REF))
3780       || recog (PATTERN (copy), copy, NULL) >= 0)
3781     {
3782       /* This has either become an unconditional jump
3783          or a nop-jump.  We'd like to delete nop jumps
3784          here, but doing so confuses gcse.  So we just
3785          make the replacement and let later passes
3786          sort things out.  */
3787       PATTERN (insn) = set;
3788       INSN_CODE (insn) = -1;
3789
3790       /* One less use of the label this insn used to jump to
3791          if we turned this into a NOP jump.  */
3792       if (SET_SRC (set) == pc_rtx && JUMP_LABEL (insn) != 0)
3793         --LABEL_NUSES (JUMP_LABEL (insn));
3794
3795       /* If this has turned into an unconditional jump,
3796          then put a barrier after it so that the unreachable
3797          code will be deleted.  */
3798       if (GET_CODE (SET_SRC (set)) == LABEL_REF)
3799         emit_barrier_after (insn);
3800
3801       run_jump_opt_after_gcse = 1;
3802
3803       const_prop_count++;
3804       if (gcse_file != NULL)
3805         {
3806           int regno = REGNO (reg_used->reg_rtx);
3807           fprintf (gcse_file, "CONST-PROP: Replacing reg %d in insn %d with constant ",
3808                    regno, INSN_UID (insn));
3809           print_rtl (gcse_file, src);
3810           fprintf (gcse_file, "\n");
3811         }
3812       return 1;
3813     }
3814   return 0;
3815 }
3816
3817 #ifdef HAVE_cc0
3818 /* Subroutine of cprop_insn that tries to propagate constants into
3819    JUMP_INSNS for machines that have CC0.  INSN is a single set that
3820    stores into CC0; the insn following it is a conditional jump.
3821    REG_USED is the use we will try to replace, SRC is the constant we
3822    will try to substitute for it.
3823    Returns nonzero if a change was made.  */
3824 static int
3825 cprop_cc0_jump (insn, reg_used, src)
3826      rtx insn;
3827      struct reg_use *reg_used;
3828      rtx src;
3829 {
3830   rtx jump = NEXT_INSN (insn);
3831   rtx copy = copy_rtx (jump);
3832   rtx set = PATTERN (copy);
3833
3834   /* We need to copy the source of the cc0 setter, as cprop_jump is going to
3835      substitute into it.  */
3836   replace_rtx (SET_SRC (set), cc0_rtx, copy_rtx (SET_SRC (PATTERN (insn))));
3837   if (! cprop_jump (jump, copy, reg_used, src))
3838     return 0;
3839
3840   /* If we succeeded, delete the cc0 setter.  */
3841   PUT_CODE (insn, NOTE);
3842   NOTE_LINE_NUMBER (insn) = NOTE_INSN_DELETED;
3843   NOTE_SOURCE_FILE (insn) = 0;
3844   return 1;
3845  }
3846 #endif
3847
3848 /* Perform constant and copy propagation on INSN.
3849    The result is non-zero if a change was made.  */
3850
3851 static int
3852 cprop_insn (insn, alter_jumps)
3853      rtx insn;
3854      int alter_jumps;
3855 {
3856   struct reg_use *reg_used;
3857   int changed = 0;
3858
3859   /* Only propagate into SETs.  Note that a conditional jump is a
3860      SET with pc_rtx as the destination.  */
3861   if ((GET_CODE (insn) != INSN
3862        && GET_CODE (insn) != JUMP_INSN)
3863       || GET_CODE (PATTERN (insn)) != SET)
3864     return 0;
3865
3866   reg_use_count = 0;
3867   find_used_regs (PATTERN (insn));
3868
3869   reg_used = &reg_use_table[0];
3870   for ( ; reg_use_count > 0; reg_used++, reg_use_count--)
3871     {
3872       rtx pat, src;
3873       struct expr *set;
3874       int regno = REGNO (reg_used->reg_rtx);
3875
3876       /* Ignore registers created by GCSE.
3877          We do this because ... */
3878       if (regno >= max_gcse_regno)
3879         continue;
3880
3881       /* If the register has already been set in this block, there's
3882          nothing we can do.  */
3883       if (! oprs_not_set_p (reg_used->reg_rtx, insn))
3884         continue;
3885
3886       /* Find an assignment that sets reg_used and is available
3887          at the start of the block.  */
3888       set = find_avail_set (regno, insn);
3889       if (! set)
3890         continue;
3891
3892       pat = set->expr;
3893       /* ??? We might be able to handle PARALLELs.  Later.  */
3894       if (GET_CODE (pat) != SET)
3895         abort ();
3896       src = SET_SRC (pat);
3897
3898       /* Constant propagation.  */
3899       if (GET_CODE (src) == CONST_INT || GET_CODE (src) == CONST_DOUBLE
3900           || GET_CODE (src) == SYMBOL_REF)
3901         {
3902           /* Handle normal insns first.  */
3903           if (GET_CODE (insn) == INSN
3904               && try_replace_reg (reg_used->reg_rtx, src, insn))
3905             {
3906               changed = 1;
3907               const_prop_count++;
3908               if (gcse_file != NULL)
3909                 {
3910                   fprintf (gcse_file, "CONST-PROP: Replacing reg %d in insn %d with constant ",
3911                            regno, INSN_UID (insn));
3912                   print_rtl (gcse_file, src);
3913                   fprintf (gcse_file, "\n");
3914                 }
3915
3916               /* The original insn setting reg_used may or may not now be
3917                  deletable.  We leave the deletion to flow.  */
3918             }
3919
3920           /* Try to propagate a CONST_INT into a conditional jump.
3921              We're pretty specific about what we will handle in this
3922              code, we can extend this as necessary over time.
3923
3924              Right now the insn in question must look like
3925              (set (pc) (if_then_else ...))  */
3926           else if (alter_jumps
3927                    && GET_CODE (insn) == JUMP_INSN
3928                    && condjump_p (insn)
3929                    && ! simplejump_p (insn))
3930             changed |= cprop_jump (insn, copy_rtx (insn), reg_used, src);
3931 #ifdef HAVE_cc0
3932           /* Similar code for machines that use a pair of CC0 setter and
3933              conditional jump insn.  */
3934           else if (alter_jumps
3935                    && GET_CODE (PATTERN (insn)) == SET
3936                    && SET_DEST (PATTERN (insn)) == cc0_rtx
3937                    && GET_CODE (NEXT_INSN (insn)) == JUMP_INSN
3938                    && condjump_p (NEXT_INSN (insn))
3939                    && ! simplejump_p (NEXT_INSN (insn)))
3940             changed |= cprop_cc0_jump (insn, reg_used, src);
3941 #endif
3942         }
3943       else if (GET_CODE (src) == REG
3944                && REGNO (src) >= FIRST_PSEUDO_REGISTER
3945                && REGNO (src) != regno)
3946         {
3947           if (try_replace_reg (reg_used->reg_rtx, src, insn))
3948             {
3949               changed = 1;
3950               copy_prop_count++;
3951               if (gcse_file != NULL)
3952                 {
3953                   fprintf (gcse_file, "COPY-PROP: Replacing reg %d in insn %d with reg %d\n",
3954                            regno, INSN_UID (insn), REGNO (src));
3955                 }
3956
3957               /* The original insn setting reg_used may or may not now be
3958                  deletable.  We leave the deletion to flow.  */
3959               /* FIXME: If it turns out that the insn isn't deletable,
3960                  then we may have unnecessarily extended register lifetimes
3961                  and made things worse.  */
3962             }
3963         }
3964     }
3965
3966   return changed;
3967 }
3968
3969 /* Forward propagate copies.
3970    This includes copies and constants.
3971    Return non-zero if a change was made.  */
3972
3973 static int
3974 cprop (alter_jumps)
3975      int alter_jumps;
3976 {
3977   int bb, changed;
3978   rtx insn;
3979
3980   /* Note we start at block 1.  */
3981
3982   changed = 0;
3983   for (bb = 1; bb < n_basic_blocks; bb++)
3984     {
3985       /* Reset tables used to keep track of what's still valid [since the
3986          start of the block].  */
3987       reset_opr_set_tables ();
3988
3989       for (insn = BLOCK_HEAD (bb);
3990            insn != NULL && insn != NEXT_INSN (BLOCK_END (bb));
3991            insn = NEXT_INSN (insn))
3992         {
3993           if (GET_RTX_CLASS (GET_CODE (insn)) == 'i')
3994             {
3995               changed |= cprop_insn (insn, alter_jumps);
3996
3997               /* Keep track of everything modified by this insn.  */
3998               /* ??? Need to be careful w.r.t. mods done to INSN.  Don't
3999                  call mark_oprs_set if we turned the insn into a NOTE.  */
4000               if (GET_CODE (insn) != NOTE)
4001                 mark_oprs_set (insn);
4002             }
4003         }
4004     }
4005
4006   if (gcse_file != NULL)
4007     fprintf (gcse_file, "\n");
4008
4009   return changed;
4010 }
4011
4012 /* Perform one copy/constant propagation pass.
4013    F is the first insn in the function.
4014    PASS is the pass count.  */
4015
4016 static int
4017 one_cprop_pass (pass, alter_jumps)
4018      int pass;
4019      int alter_jumps;
4020 {
4021   int changed = 0;
4022
4023   const_prop_count = 0;
4024   copy_prop_count = 0;
4025
4026   alloc_set_hash_table (max_cuid);
4027   compute_set_hash_table ();
4028   if (gcse_file)
4029     dump_hash_table (gcse_file, "SET", set_hash_table, set_hash_table_size,
4030                      n_sets);
4031   if (n_sets > 0)
4032     {
4033       alloc_cprop_mem (n_basic_blocks, n_sets);
4034       compute_cprop_data ();
4035       changed = cprop (alter_jumps);
4036       free_cprop_mem ();
4037     }
4038   free_set_hash_table ();
4039
4040   if (gcse_file)
4041     {
4042       fprintf (gcse_file, "CPROP of %s, pass %d: %d bytes needed, %d const props, %d copy props\n",
4043                current_function_name, pass,
4044                bytes_used, const_prop_count, copy_prop_count);
4045       fprintf (gcse_file, "\n");
4046     }
4047
4048   return changed;
4049 }
4050 \f
4051 /* Compute PRE+LCM working variables.  */
4052
4053 /* Local properties of expressions.  */
4054 /* Nonzero for expressions that are transparent in the block.  */
4055 static sbitmap *transp;
4056
4057 /* Nonzero for expressions that are transparent at the end of the block.
4058    This is only zero for expressions killed by abnormal critical edge
4059    created by a calls.  */
4060 static sbitmap *transpout;
4061
4062 /* Nonzero for expressions that are computed (available) in the block.  */
4063 static sbitmap *comp;
4064
4065 /* Nonzero for expressions that are locally anticipatable in the block.  */
4066 static sbitmap *antloc;
4067
4068 /* Nonzero for expressions where this block is an optimal computation
4069    point.  */
4070 static sbitmap *pre_optimal;
4071
4072 /* Nonzero for expressions which are redundant in a particular block.  */
4073 static sbitmap *pre_redundant;
4074
4075 /* Nonzero for expressions which should be inserted on a specific edge.  */
4076 static sbitmap *pre_insert_map;
4077
4078 /* Nonzero for expressions which should be deleted in a specific block.  */
4079 static sbitmap *pre_delete_map;
4080
4081 /* Contains the edge_list returned by pre_edge_lcm.  */
4082 static struct edge_list *edge_list;
4083
4084 static sbitmap *temp_bitmap;
4085
4086 /* Redundant insns.  */
4087 static sbitmap pre_redundant_insns;
4088
4089 /* Allocate vars used for PRE analysis.  */
4090
4091 static void
4092 alloc_pre_mem (n_blocks, n_exprs)
4093      int n_blocks, n_exprs;
4094 {
4095   transp = sbitmap_vector_alloc (n_blocks, n_exprs);
4096   comp = sbitmap_vector_alloc (n_blocks, n_exprs);
4097   antloc = sbitmap_vector_alloc (n_blocks, n_exprs);
4098
4099   temp_bitmap = sbitmap_vector_alloc (n_blocks, n_exprs);
4100   pre_optimal = NULL;
4101   pre_redundant = NULL;
4102   pre_insert_map = NULL;
4103   pre_delete_map = NULL;
4104   ae_in = NULL;
4105   ae_out = NULL;
4106   u_bitmap = NULL;
4107   transpout = sbitmap_vector_alloc (n_blocks, n_exprs);
4108   ae_kill = sbitmap_vector_alloc (n_blocks, n_exprs);
4109   /* pre_insert and pre_delete are allocated later.  */
4110 }
4111
4112 /* Free vars used for PRE analysis.  */
4113
4114 static void
4115 free_pre_mem ()
4116 {
4117   free (transp);
4118   free (comp);
4119   free (antloc);
4120
4121   if (pre_optimal)
4122     free (pre_optimal);
4123   if (pre_redundant)
4124     free (pre_redundant);
4125   if (pre_insert_map)
4126     free (pre_insert_map);
4127   if (pre_delete_map)
4128     free (pre_delete_map);
4129   if (transpout)
4130     free (transpout);
4131
4132   if (ae_in)
4133     free (ae_in);
4134   if (ae_out)
4135     free (ae_out);
4136   if (ae_kill)
4137     free (ae_kill);
4138   if (u_bitmap)
4139     free (u_bitmap);
4140
4141   transp = comp = antloc = NULL;
4142   pre_optimal = pre_redundant = pre_insert_map = pre_delete_map = NULL;
4143   transpout = ae_in = ae_out = ae_kill = NULL;
4144   u_bitmap = NULL;
4145
4146 }
4147
4148 /* Top level routine to do the dataflow analysis needed by PRE.  */
4149
4150 static void
4151 compute_pre_data ()
4152 {
4153   compute_local_properties (transp, comp, antloc, 0);
4154   compute_transpout ();
4155   sbitmap_vector_zero (ae_kill, n_basic_blocks);
4156   compute_ae_kill (comp, ae_kill);
4157   edge_list = pre_edge_lcm (gcse_file, n_exprs, transp, comp, antloc,
4158                             ae_kill, &pre_insert_map, &pre_delete_map);
4159 }
4160
4161 \f
4162 /* PRE utilities */
4163
4164 /* Return non-zero if an occurrence of expression EXPR in OCCR_BB would reach
4165    block BB.
4166
4167    VISITED is a pointer to a working buffer for tracking which BB's have
4168    been visited.  It is NULL for the top-level call.
4169
4170    CHECK_PRE_COMP controls whether or not we check for a computation of
4171    EXPR in OCCR_BB.
4172
4173    We treat reaching expressions that go through blocks containing the same
4174    reaching expression as "not reaching".  E.g. if EXPR is generated in blocks
4175    2 and 3, INSN is in block 4, and 2->3->4, we treat the expression in block
4176    2 as not reaching.  The intent is to improve the probability of finding
4177    only one reaching expression and to reduce register lifetimes by picking
4178    the closest such expression.  */
4179
4180 static int
4181 pre_expr_reaches_here_p (occr_bb, expr, bb, check_pre_comp, visited)
4182      int occr_bb;
4183      struct expr *expr;
4184      int bb;
4185      int check_pre_comp;
4186      char *visited;
4187 {
4188   edge pred;
4189
4190   if (visited == NULL)
4191     {
4192       visited = (char *) alloca (n_basic_blocks);
4193       bzero (visited, n_basic_blocks);
4194     }
4195
4196   for (pred = BASIC_BLOCK (bb)->pred; pred != NULL; pred = pred->pred_next)
4197     {
4198       int pred_bb = pred->src->index;
4199
4200       if (pred->src == ENTRY_BLOCK_PTR
4201           /* Has predecessor has already been visited?  */
4202           || visited[pred_bb])
4203         {
4204           /* Nothing to do.  */
4205         }
4206       /* Does this predecessor generate this expression?  */
4207       else if ((!check_pre_comp && occr_bb == pred_bb)
4208                || TEST_BIT (comp[pred_bb], expr->bitmap_index))
4209         {
4210           /* Is this the occurrence we're looking for?
4211              Note that there's only one generating occurrence per block
4212              so we just need to check the block number.  */
4213           if (occr_bb == pred_bb)
4214             return 1;
4215           visited[pred_bb] = 1;
4216         }
4217       /* Ignore this predecessor if it kills the expression.  */
4218       else if (! TEST_BIT (transp[pred_bb], expr->bitmap_index))
4219         visited[pred_bb] = 1;
4220       /* Neither gen nor kill.  */
4221       else
4222         {
4223           visited[pred_bb] = 1;
4224           if (pre_expr_reaches_here_p (occr_bb, expr, pred_bb,
4225                                        check_pre_comp, visited))
4226             return 1;
4227         }
4228     }
4229
4230   /* All paths have been checked.  */
4231   return 0;
4232 }
4233 \f
4234
4235 /* Given an expr, generate RTL which we can insert at the end of a BB,
4236    or on an edge.  Set the block number of any insns generated to
4237    the value of BB.  */
4238
4239 static rtx
4240 process_insert_insn (expr)
4241      struct expr *expr;
4242 {
4243   rtx reg = expr->reaching_reg;
4244   rtx pat, copied_expr;
4245   rtx first_new_insn;
4246
4247   start_sequence ();
4248   copied_expr = copy_rtx (expr->expr);
4249   emit_move_insn (reg, copied_expr);
4250   first_new_insn = get_insns ();
4251   pat = gen_sequence ();
4252   end_sequence ();
4253
4254   return pat;
4255 }
4256
4257 /* Add EXPR to the end of basic block BB.
4258
4259    This is used by both the PRE and code hoisting.
4260
4261    For PRE, we want to verify that the expr is either transparent
4262    or locally anticipatable in the target block.  This check makes
4263    no sense for code hoisting.  */
4264
4265 static void
4266 insert_insn_end_bb (expr, bb, pre)
4267      struct expr *expr;
4268      int bb;
4269      int pre;
4270 {
4271   rtx insn = BLOCK_END (bb);
4272   rtx new_insn;
4273   rtx reg = expr->reaching_reg;
4274   int regno = REGNO (reg);
4275   rtx pat;
4276
4277   pat = process_insert_insn (expr);
4278
4279   /* If the last insn is a jump, insert EXPR in front [taking care to
4280      handle cc0, etc. properly].  */
4281
4282   if (GET_CODE (insn) == JUMP_INSN)
4283     {
4284 #ifdef HAVE_cc0
4285       rtx note;
4286 #endif
4287
4288       /* If this is a jump table, then we can't insert stuff here.  Since
4289          we know the previous real insn must be the tablejump, we insert
4290          the new instruction just before the tablejump.  */
4291       if (GET_CODE (PATTERN (insn)) == ADDR_VEC
4292           || GET_CODE (PATTERN (insn)) == ADDR_DIFF_VEC)
4293         insn = prev_real_insn (insn);
4294
4295 #ifdef HAVE_cc0
4296       /* FIXME: 'twould be nice to call prev_cc0_setter here but it aborts
4297          if cc0 isn't set.  */
4298       note = find_reg_note (insn, REG_CC_SETTER, NULL_RTX);
4299       if (note)
4300         insn = XEXP (note, 0);
4301       else
4302         {
4303           rtx maybe_cc0_setter = prev_nonnote_insn (insn);
4304           if (maybe_cc0_setter
4305               && GET_RTX_CLASS (GET_CODE (maybe_cc0_setter)) == 'i'
4306               && sets_cc0_p (PATTERN (maybe_cc0_setter)))
4307             insn = maybe_cc0_setter;
4308         }
4309 #endif
4310       /* FIXME: What if something in cc0/jump uses value set in new insn?  */
4311       new_insn = emit_insn_before (pat, insn);
4312       if (BLOCK_HEAD (bb) == insn)
4313         BLOCK_HEAD (bb) = new_insn;
4314     }
4315   /* Likewise if the last insn is a call, as will happen in the presence
4316      of exception handling.  */
4317   else if (GET_CODE (insn) == CALL_INSN)
4318     {
4319       HARD_REG_SET parm_regs;
4320       int nparm_regs;
4321       rtx p;
4322
4323       /* Keeping in mind SMALL_REGISTER_CLASSES and parameters in registers,
4324          we search backward and place the instructions before the first
4325          parameter is loaded.  Do this for everyone for consistency and a
4326          presumtion that we'll get better code elsewhere as well.  */
4327
4328       /* It should always be the case that we can put these instructions
4329          anywhere in the basic block with performing PRE optimizations.
4330          Check this.  */
4331       if (pre
4332           && !TEST_BIT (antloc[bb], expr->bitmap_index)
4333           && !TEST_BIT (transp[bb], expr->bitmap_index))
4334         abort ();
4335
4336       /* Since different machines initialize their parameter registers
4337          in different orders, assume nothing.  Collect the set of all
4338          parameter registers.  */
4339       CLEAR_HARD_REG_SET (parm_regs);
4340       nparm_regs = 0;
4341       for (p = CALL_INSN_FUNCTION_USAGE (insn); p ; p = XEXP (p, 1))
4342         if (GET_CODE (XEXP (p, 0)) == USE
4343             && GET_CODE (XEXP (XEXP (p, 0), 0)) == REG)
4344           {
4345             int regno = REGNO (XEXP (XEXP (p, 0), 0));
4346             if (regno >= FIRST_PSEUDO_REGISTER)
4347               abort ();
4348             SET_HARD_REG_BIT (parm_regs, regno);
4349             nparm_regs++;
4350           }
4351
4352       /* Search backward for the first set of a register in this set.  */
4353       while (nparm_regs && BLOCK_HEAD (bb) != insn)
4354         {
4355           insn = PREV_INSN (insn);
4356           p = single_set (insn);
4357           if (p && GET_CODE (SET_DEST (p)) == REG
4358               && REGNO (SET_DEST (p)) < FIRST_PSEUDO_REGISTER
4359               && TEST_HARD_REG_BIT (parm_regs, REGNO (SET_DEST (p))))
4360             {
4361               CLEAR_HARD_REG_BIT (parm_regs, REGNO (SET_DEST (p)));
4362               nparm_regs--;
4363             }
4364         }
4365
4366       /* If we found all the parameter loads, then we want to insert
4367          before the first parameter load.
4368
4369          If we did not find all the parameter loads, then we might have
4370          stopped on the head of the block, which could be a CODE_LABEL.
4371          If we inserted before the CODE_LABEL, then we would be putting
4372          the insn in the wrong basic block.  In that case, put the insn
4373          after the CODE_LABEL.
4374
4375          ?!? Do we need to account for NOTE_INSN_BASIC_BLOCK here?  */
4376       if (GET_CODE (insn) != CODE_LABEL)
4377         {
4378           new_insn = emit_insn_before (pat, insn);
4379           if (BLOCK_HEAD (bb) == insn)
4380             BLOCK_HEAD (bb) = new_insn;
4381         }
4382       else
4383         {
4384           new_insn = emit_insn_after (pat, insn);
4385         }
4386     }
4387   else
4388     {
4389       new_insn = emit_insn_after (pat, insn);
4390       BLOCK_END (bb) = new_insn;
4391     }
4392
4393   /* Keep block number table up to date.
4394      Note, PAT could be a multiple insn sequence, we have to make
4395      sure that each insn in the sequence is handled.  */
4396   if (GET_CODE (pat) == SEQUENCE)
4397     {
4398       int i;
4399
4400       for (i = 0; i < XVECLEN (pat, 0); i++)
4401         {
4402           rtx insn = XVECEXP (pat, 0, i);
4403           set_block_num (insn, bb);
4404           if (GET_RTX_CLASS (GET_CODE (insn)) == 'i')
4405             add_label_notes (PATTERN (insn), new_insn);
4406           record_set_insn = insn;
4407           note_stores (PATTERN (insn), record_set_info);
4408         }
4409     }
4410   else
4411     {
4412       add_label_notes (SET_SRC (pat), new_insn);
4413       set_block_num (new_insn, bb);
4414       /* Keep register set table up to date.  */
4415       record_one_set (regno, new_insn);
4416     }
4417
4418   gcse_create_count++;
4419
4420   if (gcse_file)
4421     {
4422       fprintf (gcse_file, "PRE/HOIST: end of bb %d, insn %d, copying expression %d to reg %d\n",
4423                bb, INSN_UID (new_insn), expr->bitmap_index, regno);
4424     }
4425 }
4426
4427 /* Insert partially redundant expressions on edges in the CFG to make
4428    the expressions fully redundant.  */
4429
4430 static int
4431 pre_edge_insert (edge_list, index_map)
4432      struct edge_list *edge_list;
4433      struct expr **index_map;
4434 {
4435   int e, i, num_edges, set_size, did_insert = 0;
4436   sbitmap *inserted;
4437
4438   /* Where PRE_INSERT_MAP is nonzero, we add the expression on that edge
4439      if it reaches any of the deleted expressions.  */
4440
4441   set_size = pre_insert_map[0]->size;
4442   num_edges = NUM_EDGES (edge_list);
4443   inserted = sbitmap_vector_alloc (num_edges, n_exprs);
4444   sbitmap_vector_zero (inserted, num_edges);
4445
4446   for (e = 0; e < num_edges; e++)
4447     {
4448       int indx;
4449       basic_block pred = INDEX_EDGE_PRED_BB (edge_list, e);
4450       int bb = pred->index;
4451
4452       for (i = indx = 0; i < set_size; i++, indx += SBITMAP_ELT_BITS)
4453         {
4454           SBITMAP_ELT_TYPE insert = pre_insert_map[e]->elms[i];
4455           int j;
4456
4457           for (j = indx; insert && j < n_exprs; j++, insert >>= 1)
4458             {
4459               if ((insert & 1) != 0 && index_map[j]->reaching_reg != NULL_RTX)
4460                 {
4461                   struct expr *expr = index_map[j];
4462                   struct occr *occr;
4463
4464                   /* Now look at each deleted occurence of this expression.  */
4465                   for (occr = expr->antic_occr; occr != NULL; occr = occr->next)
4466                     {
4467                       if (! occr->deleted_p)
4468                         continue;
4469
4470                       /* Insert this expression on this edge if if it would
4471                          reach the deleted occurence in BB.  */
4472                       if (!TEST_BIT (inserted[e], j)
4473                           && (bb == ENTRY_BLOCK
4474                               || pre_expr_reaches_here_p (bb, expr,
4475                                                    BLOCK_NUM (occr->insn), 0,
4476                                                    NULL)))
4477                         {
4478                           rtx insn;
4479                           edge eg = INDEX_EDGE (edge_list, e);
4480                           /* We can't insert anything on an abnormal
4481                              and critical edge, so we insert the
4482                              insn at the end of the previous block. There
4483                              are several alternatives detailed in
4484                              Morgans book P277 (sec 10.5) for handling
4485                              this situation.  This one is easiest for now.  */
4486
4487                           if ((eg->flags & EDGE_ABNORMAL) == EDGE_ABNORMAL)
4488                             {
4489                               insert_insn_end_bb (index_map[j], bb, 0);
4490                             }
4491                           else
4492                             {
4493                               insn = process_insert_insn (index_map[j]);
4494                               insert_insn_on_edge (insn, eg);
4495                             }
4496                           if (gcse_file)
4497                             {
4498                               fprintf (gcse_file,
4499                                        "PRE/HOIST: edge (%d,%d), copy expression %d\n",
4500                                         bb,
4501                                         INDEX_EDGE_SUCC_BB (edge_list, e)->index, expr->bitmap_index);
4502                             }
4503                           SET_BIT (inserted[e], j);
4504                           did_insert = 1;
4505                           gcse_create_count++;
4506                         }
4507                     }
4508                 }
4509             }
4510         }
4511     }
4512   return did_insert;
4513 }
4514
4515 /* Copy the result of INSN to REG.
4516    INDX is the expression number.  */
4517
4518 static void
4519 pre_insert_copy_insn (expr, insn)
4520      struct expr *expr;
4521      rtx insn;
4522 {
4523   rtx reg = expr->reaching_reg;
4524   int regno = REGNO (reg);
4525   int indx = expr->bitmap_index;
4526   rtx set = single_set (insn);
4527   rtx new_insn;
4528   int bb = BLOCK_NUM (insn);
4529
4530   if (!set)
4531     abort ();
4532   new_insn = emit_insn_after (gen_rtx_SET (VOIDmode, reg, SET_DEST (set)),
4533                               insn);
4534   /* Keep block number table up to date.  */
4535   set_block_num (new_insn, bb);
4536   /* Keep register set table up to date.  */
4537   record_one_set (regno, new_insn);
4538   if (insn == BLOCK_END (bb))
4539     BLOCK_END (bb) = new_insn;
4540
4541   gcse_create_count++;
4542
4543   if (gcse_file)
4544     fprintf (gcse_file,
4545              "PRE: bb %d, insn %d, copy expression %d in insn %d to reg %d\n",
4546               BLOCK_NUM (insn), INSN_UID (new_insn), indx,
4547               INSN_UID (insn), regno);
4548 }
4549
4550 /* Copy available expressions that reach the redundant expression
4551    to `reaching_reg'.  */
4552
4553 static void
4554 pre_insert_copies ()
4555 {
4556   int i, bb;
4557
4558   /* For each available expression in the table, copy the result to
4559      `reaching_reg' if the expression reaches a deleted one.
4560
4561      ??? The current algorithm is rather brute force.
4562      Need to do some profiling.  */
4563
4564   for (i = 0; i < expr_hash_table_size; i++)
4565     {
4566       struct expr *expr;
4567
4568       for (expr = expr_hash_table[i]; expr != NULL; expr = expr->next_same_hash)
4569         {
4570           struct occr *occr;
4571
4572           /* If the basic block isn't reachable, PPOUT will be TRUE.
4573              However, we don't want to insert a copy here because the
4574              expression may not really be redundant.  So only insert
4575              an insn if the expression was deleted.
4576              This test also avoids further processing if the expression
4577              wasn't deleted anywhere.  */
4578           if (expr->reaching_reg == NULL)
4579             continue;
4580
4581           for (occr = expr->antic_occr; occr != NULL; occr = occr->next)
4582             {
4583               struct occr *avail;
4584
4585               if (! occr->deleted_p)
4586                 continue;
4587
4588               for (avail = expr->avail_occr; avail != NULL; avail = avail->next)
4589                 {
4590                   rtx insn = avail->insn;
4591
4592                   /* No need to handle this one if handled already.  */
4593                   if (avail->copied_p)
4594                     continue;
4595                   /* Don't handle this one if it's a redundant one.  */
4596                   if (TEST_BIT (pre_redundant_insns, INSN_CUID (insn)))
4597                     continue;
4598                   /* Or if the expression doesn't reach the deleted one.  */
4599                   if (! pre_expr_reaches_here_p (BLOCK_NUM (avail->insn), expr,
4600                                                  BLOCK_NUM (occr->insn),
4601                                                  1, NULL))
4602                     continue;
4603
4604                   /* Copy the result of avail to reaching_reg.  */
4605                   pre_insert_copy_insn (expr, insn);
4606                   avail->copied_p = 1;
4607                 }
4608             }
4609         }
4610     }
4611 }
4612
4613 /* Delete redundant computations.
4614    Deletion is done by changing the insn to copy the `reaching_reg' of
4615    the expression into the result of the SET.  It is left to later passes
4616    (cprop, cse2, flow, combine, regmove) to propagate the copy or eliminate it.
4617
4618    Returns non-zero if a change is made.  */
4619
4620 static int
4621 pre_delete ()
4622 {
4623   int i, bb, changed;
4624
4625   /* Compute the expressions which are redundant and need to be replaced by
4626      copies from the reaching reg to the target reg.  */
4627   for (bb = 0; bb < n_basic_blocks; bb++)
4628     sbitmap_copy (temp_bitmap[bb], pre_delete_map[bb]);
4629
4630   changed = 0;
4631   for (i = 0; i < expr_hash_table_size; i++)
4632     {
4633       struct expr *expr;
4634
4635       for (expr = expr_hash_table[i]; expr != NULL; expr = expr->next_same_hash)
4636         {
4637           struct occr *occr;
4638           int indx = expr->bitmap_index;
4639
4640           /* We only need to search antic_occr since we require
4641              ANTLOC != 0.  */
4642
4643           for (occr = expr->antic_occr; occr != NULL; occr = occr->next)
4644             {
4645               rtx insn = occr->insn;
4646               rtx set;
4647               int bb = BLOCK_NUM (insn);
4648
4649               if (TEST_BIT (temp_bitmap[bb], indx))
4650                 {
4651                   set = single_set (insn);
4652                   if (! set)
4653                     abort ();
4654
4655                   /* Create a pseudo-reg to store the result of reaching
4656                      expressions into.  Get the mode for the new pseudo
4657                      from the mode of the original destination pseudo.  */
4658                   if (expr->reaching_reg == NULL)
4659                     expr->reaching_reg
4660                       = gen_reg_rtx (GET_MODE (SET_DEST (set)));
4661
4662                   /* In theory this should never fail since we're creating
4663                      a reg->reg copy.
4664
4665                      However, on the x86 some of the movXX patterns actually
4666                      contain clobbers of scratch regs.  This may cause the
4667                      insn created by validate_change to not match any pattern
4668                      and thus cause validate_change to fail.   */
4669                   if (validate_change (insn, &SET_SRC (set),
4670                                        expr->reaching_reg, 0))
4671                     {
4672                       occr->deleted_p = 1;
4673                       SET_BIT (pre_redundant_insns, INSN_CUID (insn));
4674                       changed = 1;
4675                       gcse_subst_count++;
4676                     }
4677
4678                   if (gcse_file)
4679                     {
4680                       fprintf (gcse_file,
4681                                "PRE: redundant insn %d (expression %d) in bb %d, reaching reg is %d\n",
4682                                INSN_UID (insn), indx, bb, REGNO (expr->reaching_reg));
4683                     }
4684                 }
4685             }
4686         }
4687     }
4688
4689   return changed;
4690 }
4691
4692 /* Perform GCSE optimizations using PRE.
4693    This is called by one_pre_gcse_pass after all the dataflow analysis
4694    has been done.
4695
4696    This is based on the original Morel-Renvoise paper Fred Chow's thesis,
4697    and lazy code motion from Knoop, Ruthing and Steffen as described in
4698    Advanced Compiler Design and Implementation.
4699
4700    ??? A new pseudo reg is created to hold the reaching expression.
4701    The nice thing about the classical approach is that it would try to
4702    use an existing reg.  If the register can't be adequately optimized
4703    [i.e. we introduce reload problems], one could add a pass here to
4704    propagate the new register through the block.
4705
4706    ??? We don't handle single sets in PARALLELs because we're [currently]
4707    not able to copy the rest of the parallel when we insert copies to create
4708    full redundancies from partial redundancies.  However, there's no reason
4709    why we can't handle PARALLELs in the cases where there are no partial
4710    redundancies.  */
4711
4712 static int
4713 pre_gcse ()
4714 {
4715   int i, did_insert;
4716   int changed;
4717   struct expr **index_map;
4718
4719   /* Compute a mapping from expression number (`bitmap_index') to
4720      hash table entry.  */
4721
4722   index_map = (struct expr **) alloca (n_exprs * sizeof (struct expr *));
4723   bzero ((char *) index_map, n_exprs * sizeof (struct expr *));
4724   for (i = 0; i < expr_hash_table_size; i++)
4725     {
4726       struct expr *expr;
4727
4728       for (expr = expr_hash_table[i]; expr != NULL; expr = expr->next_same_hash)
4729         index_map[expr->bitmap_index] = expr;
4730     }
4731
4732   /* Reset bitmap used to track which insns are redundant.  */
4733   pre_redundant_insns = sbitmap_alloc (max_cuid);
4734   sbitmap_zero (pre_redundant_insns);
4735
4736   /* Delete the redundant insns first so that
4737      - we know what register to use for the new insns and for the other
4738        ones with reaching expressions
4739      - we know which insns are redundant when we go to create copies  */
4740   changed = pre_delete ();
4741
4742   did_insert = pre_edge_insert (edge_list, index_map);
4743   /* In other places with reaching expressions, copy the expression to the
4744      specially allocated pseudo-reg that reaches the redundant expr.  */
4745   pre_insert_copies ();
4746   if (did_insert)
4747     {
4748       commit_edge_insertions ();
4749       changed = 1;
4750     }
4751
4752   free (pre_redundant_insns);
4753
4754   return changed;
4755 }
4756
4757 /* Top level routine to perform one PRE GCSE pass.
4758
4759    Return non-zero if a change was made.  */
4760
4761 static int
4762 one_pre_gcse_pass (pass)
4763      int pass;
4764 {
4765   int changed = 0;
4766
4767   gcse_subst_count = 0;
4768   gcse_create_count = 0;
4769
4770   alloc_expr_hash_table (max_cuid);
4771   add_noreturn_fake_exit_edges ();
4772   compute_expr_hash_table ();
4773   if (gcse_file)
4774     dump_hash_table (gcse_file, "Expression", expr_hash_table,
4775                      expr_hash_table_size, n_exprs);
4776   if (n_exprs > 0)
4777     {
4778       alloc_pre_mem (n_basic_blocks, n_exprs);
4779       compute_pre_data ();
4780       changed |= pre_gcse ();
4781       free_edge_list (edge_list);
4782       free_pre_mem ();
4783     }
4784   remove_fake_edges ();
4785   free_expr_hash_table ();
4786
4787   if (gcse_file)
4788     {
4789       fprintf (gcse_file, "\n");
4790       fprintf (gcse_file, "PRE GCSE of %s, pass %d: %d bytes needed, %d substs, %d insns created\n",
4791                current_function_name, pass,
4792                bytes_used, gcse_subst_count, gcse_create_count);
4793     }
4794
4795   return changed;
4796 }
4797 \f
4798 /* If X contains any LABEL_REF's, add REG_LABEL notes for them to INSN.
4799    We have to add REG_LABEL notes, because the following loop optimization
4800    pass requires them.  */
4801
4802 /* ??? This is very similar to the loop.c add_label_notes function.  We
4803    could probably share code here.  */
4804
4805 /* ??? If there was a jump optimization pass after gcse and before loop,
4806    then we would not need to do this here, because jump would add the
4807    necessary REG_LABEL notes.  */
4808
4809 static void
4810 add_label_notes (x, insn)
4811      rtx x;
4812      rtx insn;
4813 {
4814   enum rtx_code code = GET_CODE (x);
4815   int i, j;
4816   const char *fmt;
4817
4818   if (code == LABEL_REF && !LABEL_REF_NONLOCAL_P (x))
4819     {
4820       /* This code used to ignore labels that referred to dispatch tables to
4821          avoid flow generating (slighly) worse code.
4822
4823          We no longer ignore such label references (see LABEL_REF handling in
4824          mark_jump_label for additional information).  */
4825       REG_NOTES (insn) = gen_rtx_EXPR_LIST (REG_LABEL, XEXP (x, 0),
4826                                             REG_NOTES (insn));
4827       return;
4828     }
4829
4830   fmt = GET_RTX_FORMAT (code);
4831   for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
4832     {
4833       if (fmt[i] == 'e')
4834         add_label_notes (XEXP (x, i), insn);
4835       else if (fmt[i] == 'E')
4836         for (j = XVECLEN (x, i) - 1; j >= 0; j--)
4837           add_label_notes (XVECEXP (x, i, j), insn);
4838     }
4839 }
4840
4841 /* Compute transparent outgoing information for each block.
4842
4843    An expression is transparent to an edge unless it is killed by
4844    the edge itself.  This can only happen with abnormal control flow,
4845    when the edge is traversed through a call.  This happens with
4846    non-local labels and exceptions.
4847
4848    This would not be necessary if we split the edge.  While this is
4849    normally impossible for abnormal critical edges, with some effort
4850    it should be possible with exception handling, since we still have
4851    control over which handler should be invoked.  But due to increased
4852    EH table sizes, this may not be worthwhile.  */
4853
4854 static void
4855 compute_transpout ()
4856 {
4857   int bb;
4858
4859   sbitmap_vector_ones (transpout, n_basic_blocks);
4860
4861   for (bb = 0; bb < n_basic_blocks; ++bb)
4862     {
4863       int i;
4864
4865       /* Note that flow inserted a nop a the end of basic blocks that
4866          end in call instructions for reasons other than abnormal
4867          control flow.  */
4868       if (GET_CODE (BLOCK_END (bb)) != CALL_INSN)
4869         continue;
4870
4871       for (i = 0; i < expr_hash_table_size; i++)
4872         {
4873           struct expr *expr;
4874           for (expr = expr_hash_table[i]; expr ; expr = expr->next_same_hash)
4875             if (GET_CODE (expr->expr) == MEM)
4876               {
4877                 rtx addr = XEXP (expr->expr, 0);
4878
4879                 if (GET_CODE (addr) == SYMBOL_REF
4880                     && CONSTANT_POOL_ADDRESS_P (addr))
4881                   continue;
4882
4883                 /* ??? Optimally, we would use interprocedural alias
4884                    analysis to determine if this mem is actually killed
4885                    by this call.  */
4886                 RESET_BIT (transpout[bb], expr->bitmap_index);
4887               }
4888         }
4889     }
4890 }
4891
4892 /* Removal of useless null pointer checks */
4893
4894 /* These need to be file static for communication between
4895    invalidate_nonnull_info and delete_null_pointer_checks.  */
4896 static int current_block;
4897 static sbitmap *nonnull_local;
4898 static sbitmap *nonnull_killed;
4899
4900 /* Called via note_stores.  X is set by SETTER.  If X is a register we must
4901    invalidate nonnull_local and set nonnull_killed.
4902
4903    We ignore hard registers.  */
4904 static void
4905 invalidate_nonnull_info (x, setter)
4906      rtx x;
4907      rtx setter ATTRIBUTE_UNUSED;
4908 {
4909   int offset, regno;
4910
4911   offset = 0;
4912   while (GET_CODE (x) == SUBREG)
4913     x = SUBREG_REG (x);
4914
4915   /* Ignore anything that is not a register or is a hard register.  */
4916   if (GET_CODE (x) != REG
4917       || REGNO (x) < FIRST_PSEUDO_REGISTER)
4918     return;
4919
4920   regno = REGNO (x);
4921
4922   RESET_BIT (nonnull_local[current_block], regno);
4923   SET_BIT (nonnull_killed[current_block], regno);
4924
4925 }
4926
4927 /* Find EQ/NE comparisons against zero which can be (indirectly) evaluated
4928    at compile time.
4929
4930    This is conceptually similar to global constant/copy propagation and
4931    classic global CSE (it even uses the same dataflow equations as cprop).
4932
4933    If a register is used as memory address with the form (mem (reg)), then we
4934    know that REG can not be zero at that point in the program.  Any instruction
4935    which sets REG "kills" this property.
4936
4937    So, if every path leading to a conditional branch has an available memory
4938    reference of that form, then we know the register can not have the value
4939    zero at the conditional branch.
4940
4941    So we merely need to compute the local properies and propagate that data
4942    around the cfg, then optimize where possible.
4943
4944    We run this pass two times.  Once before CSE, then again after CSE.  This
4945    has proven to be the most profitable approach.  It is rare for new
4946    optimization opportunities of this nature to appear after the first CSE
4947    pass.
4948
4949    This could probably be integrated with global cprop with a little work.  */
4950
4951 void
4952 delete_null_pointer_checks (f)
4953      rtx f;
4954 {
4955   int_list_ptr *s_preds, *s_succs;
4956   int *num_preds, *num_succs;
4957   int changed, bb;
4958   sbitmap *nonnull_avin, *nonnull_avout;
4959
4960   /* First break the program into basic blocks.  */
4961   find_basic_blocks (f, max_reg_num (), NULL, 1);
4962
4963   /* If we have only a single block, then there's nothing to do.  */
4964   if (n_basic_blocks <= 1)
4965     {
4966       /* Free storage allocated by find_basic_blocks.  */
4967       free_basic_block_vars (0);
4968       return;
4969     }
4970
4971   /* Trying to perform global optimizations on flow graphs which have
4972      a high connectivity will take a long time and is unlikely to be
4973      particularly useful.
4974
4975      In normal circumstances a cfg should have about twice has many edges
4976      as blocks.  But we do not want to punish small functions which have
4977      a couple switch statements.  So we require a relatively large number
4978      of basic blocks and the ratio of edges to blocks to be high.  */
4979   if (n_basic_blocks > 1000 && n_edges / n_basic_blocks >= 20)
4980     {
4981       /* Free storage allocated by find_basic_blocks.  */
4982       free_basic_block_vars (0);
4983       return;
4984     }
4985
4986   /* We need predecessor/successor lists as well as pred/succ counts for
4987      each basic block.  */
4988   s_preds = (int_list_ptr *) alloca (n_basic_blocks * sizeof (int_list_ptr));
4989   s_succs = (int_list_ptr *) alloca (n_basic_blocks * sizeof (int_list_ptr));
4990   num_preds = (int *) alloca (n_basic_blocks * sizeof (int));
4991   num_succs = (int *) alloca (n_basic_blocks * sizeof (int));
4992   compute_preds_succs (s_preds, s_succs, num_preds, num_succs);
4993
4994   /* Allocate bitmaps to hold local and global properties.  */
4995   nonnull_local = sbitmap_vector_alloc (n_basic_blocks, max_reg_num ());
4996   nonnull_killed = sbitmap_vector_alloc (n_basic_blocks, max_reg_num ());
4997   nonnull_avin = sbitmap_vector_alloc (n_basic_blocks, max_reg_num ());
4998   nonnull_avout = sbitmap_vector_alloc (n_basic_blocks, max_reg_num ());
4999
5000   /* Compute local properties, nonnull and killed.  A register will have
5001      the nonnull property if at the end of the current block its value is
5002      known to be nonnull.  The killed property indicates that somewhere in
5003      the block any information we had about the register is killed.
5004
5005      Note that a register can have both properties in a single block.  That
5006      indicates that it's killed, then later in the block a new value is
5007      computed.  */
5008   sbitmap_vector_zero (nonnull_local, n_basic_blocks);
5009   sbitmap_vector_zero (nonnull_killed, n_basic_blocks);
5010   for (current_block = 0; current_block < n_basic_blocks; current_block++)
5011     {
5012       rtx insn, stop_insn;
5013
5014       /* Scan each insn in the basic block looking for memory references and
5015          register sets.  */
5016       stop_insn = NEXT_INSN (BLOCK_END (current_block));
5017       for (insn = BLOCK_HEAD (current_block);
5018            insn != stop_insn;
5019            insn = NEXT_INSN (insn))
5020         {
5021           rtx set;
5022
5023           /* Ignore anything that is not a normal insn.  */
5024           if (GET_RTX_CLASS (GET_CODE (insn)) != 'i')
5025             continue;
5026
5027           /* Basically ignore anything that is not a simple SET.  We do have
5028              to make sure to invalidate nonnull_local and set nonnull_killed
5029              for such insns though.  */
5030           set = single_set (insn);
5031           if (!set)
5032             {
5033               note_stores (PATTERN (insn), invalidate_nonnull_info);
5034               continue;
5035             }
5036
5037           /* See if we've got a useable memory load.  We handle it first
5038              in case it uses its address register as a dest (which kills
5039              the nonnull property).  */
5040           if (GET_CODE (SET_SRC (set)) == MEM
5041               && GET_CODE (XEXP (SET_SRC (set), 0)) == REG
5042               && REGNO (XEXP (SET_SRC (set), 0)) >= FIRST_PSEUDO_REGISTER)
5043             SET_BIT (nonnull_local[current_block],
5044                      REGNO (XEXP (SET_SRC (set), 0)));
5045
5046           /* Now invalidate stuff clobbered by this insn.  */
5047           note_stores (PATTERN (insn), invalidate_nonnull_info);
5048
5049           /* And handle stores, we do these last since any sets in INSN can
5050              not kill the nonnull property if it is derived from a MEM
5051              appearing in a SET_DEST.  */
5052           if (GET_CODE (SET_DEST (set)) == MEM
5053               && GET_CODE (XEXP (SET_DEST (set), 0)) == REG)
5054             SET_BIT (nonnull_local[current_block],
5055                      REGNO (XEXP (SET_DEST (set), 0)));
5056         }
5057     }
5058
5059   /* Now compute global properties based on the local properties.   This
5060      is a classic global availablity algorithm.  */
5061   sbitmap_zero (nonnull_avin[0]);
5062   sbitmap_vector_ones (nonnull_avout, n_basic_blocks);
5063   changed = 1;
5064   while (changed)
5065     {
5066       changed = 0;
5067
5068       for (bb = 0; bb < n_basic_blocks; bb++)
5069         {
5070           if (bb != 0)
5071             sbitmap_intersect_of_predecessors (nonnull_avin[bb],
5072                                                nonnull_avout, bb, s_preds);
5073
5074           changed |= sbitmap_union_of_diff (nonnull_avout[bb],
5075                                             nonnull_local[bb],
5076                                             nonnull_avin[bb],
5077                                             nonnull_killed[bb]);
5078         }
5079     }
5080
5081   /* Now look at each bb and see if it ends with a compare of a value
5082      against zero.  */
5083   for (bb = 0; bb < n_basic_blocks; bb++)
5084     {
5085       rtx last_insn = BLOCK_END (bb);
5086       rtx condition, earliest, reg;
5087       int compare_and_branch;
5088
5089       /* We only want conditional branches.  */
5090       if (GET_CODE (last_insn) != JUMP_INSN
5091           || !condjump_p (last_insn)
5092           || simplejump_p (last_insn))
5093         continue;
5094
5095       /* LAST_INSN is a conditional jump.  Get its condition.  */
5096       condition = get_condition (last_insn, &earliest);
5097
5098       /* If we were unable to get the condition, or it is not a equality
5099          comparison against zero then there's nothing we can do.  */
5100       if (!condition
5101           || (GET_CODE (condition) != NE && GET_CODE (condition) != EQ)
5102           || GET_CODE (XEXP (condition, 1)) != CONST_INT
5103           || XEXP (condition, 1) != CONST0_RTX (GET_MODE (XEXP (condition, 0))))
5104         continue;
5105
5106       /* We must be checking a register against zero.  */
5107       reg = XEXP (condition, 0);
5108       if (GET_CODE (reg) != REG)
5109         continue;
5110
5111       /* Is the register known to have a nonzero value?  */
5112       if (!TEST_BIT (nonnull_avout[bb], REGNO (reg)))
5113         continue;
5114
5115       /* Try to compute whether the compare/branch at the loop end is one or
5116          two instructions.  */
5117       if (earliest == last_insn)
5118         compare_and_branch = 1;
5119       else if (earliest == prev_nonnote_insn (last_insn))
5120         compare_and_branch = 2;
5121       else
5122         continue;
5123
5124       /* We know the register in this comparison is nonnull at exit from
5125          this block.  We can optimize this comparison.  */
5126       if (GET_CODE (condition) == NE)
5127         {
5128           rtx new_jump;
5129
5130           new_jump = emit_jump_insn_before (gen_jump (JUMP_LABEL (last_insn)),
5131                                             last_insn);
5132           JUMP_LABEL (new_jump) = JUMP_LABEL (last_insn);
5133           LABEL_NUSES (JUMP_LABEL (new_jump))++;
5134           emit_barrier_after (new_jump);
5135         }
5136       delete_insn (last_insn);
5137       if (compare_and_branch == 2)
5138         delete_insn (earliest);
5139     }
5140
5141   /* Free storage allocated by find_basic_blocks.  */
5142   free_basic_block_vars (0);
5143
5144   /* Free bitmaps.  */
5145   free (nonnull_local);
5146   free (nonnull_killed);
5147   free (nonnull_avin);
5148   free (nonnull_avout);
5149 }
5150
5151 /* Code Hoisting variables and subroutines.  */
5152
5153 /* Very busy expressions.  */
5154 static sbitmap *hoist_vbein;
5155 static sbitmap *hoist_vbeout;
5156
5157 /* Hoistable expressions.  */
5158 static sbitmap *hoist_exprs;
5159
5160 /* Dominator bitmaps.  */
5161 static sbitmap *dominators;
5162 static sbitmap *post_dominators;
5163
5164 /* ??? We could compute post dominators and run this algorithm in
5165    reverse to to perform tail merging, doing so would probably be
5166    more effective than the tail merging code in jump.c.
5167
5168    It's unclear if tail merging could be run in parallel with
5169    code hoisting.  It would be nice.  */
5170
5171 /* Allocate vars used for code hoisting analysis.  */
5172
5173 static void
5174 alloc_code_hoist_mem (n_blocks, n_exprs)
5175      int n_blocks, n_exprs;
5176 {
5177   antloc = sbitmap_vector_alloc (n_blocks, n_exprs);
5178   transp = sbitmap_vector_alloc (n_blocks, n_exprs);
5179   comp = sbitmap_vector_alloc (n_blocks, n_exprs);
5180
5181   hoist_vbein = sbitmap_vector_alloc (n_blocks, n_exprs);
5182   hoist_vbeout = sbitmap_vector_alloc (n_blocks, n_exprs);
5183   hoist_exprs = sbitmap_vector_alloc (n_blocks, n_exprs);
5184   transpout = sbitmap_vector_alloc (n_blocks, n_exprs);
5185
5186   dominators = sbitmap_vector_alloc (n_blocks, n_blocks);
5187   post_dominators = sbitmap_vector_alloc (n_blocks, n_blocks);
5188 }
5189
5190 /* Free vars used for code hoisting analysis.  */
5191
5192 static void
5193 free_code_hoist_mem ()
5194 {
5195   free (antloc);
5196   free (transp);
5197   free (comp);
5198
5199   free (hoist_vbein);
5200   free (hoist_vbeout);
5201   free (hoist_exprs);
5202   free (transpout);
5203
5204   free (dominators);
5205   free (post_dominators);
5206 }
5207
5208 /* Compute the very busy expressions at entry/exit from each block.
5209
5210    An expression is very busy if all paths from a given point
5211    compute the expression.  */
5212
5213 static void
5214 compute_code_hoist_vbeinout ()
5215 {
5216   int bb, changed, passes;
5217
5218   sbitmap_vector_zero (hoist_vbeout, n_basic_blocks);
5219   sbitmap_vector_zero (hoist_vbein, n_basic_blocks);
5220
5221   passes = 0;
5222   changed = 1;
5223   while (changed)
5224     {
5225       changed = 0;
5226       /* We scan the blocks in the reverse order to speed up
5227          the convergence.  */
5228       for (bb = n_basic_blocks - 1; bb >= 0; bb--)
5229         {
5230           changed |= sbitmap_a_or_b_and_c (hoist_vbein[bb], antloc[bb],
5231                                            hoist_vbeout[bb], transp[bb]);
5232           if (bb != n_basic_blocks - 1)
5233             sbitmap_intersection_of_succs (hoist_vbeout[bb], hoist_vbein, bb);
5234         }
5235       passes++;
5236     }
5237
5238   if (gcse_file)
5239     fprintf (gcse_file, "hoisting vbeinout computation: %d passes\n", passes);
5240 }
5241
5242 /* Top level routine to do the dataflow analysis needed by code hoisting.  */
5243
5244 static void
5245 compute_code_hoist_data ()
5246 {
5247   compute_local_properties (transp, comp, antloc, 0);
5248   compute_transpout ();
5249   compute_code_hoist_vbeinout ();
5250   compute_flow_dominators (dominators, post_dominators);
5251   if (gcse_file)
5252     fprintf (gcse_file, "\n");
5253 }
5254
5255 /* Determine if the expression identified by EXPR_INDEX would
5256    reach BB unimpared if it was placed at the end of EXPR_BB.
5257
5258    It's unclear exactly what Muchnick meant by "unimpared".  It seems
5259    to me that the expression must either be computed or transparent in
5260    *every* block in the path(s) from EXPR_BB to BB.  Any other definition
5261    would allow the expression to be hoisted out of loops, even if
5262    the expression wasn't a loop invariant.
5263
5264    Contrast this to reachability for PRE where an expression is
5265    considered reachable if *any* path reaches instead of *all*
5266    paths.  */
5267
5268 static int
5269 hoist_expr_reaches_here_p (expr_bb, expr_index, bb, visited)
5270      int expr_bb;
5271      int expr_index;
5272      int bb;
5273      char *visited;
5274 {
5275   edge pred;
5276
5277   if (visited == NULL)
5278     {
5279       visited = (char *) alloca (n_basic_blocks);
5280       bzero (visited, n_basic_blocks);
5281     }
5282
5283   visited[expr_bb] = 1;
5284   for (pred = BASIC_BLOCK (bb)->pred; pred != NULL; pred = pred->pred_next)
5285     {
5286       int pred_bb = pred->src->index;
5287
5288       if (pred->src == ENTRY_BLOCK_PTR)
5289         break;
5290       else if (visited[pred_bb])
5291         continue;
5292       /* Does this predecessor generate this expression?  */
5293       else if (TEST_BIT (comp[pred_bb], expr_index))
5294         break;
5295       else if (! TEST_BIT (transp[pred_bb], expr_index))
5296         break;
5297       /* Not killed.  */
5298       else
5299         {
5300           visited[pred_bb] = 1;
5301           if (! hoist_expr_reaches_here_p (expr_bb, expr_index,
5302                                            pred_bb, visited))
5303             break;
5304         }
5305     }
5306
5307   return (pred == NULL);
5308 }
5309 \f
5310 /* Actually perform code hoisting.  */
5311 static void
5312 hoist_code ()
5313 {
5314   int bb, dominated, i;
5315   struct expr **index_map;
5316
5317   sbitmap_vector_zero (hoist_exprs, n_basic_blocks);
5318
5319   /* Compute a mapping from expression number (`bitmap_index') to
5320      hash table entry.  */
5321
5322   index_map = (struct expr **) alloca (n_exprs * sizeof (struct expr *));
5323   bzero ((char *) index_map, n_exprs * sizeof (struct expr *));
5324   for (i = 0; i < expr_hash_table_size; i++)
5325     {
5326       struct expr *expr;
5327
5328       for (expr = expr_hash_table[i]; expr != NULL; expr = expr->next_same_hash)
5329         index_map[expr->bitmap_index] = expr;
5330     }
5331
5332   /* Walk over each basic block looking for potentially hoistable
5333      expressions, nothing gets hoisted from the entry block.  */
5334   for (bb = 0; bb < n_basic_blocks; bb++)
5335     {
5336       int found = 0;
5337       int insn_inserted_p;
5338
5339       /* Examine each expression that is very busy at the exit of this
5340          block.  These are the potentially hoistable expressions.  */
5341       for (i = 0; i < hoist_vbeout[bb]->n_bits; i++)
5342         {
5343           int hoistable = 0;
5344           if (TEST_BIT (hoist_vbeout[bb], i)
5345               && TEST_BIT (transpout[bb], i))
5346             {
5347               /* We've found a potentially hoistable expression, now
5348                  we look at every block BB dominates to see if it
5349                  computes the expression.  */
5350               for (dominated = 0; dominated < n_basic_blocks; dominated++)
5351                 {
5352                   /* Ignore self dominance.  */
5353                   if (bb == dominated
5354                       || ! TEST_BIT (dominators[dominated], bb))
5355                     continue;
5356
5357                   /* We've found a dominated block, now see if it computes
5358                      the busy expression and whether or not moving that
5359                      expression to the "beginning" of that block is safe.  */
5360                   if (!TEST_BIT (antloc[dominated], i))
5361                     continue;
5362
5363                   /* Note if the expression would reach the dominated block
5364                      unimpared if it was placed at the end of BB.
5365
5366                      Keep track of how many times this expression is hoistable
5367                      from a dominated block into BB.  */
5368                   if (hoist_expr_reaches_here_p (bb, i, dominated, NULL))
5369                     hoistable++;
5370                 }
5371
5372               /* If we found more than one hoistable occurence of this
5373                  expression, then note it in the bitmap of expressions to
5374                  hoist.  It makes no sense to hoist things which are computed
5375                  in only one BB, and doing so tends to pessimize register
5376                  allocation.  One could increase this value to try harder
5377                  to avoid any possible code expansion due to register
5378                  allocation issues; however experiments have shown that
5379                  the vast majority of hoistable expressions are only movable
5380                  from two successors, so raising this threshhold is likely
5381                  to nullify any benefit we get from code hoisting.  */
5382               if (hoistable > 1)
5383                 {
5384                   SET_BIT (hoist_exprs[bb], i);
5385                   found = 1;
5386                 }
5387             }
5388         }
5389
5390       /* If we found nothing to hoist, then quit now.  */
5391       if (! found)
5392         continue;
5393
5394       /* Loop over all the hoistable expressions.  */
5395       for (i = 0; i < hoist_exprs[bb]->n_bits; i++)
5396         {
5397           /* We want to insert the expression into BB only once, so
5398              note when we've inserted it.  */
5399           insn_inserted_p = 0;
5400
5401           /* These tests should be the same as the tests above.  */
5402           if (TEST_BIT (hoist_vbeout[bb], i))
5403             {
5404               /* We've found a potentially hoistable expression, now
5405                  we look at every block BB dominates to see if it
5406                  computes the expression.  */
5407               for (dominated = 0; dominated < n_basic_blocks; dominated++)
5408                 {
5409                   /* Ignore self dominance.  */
5410                   if (bb == dominated
5411                       || ! TEST_BIT (dominators[dominated], bb))
5412                     continue;
5413
5414                   /* We've found a dominated block, now see if it computes
5415                      the busy expression and whether or not moving that
5416                      expression to the "beginning" of that block is safe.  */
5417                   if (!TEST_BIT (antloc[dominated], i))
5418                     continue;
5419
5420                   /* The expression is computed in the dominated block and
5421                      it would be safe to compute it at the start of the
5422                      dominated block.  Now we have to determine if the
5423                      expresion would reach the dominated block if it was
5424                      placed at the end of BB.  */
5425                   if (hoist_expr_reaches_here_p (bb, i, dominated, NULL))
5426                     {
5427                       struct expr *expr = index_map[i];
5428                       struct occr *occr = expr->antic_occr;
5429                       rtx insn;
5430                       rtx set;
5431
5432
5433                       /* Find the right occurence of this expression.  */
5434                       while (BLOCK_NUM (occr->insn) != dominated && occr)
5435                         occr = occr->next;
5436
5437                       /* Should never happen.  */
5438                       if (!occr)
5439                         abort ();
5440
5441                       insn = occr->insn;
5442
5443                       set = single_set (insn);
5444                       if (! set)
5445                         abort ();
5446
5447                       /* Create a pseudo-reg to store the result of reaching
5448                          expressions into.  Get the mode for the new pseudo
5449                          from the mode of the original destination pseudo.  */
5450                       if (expr->reaching_reg == NULL)
5451                         expr->reaching_reg
5452                           = gen_reg_rtx (GET_MODE (SET_DEST (set)));
5453
5454                       /* In theory this should never fail since we're creating
5455                          a reg->reg copy.
5456
5457                          However, on the x86 some of the movXX patterns actually
5458                          contain clobbers of scratch regs.  This may cause the
5459                          insn created by validate_change to not match any
5460                          pattern and thus cause validate_change to fail.   */
5461                       if (validate_change (insn, &SET_SRC (set),
5462                                            expr->reaching_reg, 0))
5463                         {
5464                           occr->deleted_p = 1;
5465                           if (!insn_inserted_p)
5466                             {
5467                               insert_insn_end_bb (index_map[i], bb, 0);
5468                               insn_inserted_p = 1;
5469                             }
5470                         }
5471                     }
5472                 }
5473             }
5474         }
5475     }
5476 }
5477
5478 /* Top level routine to perform one code hoisting (aka unification) pass
5479
5480    Return non-zero if a change was made.  */
5481
5482 static int
5483 one_code_hoisting_pass ()
5484 {
5485   int changed = 0;
5486
5487   alloc_expr_hash_table (max_cuid);
5488   compute_expr_hash_table ();
5489   if (gcse_file)
5490     dump_hash_table (gcse_file, "Code Hosting Expressions", expr_hash_table,
5491                      expr_hash_table_size, n_exprs);
5492   if (n_exprs > 0)
5493     {
5494       alloc_code_hoist_mem (n_basic_blocks, n_exprs);
5495       compute_code_hoist_data ();
5496       hoist_code ();
5497       free_code_hoist_mem ();
5498     }
5499   free_expr_hash_table ();
5500
5501   return changed;
5502 }