gcc/tree-ssa-threadupdate.c

   1 /* Thread edges through blocks and update the control flow and SSA graphs.
   2    Copyright (C) 2004-2017 Free Software Foundation, Inc.
   3
   4 This file is part of GCC.
   5
   6 GCC is free software; you can redistribute it and/or modify
   7 it under the terms of the GNU General Public License as published by
   8 the Free Software Foundation; either version 3, or (at your option)
   9 any later version.
  10
  11 GCC is distributed in the hope that it will be useful,
  12 but WITHOUT ANY WARRANTY; without even the implied warranty of
  13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  14 GNU General Public License for more details.
  15
  16 You should have received a copy of the GNU General Public License
  17 along with GCC; see the file COPYING3.  If not see
  18 <http://www.gnu.org/licenses/>.  */
  19
  20 #include "config.h"
  21 #include "system.h"
  22 #include "coretypes.h"
  23 #include "backend.h"
  24 #include "tree.h"
  25 #include "gimple.h"
  26 #include "cfghooks.h"
  27 #include "tree-pass.h"
  28 #include "ssa.h"
  29 #include "fold-const.h"
  30 #include "cfganal.h"
  31 #include "gimple-iterator.h"
  32 #include "tree-ssa.h"
  33 #include "tree-ssa-threadupdate.h"
  34 #include "cfgloop.h"
  35 #include "dbgcnt.h"
  36 #include "tree-cfg.h"
  37 #include "tree-vectorizer.h"
  38
  39 /* Given a block B, update the CFG and SSA graph to reflect redirecting
  40    one or more in-edges to B to instead reach the destination of an
  41    out-edge from B while preserving any side effects in B.
  42
  43    i.e., given A->B and B->C, change A->B to be A->C yet still preserve the
  44    side effects of executing B.
  45
  46      1. Make a copy of B (including its outgoing edges and statements).  Call
  47         the copy B'.  Note B' has no incoming edges or PHIs at this time.
  48
  49      2. Remove the control statement at the end of B' and all outgoing edges
  50         except B'->C.
  51
  52      3. Add a new argument to each PHI in C with the same value as the existing
  53         argument associated with edge B->C.  Associate the new PHI arguments
  54         with the edge B'->C.
  55
  56      4. For each PHI in B, find or create a PHI in B' with an identical
  57         PHI_RESULT.  Add an argument to the PHI in B' which has the same
  58         value as the PHI in B associated with the edge A->B.  Associate
  59         the new argument in the PHI in B' with the edge A->B.
  60
  61      5. Change the edge A->B to A->B'.
  62
  63         5a. This automatically deletes any PHI arguments associated with the
  64             edge A->B in B.
  65
  66         5b. This automatically associates each new argument added in step 4
  67             with the edge A->B'.
  68
  69      6. Repeat for other incoming edges into B.
  70
  71      7. Put the duplicated resources in B and all the B' blocks into SSA form.
  72
  73    Note that block duplication can be minimized by first collecting the
  74    set of unique destination blocks that the incoming edges should
  75    be threaded to.
  76
  77    We reduce the number of edges and statements we create by not copying all
  78    the outgoing edges and the control statement in step #1.  We instead create
  79    a template block without the outgoing edges and duplicate the template.
  80
  81    Another case this code handles is threading through a "joiner" block.  In
  82    this case, we do not know the destination of the joiner block, but one
  83    of the outgoing edges from the joiner block leads to a threadable path.  This
  84    case largely works as outlined above, except the duplicate of the joiner
  85    block still contains a full set of outgoing edges and its control statement.
  86    We just redirect one of its outgoing edges to our jump threading path.  */
  87
  88
  89 /* Steps #5 and #6 of the above algorithm are best implemented by walking
  90    all the incoming edges which thread to the same destination edge at
  91    the same time.  That avoids lots of table lookups to get information
  92    for the destination edge.
  93
  94    To realize that implementation we create a list of incoming edges
  95    which thread to the same outgoing edge.  Thus to implement steps
  96    #5 and #6 we traverse our hash table of outgoing edge information.
  97    For each entry we walk the list of incoming edges which thread to
  98    the current outgoing edge.  */
  99
 100 struct el
 101 {
 102   edge e;
 103   struct el *next;
 104 };
 105
 106 /* Main data structure recording information regarding B's duplicate
 107    blocks.  */
 108
 109 /* We need to efficiently record the unique thread destinations of this
 110    block and specific information associated with those destinations.  We
 111    may have many incoming edges threaded to the same outgoing edge.  This
 112    can be naturally implemented with a hash table.  */
 113
 114 struct redirection_data : free_ptr_hash<redirection_data>
 115 {
 116   /* We support wiring up two block duplicates in a jump threading path.
 117
 118      One is a normal block copy where we remove the control statement
 119      and wire up its single remaining outgoing edge to the thread path.
 120
 121      The other is a joiner block where we leave the control statement
 122      in place, but wire one of the outgoing edges to a thread path.
 123
 124      In theory we could have multiple block duplicates in a jump
 125      threading path, but I haven't tried that.
 126
 127      The duplicate blocks appear in this array in the same order in
 128      which they appear in the jump thread path.  */
 129   basic_block dup_blocks[2];
 130
 131   /* The jump threading path.  */
 132   vec<jump_thread_edge *> *path;
 133
 134   /* A list of incoming edges which we want to thread to the
 135      same path.  */
 136   struct el *incoming_edges;
 137
 138   /* hash_table support.  */
 139   static inline hashval_t hash (const redirection_data *);
 140   static inline int equal (const redirection_data *, const redirection_data *);
 141 };
 142
 143 /* Dump a jump threading path, including annotations about each
 144    edge in the path.  */
 145
 146 static void
 147 dump_jump_thread_path (FILE *dump_file, vec<jump_thread_edge *> path,
 148                        bool registering)
 149 {
 150   fprintf (dump_file,
 151            "  %s%s jump thread: (%d, %d) incoming edge; ",
 152            (registering ? "Registering" : "Cancelling"),
 153            (path[0]->type == EDGE_FSM_THREAD ? " FSM": ""),
 154            path[0]->e->src->index, path[0]->e->dest->index);
 155
 156   for (unsigned int i = 1; i < path.length (); i++)
 157     {
 158       /* We can get paths with a NULL edge when the final destination
 159          of a jump thread turns out to be a constant address.  We dump
 160          those paths when debugging, so we have to be prepared for that
 161          possibility here.  */
 162       if (path[i]->e == NULL)
 163         continue;
 164
 165       if (path[i]->type == EDGE_COPY_SRC_JOINER_BLOCK)
 166         fprintf (dump_file, " (%d, %d) joiner; ",
 167                  path[i]->e->src->index, path[i]->e->dest->index);
 168       if (path[i]->type == EDGE_COPY_SRC_BLOCK)
 169        fprintf (dump_file, " (%d, %d) normal;",
 170                  path[i]->e->src->index, path[i]->e->dest->index);
 171       if (path[i]->type == EDGE_NO_COPY_SRC_BLOCK)
 172        fprintf (dump_file, " (%d, %d) nocopy;",
 173                  path[i]->e->src->index, path[i]->e->dest->index);
 174       if (path[0]->type == EDGE_FSM_THREAD)
 175         fprintf (dump_file, " (%d, %d) ",
 176                  path[i]->e->src->index, path[i]->e->dest->index);
 177     }
 178   fputc ('\n', dump_file);
 179 }
 180
 181 /* Simple hashing function.  For any given incoming edge E, we're going
 182    to be most concerned with the final destination of its jump thread
 183    path.  So hash on the block index of the final edge in the path.  */
 184
 185 inline hashval_t
 186 redirection_data::hash (const redirection_data *p)
 187 {
 188   vec<jump_thread_edge *> *path = p->path;
 189   return path->last ()->e->dest->index;
 190 }
 191
 192 /* Given two hash table entries, return true if they have the same
 193    jump threading path.  */
 194 inline int
 195 redirection_data::equal (const redirection_data *p1, const redirection_data *p2)
 196 {
 197   vec<jump_thread_edge *> *path1 = p1->path;
 198   vec<jump_thread_edge *> *path2 = p2->path;
 199
 200   if (path1->length () != path2->length ())
 201     return false;
 202
 203   for (unsigned int i = 1; i < path1->length (); i++)
 204     {
 205       if ((*path1)[i]->type != (*path2)[i]->type
 206           || (*path1)[i]->e != (*path2)[i]->e)
 207         return false;
 208     }
 209
 210   return true;
 211 }
 212
 213 /* Rather than search all the edges in jump thread paths each time
 214    DOM is able to simply if control statement, we build a hash table
 215    with the deleted edges.  We only care about the address of the edge,
 216    not its contents.  */
 217 struct removed_edges : nofree_ptr_hash<edge_def>
 218 {
 219   static hashval_t hash (edge e) { return htab_hash_pointer (e); }
 220   static bool equal (edge e1, edge e2) { return e1 == e2; }
 221 };
 222
 223 static hash_table<removed_edges> *removed_edges;
 224
 225 /* Data structure of information to pass to hash table traversal routines.  */
 226 struct ssa_local_info_t
 227 {
 228   /* The current block we are working on.  */
 229   basic_block bb;
 230
 231   /* We only create a template block for the first duplicated block in a
 232      jump threading path as we may need many duplicates of that block.
 233
 234      The second duplicate block in a path is specific to that path.  Creating
 235      and sharing a template for that block is considerably more difficult.  */
 236   basic_block template_block;
 237
 238   /* Blocks duplicated for the thread.  */
 239   bitmap duplicate_blocks;
 240
 241   /* TRUE if we thread one or more jumps, FALSE otherwise.  */
 242   bool jumps_threaded;
 243
 244   /* When we have multiple paths through a joiner which reach different
 245      final destinations, then we may need to correct for potential
 246      profile insanities.  */
 247   bool need_profile_correction;
 248 };
 249
 250 /* Passes which use the jump threading code register jump threading
 251    opportunities as they are discovered.  We keep the registered
 252    jump threading opportunities in this vector as edge pairs
 253    (original_edge, target_edge).  */
 254 static vec<vec<jump_thread_edge *> *> paths;
 255
 256 /* When we start updating the CFG for threading, data necessary for jump
 257    threading is attached to the AUX field for the incoming edge.  Use these
 258    macros to access the underlying structure attached to the AUX field.  */
 259 #define THREAD_PATH(E) ((vec<jump_thread_edge *> *)(E)->aux)
 260
 261 /* Jump threading statistics.  */
 262
 263 struct thread_stats_d
 264 {
 265   unsigned long num_threaded_edges;
 266 };
 267
 268 struct thread_stats_d thread_stats;
 269
 270
 271 /* Remove the last statement in block BB if it is a control statement
 272    Also remove all outgoing edges except the edge which reaches DEST_BB.
 273    If DEST_BB is NULL, then remove all outgoing edges.  */
 274
 275 void
 276 remove_ctrl_stmt_and_useless_edges (basic_block bb, basic_block dest_bb)
 277 {
 278   gimple_stmt_iterator gsi;
 279   edge e;
 280   edge_iterator ei;
 281
 282   gsi = gsi_last_bb (bb);
 283
 284   /* If the duplicate ends with a control statement, then remove it.
 285
 286      Note that if we are duplicating the template block rather than the
 287      original basic block, then the duplicate might not have any real
 288      statements in it.  */
 289   if (!gsi_end_p (gsi)
 290       && gsi_stmt (gsi)
 291       && (gimple_code (gsi_stmt (gsi)) == GIMPLE_COND
 292           || gimple_code (gsi_stmt (gsi)) == GIMPLE_GOTO
 293           || gimple_code (gsi_stmt (gsi)) == GIMPLE_SWITCH))
 294     gsi_remove (&gsi, true);
 295
 296   for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
 297     {
 298       if (e->dest != dest_bb)
 299         {
 300           free_dom_edge_info (e);
 301           remove_edge (e);
 302         }
 303       else
 304         {
 305           e->probability = REG_BR_PROB_BASE;
 306           e->count = bb->count;
 307           ei_next (&ei);
 308         }
 309     }
 310
 311   /* If the remaining edge is a loop exit, there must have
 312      a removed edge that was not a loop exit.
 313
 314      In that case BB and possibly other blocks were previously
 315      in the loop, but are now outside the loop.  Thus, we need
 316      to update the loop structures.  */
 317   if (single_succ_p (bb)
 318       && loop_outer (bb->loop_father)
 319       && loop_exit_edge_p (bb->loop_father, single_succ_edge (bb)))
 320     loops_state_set (LOOPS_NEED_FIXUP);
 321 }
 322
 323 /* Create a duplicate of BB.  Record the duplicate block in an array
 324    indexed by COUNT stored in RD.  */
 325
 326 static void
 327 create_block_for_threading (basic_block bb,
 328                             struct redirection_data *rd,
 329                             unsigned int count,
 330                             bitmap *duplicate_blocks)
 331 {
 332   edge_iterator ei;
 333   edge e;
 334
 335   /* We can use the generic block duplication code and simply remove
 336      the stuff we do not need.  */
 337   rd->dup_blocks[count] = duplicate_block (bb, NULL, NULL);
 338
 339   FOR_EACH_EDGE (e, ei, rd->dup_blocks[count]->succs)
 340     e->aux = NULL;
 341
 342   /* Zero out the profile, since the block is unreachable for now.  */
 343   rd->dup_blocks[count]->frequency = 0;
 344   rd->dup_blocks[count]->count = profile_count::uninitialized ();
 345   if (duplicate_blocks)
 346     bitmap_set_bit (*duplicate_blocks, rd->dup_blocks[count]->index);
 347 }
 348
 349 /* Main data structure to hold information for duplicates of BB.  */
 350
 351 static hash_table<redirection_data> *redirection_data;
 352
 353 /* Given an outgoing edge E lookup and return its entry in our hash table.
 354
 355    If INSERT is true, then we insert the entry into the hash table if
 356    it is not already present.  INCOMING_EDGE is added to the list of incoming
 357    edges associated with E in the hash table.  */
 358
 359 static struct redirection_data *
 360 lookup_redirection_data (edge e, enum insert_option insert)
 361 {
 362   struct redirection_data **slot;
 363   struct redirection_data *elt;
 364   vec<jump_thread_edge *> *path = THREAD_PATH (e);
 365
 366   /* Build a hash table element so we can see if E is already
 367      in the table.  */
 368   elt = XNEW (struct redirection_data);
 369   elt->path = path;
 370   elt->dup_blocks[0] = NULL;
 371   elt->dup_blocks[1] = NULL;
 372   elt->incoming_edges = NULL;
 373
 374   slot = redirection_data->find_slot (elt, insert);
 375
 376   /* This will only happen if INSERT is false and the entry is not
 377      in the hash table.  */
 378   if (slot == NULL)
 379     {
 380       free (elt);
 381       return NULL;
 382     }
 383
 384   /* This will only happen if E was not in the hash table and
 385      INSERT is true.  */
 386   if (*slot == NULL)
 387     {
 388       *slot = elt;
 389       elt->incoming_edges = XNEW (struct el);
 390       elt->incoming_edges->e = e;
 391       elt->incoming_edges->next = NULL;
 392       return elt;
 393     }
 394   /* E was in the hash table.  */
 395   else
 396     {
 397       /* Free ELT as we do not need it anymore, we will extract the
 398          relevant entry from the hash table itself.  */
 399       free (elt);
 400
 401       /* Get the entry stored in the hash table.  */
 402       elt = *slot;
 403
 404       /* If insertion was requested, then we need to add INCOMING_EDGE
 405          to the list of incoming edges associated with E.  */
 406       if (insert)
 407         {
 408           struct el *el = XNEW (struct el);
 409           el->next = elt->incoming_edges;
 410           el->e = e;
 411           elt->incoming_edges = el;
 412         }
 413
 414       return elt;
 415     }
 416 }
 417
 418 /* Similar to copy_phi_args, except that the PHI arg exists, it just
 419    does not have a value associated with it.  */
 420
 421 static void
 422 copy_phi_arg_into_existing_phi (edge src_e, edge tgt_e)
 423 {
 424   int src_idx = src_e->dest_idx;
 425   int tgt_idx = tgt_e->dest_idx;
 426
 427   /* Iterate over each PHI in e->dest.  */
 428   for (gphi_iterator gsi = gsi_start_phis (src_e->dest),
 429                            gsi2 = gsi_start_phis (tgt_e->dest);
 430        !gsi_end_p (gsi);
 431        gsi_next (&gsi), gsi_next (&gsi2))
 432     {
 433       gphi *src_phi = gsi.phi ();
 434       gphi *dest_phi = gsi2.phi ();
 435       tree val = gimple_phi_arg_def (src_phi, src_idx);
 436       source_location locus = gimple_phi_arg_location (src_phi, src_idx);
 437
 438       SET_PHI_ARG_DEF (dest_phi, tgt_idx, val);
 439       gimple_phi_arg_set_location (dest_phi, tgt_idx, locus);
 440     }
 441 }
 442
 443 /* Given ssa_name DEF, backtrack jump threading PATH from node IDX
 444    to see if it has constant value in a flow sensitive manner.  Set
 445    LOCUS to location of the constant phi arg and return the value.
 446    Return DEF directly if either PATH or idx is ZERO.  */
 447
 448 static tree
 449 get_value_locus_in_path (tree def, vec<jump_thread_edge *> *path,
 450                          basic_block bb, int idx, source_location *locus)
 451 {
 452   tree arg;
 453   gphi *def_phi;
 454   basic_block def_bb;
 455
 456   if (path == NULL || idx == 0)
 457     return def;
 458
 459   def_phi = dyn_cast <gphi *> (SSA_NAME_DEF_STMT (def));
 460   if (!def_phi)
 461     return def;
 462
 463   def_bb = gimple_bb (def_phi);
 464   /* Don't propagate loop invariants into deeper loops.  */
 465   if (!def_bb || bb_loop_depth (def_bb) < bb_loop_depth (bb))
 466     return def;
 467
 468   /* Backtrack jump threading path from IDX to see if def has constant
 469      value.  */
 470   for (int j = idx - 1; j >= 0; j--)
 471     {
 472       edge e = (*path)[j]->e;
 473       if (e->dest == def_bb)
 474         {
 475           arg = gimple_phi_arg_def (def_phi, e->dest_idx);
 476           if (is_gimple_min_invariant (arg))
 477             {
 478               *locus = gimple_phi_arg_location (def_phi, e->dest_idx);
 479               return arg;
 480             }
 481           break;
 482         }
 483     }
 484
 485   return def;
 486 }
 487
 488 /* For each PHI in BB, copy the argument associated with SRC_E to TGT_E.
 489    Try to backtrack jump threading PATH from node IDX to see if the arg
 490    has constant value, copy constant value instead of argument itself
 491    if yes.  */
 492
 493 static void
 494 copy_phi_args (basic_block bb, edge src_e, edge tgt_e,
 495                vec<jump_thread_edge *> *path, int idx)
 496 {
 497   gphi_iterator gsi;
 498   int src_indx = src_e->dest_idx;
 499
 500   for (gsi = gsi_start_phis (bb); !gsi_end_p (gsi); gsi_next (&gsi))
 501     {
 502       gphi *phi = gsi.phi ();
 503       tree def = gimple_phi_arg_def (phi, src_indx);
 504       source_location locus = gimple_phi_arg_location (phi, src_indx);
 505
 506       if (TREE_CODE (def) == SSA_NAME
 507           && !virtual_operand_p (gimple_phi_result (phi)))
 508         def = get_value_locus_in_path (def, path, bb, idx, &locus);
 509
 510       add_phi_arg (phi, def, tgt_e, locus);
 511     }
 512 }
 513
 514 /* We have recently made a copy of ORIG_BB, including its outgoing
 515    edges.  The copy is NEW_BB.  Every PHI node in every direct successor of
 516    ORIG_BB has a new argument associated with edge from NEW_BB to the
 517    successor.  Initialize the PHI argument so that it is equal to the PHI
 518    argument associated with the edge from ORIG_BB to the successor.
 519    PATH and IDX are used to check if the new PHI argument has constant
 520    value in a flow sensitive manner.  */
 521
 522 static void
 523 update_destination_phis (basic_block orig_bb, basic_block new_bb,
 524                          vec<jump_thread_edge *> *path, int idx)
 525 {
 526   edge_iterator ei;
 527   edge e;
 528
 529   FOR_EACH_EDGE (e, ei, orig_bb->succs)
 530     {
 531       edge e2 = find_edge (new_bb, e->dest);
 532       copy_phi_args (e->dest, e, e2, path, idx);
 533     }
 534 }
 535
 536 /* Given a duplicate block and its single destination (both stored
 537    in RD).  Create an edge between the duplicate and its single
 538    destination.
 539
 540    Add an additional argument to any PHI nodes at the single
 541    destination.  IDX is the start node in jump threading path
 542    we start to check to see if the new PHI argument has constant
 543    value along the jump threading path.  */
 544
 545 static void
 546 create_edge_and_update_destination_phis (struct redirection_data *rd,
 547                                          basic_block bb, int idx)
 548 {
 549   edge e = make_edge (bb, rd->path->last ()->e->dest, EDGE_FALLTHRU);
 550
 551   rescan_loop_exit (e, true, false);
 552   e->probability = REG_BR_PROB_BASE;
 553   e->count = bb->count;
 554
 555   /* We used to copy the thread path here.  That was added in 2007
 556      and dutifully updated through the representation changes in 2013.
 557
 558      In 2013 we added code to thread from an interior node through
 559      the backedge to another interior node.  That runs after the code
 560      to thread through loop headers from outside the loop.
 561
 562      The latter may delete edges in the CFG, including those
 563      which appeared in the jump threading path we copied here.  Thus
 564      we'd end up using a dangling pointer.
 565
 566      After reviewing the 2007/2011 code, I can't see how anything
 567      depended on copying the AUX field and clearly copying the jump
 568      threading path is problematical due to embedded edge pointers.
 569      It has been removed.  */
 570   e->aux = NULL;
 571
 572   /* If there are any PHI nodes at the destination of the outgoing edge
 573      from the duplicate block, then we will need to add a new argument
 574      to them.  The argument should have the same value as the argument
 575      associated with the outgoing edge stored in RD.  */
 576   copy_phi_args (e->dest, rd->path->last ()->e, e, rd->path, idx);
 577 }
 578
 579 /* Look through PATH beginning at START and return TRUE if there are
 580    any additional blocks that need to be duplicated.  Otherwise,
 581    return FALSE.  */
 582 static bool
 583 any_remaining_duplicated_blocks (vec<jump_thread_edge *> *path,
 584                                  unsigned int start)
 585 {
 586   for (unsigned int i = start + 1; i < path->length (); i++)
 587     {
 588       if ((*path)[i]->type == EDGE_COPY_SRC_JOINER_BLOCK
 589           || (*path)[i]->type == EDGE_COPY_SRC_BLOCK)
 590         return true;
 591     }
 592   return false;
 593 }
 594
 595
 596 /* Compute the amount of profile count/frequency coming into the jump threading
 597    path stored in RD that we are duplicating, returned in PATH_IN_COUNT_PTR and
 598    PATH_IN_FREQ_PTR, as well as the amount of counts flowing out of the
 599    duplicated path, returned in PATH_OUT_COUNT_PTR.  LOCAL_INFO is used to
 600    identify blocks duplicated for jump threading, which have duplicated
 601    edges that need to be ignored in the analysis.  Return true if path contains
 602    a joiner, false otherwise.
 603
 604    In the non-joiner case, this is straightforward - all the counts/frequency
 605    flowing into the jump threading path should flow through the duplicated
 606    block and out of the duplicated path.
 607
 608    In the joiner case, it is very tricky.  Some of the counts flowing into
 609    the original path go offpath at the joiner.  The problem is that while
 610    we know how much total count goes off-path in the original control flow,
 611    we don't know how many of the counts corresponding to just the jump
 612    threading path go offpath at the joiner.
 613
 614    For example, assume we have the following control flow and identified
 615    jump threading paths:
 616
 617                 A     B     C
 618                  \    |    /
 619                Ea \   |Eb / Ec
 620                    \  |  /
 621                     v v v
 622                       J       <-- Joiner
 623                      / \
 624                 Eoff/   \Eon
 625                    /     \
 626                   v       v
 627                 Soff     Son  <--- Normal
 628                          /\
 629                       Ed/  \ Ee
 630                        /    \
 631                       v     v
 632                       D      E
 633
 634             Jump threading paths: A -> J -> Son -> D (path 1)
 635                                   C -> J -> Son -> E (path 2)
 636
 637    Note that the control flow could be more complicated:
 638    - Each jump threading path may have more than one incoming edge.  I.e. A and
 639    Ea could represent multiple incoming blocks/edges that are included in
 640    path 1.
 641    - There could be EDGE_NO_COPY_SRC_BLOCK edges after the joiner (either
 642    before or after the "normal" copy block).  These are not duplicated onto
 643    the jump threading path, as they are single-successor.
 644    - Any of the blocks along the path may have other incoming edges that
 645    are not part of any jump threading path, but add profile counts along
 646    the path.
 647
 648    In the above example, after all jump threading is complete, we will
 649    end up with the following control flow:
 650
 651                 A          B           C
 652                 |          |           |
 653               Ea|          |Eb         |Ec
 654                 |          |           |
 655                 v          v           v
 656                Ja          J          Jc
 657                / \        / \Eon'     / \
 658           Eona/   \   ---/---\--------   \Eonc
 659              /     \ /  /     \           \
 660             v       v  v       v          v
 661            Sona     Soff      Son       Sonc
 662              \                 /\         /
 663               \___________    /  \  _____/
 664                           \  /    \/
 665                            vv      v
 666                             D      E
 667
 668    The main issue to notice here is that when we are processing path 1
 669    (A->J->Son->D) we need to figure out the outgoing edge weights to
 670    the duplicated edges Ja->Sona and Ja->Soff, while ensuring that the
 671    sum of the incoming weights to D remain Ed.  The problem with simply
 672    assuming that Ja (and Jc when processing path 2) has the same outgoing
 673    probabilities to its successors as the original block J, is that after
 674    all paths are processed and other edges/counts removed (e.g. none
 675    of Ec will reach D after processing path 2), we may end up with not
 676    enough count flowing along duplicated edge Sona->D.
 677
 678    Therefore, in the case of a joiner, we keep track of all counts
 679    coming in along the current path, as well as from predecessors not
 680    on any jump threading path (Eb in the above example).  While we
 681    first assume that the duplicated Eona for Ja->Sona has the same
 682    probability as the original, we later compensate for other jump
 683    threading paths that may eliminate edges.  We do that by keep track
 684    of all counts coming into the original path that are not in a jump
 685    thread (Eb in the above example, but as noted earlier, there could
 686    be other predecessors incoming to the path at various points, such
 687    as at Son).  Call this cumulative non-path count coming into the path
 688    before D as Enonpath.  We then ensure that the count from Sona->D is as at
 689    least as big as (Ed - Enonpath), but no bigger than the minimum
 690    weight along the jump threading path.  The probabilities of both the
 691    original and duplicated joiner block J and Ja will be adjusted
 692    accordingly after the updates.  */
 693
 694 static bool
 695 compute_path_counts (struct redirection_data *rd,
 696                      ssa_local_info_t *local_info,
 697                      profile_count *path_in_count_ptr,
 698                      profile_count *path_out_count_ptr,
 699                      int *path_in_freq_ptr)
 700 {
 701   edge e = rd->incoming_edges->e;
 702   vec<jump_thread_edge *> *path = THREAD_PATH (e);
 703   edge elast = path->last ()->e;
 704   profile_count nonpath_count = profile_count::zero ();
 705   bool has_joiner = false;
 706   profile_count path_in_count = profile_count::zero ();
 707   int path_in_freq = 0;
 708
 709   /* Start by accumulating incoming edge counts to the path's first bb
 710      into a couple buckets:
 711         path_in_count: total count of incoming edges that flow into the
 712                   current path.
 713         nonpath_count: total count of incoming edges that are not
 714                   flowing along *any* path.  These are the counts
 715                   that will still flow along the original path after
 716                   all path duplication is done by potentially multiple
 717                   calls to this routine.
 718      (any other incoming edge counts are for a different jump threading
 719      path that will be handled by a later call to this routine.)
 720      To make this easier, start by recording all incoming edges that flow into
 721      the current path in a bitmap.  We could add up the path's incoming edge
 722      counts here, but we still need to walk all the first bb's incoming edges
 723      below to add up the counts of the other edges not included in this jump
 724      threading path.  */
 725   struct el *next, *el;
 726   auto_bitmap in_edge_srcs;
 727   for (el = rd->incoming_edges; el; el = next)
 728     {
 729       next = el->next;
 730       bitmap_set_bit (in_edge_srcs, el->e->src->index);
 731     }
 732   edge ein;
 733   edge_iterator ei;
 734   FOR_EACH_EDGE (ein, ei, e->dest->preds)
 735     {
 736       vec<jump_thread_edge *> *ein_path = THREAD_PATH (ein);
 737       /* Simply check the incoming edge src against the set captured above.  */
 738       if (ein_path
 739           && bitmap_bit_p (in_edge_srcs, (*ein_path)[0]->e->src->index))
 740         {
 741           /* It is necessary but not sufficient that the last path edges
 742              are identical.  There may be different paths that share the
 743              same last path edge in the case where the last edge has a nocopy
 744              source block.  */
 745           gcc_assert (ein_path->last ()->e == elast);
 746           path_in_count += ein->count;
 747           path_in_freq += EDGE_FREQUENCY (ein);
 748         }
 749       else if (!ein_path)
 750         {
 751           /* Keep track of the incoming edges that are not on any jump-threading
 752              path.  These counts will still flow out of original path after all
 753              jump threading is complete.  */
 754             nonpath_count += ein->count;
 755         }
 756     }
 757
 758   /* This is needed due to insane incoming frequencies.  */
 759   if (path_in_freq > BB_FREQ_MAX)
 760     path_in_freq = BB_FREQ_MAX;
 761
 762   /* Now compute the fraction of the total count coming into the first
 763      path bb that is from the current threading path.  */
 764   profile_count total_count = e->dest->count;
 765   /* Handle incoming profile insanities.  */
 766   if (total_count < path_in_count)
 767     path_in_count = total_count;
 768   int onpath_scale = path_in_count.probability_in (total_count);
 769
 770   /* Walk the entire path to do some more computation in order to estimate
 771      how much of the path_in_count will flow out of the duplicated threading
 772      path.  In the non-joiner case this is straightforward (it should be
 773      the same as path_in_count, although we will handle incoming profile
 774      insanities by setting it equal to the minimum count along the path).
 775
 776      In the joiner case, we need to estimate how much of the path_in_count
 777      will stay on the threading path after the joiner's conditional branch.
 778      We don't really know for sure how much of the counts
 779      associated with this path go to each successor of the joiner, but we'll
 780      estimate based on the fraction of the total count coming into the path
 781      bb was from the threading paths (computed above in onpath_scale).
 782      Afterwards, we will need to do some fixup to account for other threading
 783      paths and possible profile insanities.
 784
 785      In order to estimate the joiner case's counts we also need to update
 786      nonpath_count with any additional counts coming into the path.  Other
 787      blocks along the path may have additional predecessors from outside
 788      the path.  */
 789   profile_count path_out_count = path_in_count;
 790   profile_count min_path_count = path_in_count;
 791   for (unsigned int i = 1; i < path->length (); i++)
 792     {
 793       edge epath = (*path)[i]->e;
 794       profile_count cur_count = epath->count;
 795       if ((*path)[i]->type == EDGE_COPY_SRC_JOINER_BLOCK)
 796         {
 797           has_joiner = true;
 798           cur_count = cur_count.apply_probability (onpath_scale);
 799         }
 800       /* In the joiner case we need to update nonpath_count for any edges
 801          coming into the path that will contribute to the count flowing
 802          into the path successor.  */
 803       if (has_joiner && epath != elast)
 804         {
 805           /* Look for other incoming edges after joiner.  */
 806           FOR_EACH_EDGE (ein, ei, epath->dest->preds)
 807             {
 808               if (ein != epath
 809                   /* Ignore in edges from blocks we have duplicated for a
 810                      threading path, which have duplicated edge counts until
 811                      they are redirected by an invocation of this routine.  */
 812                   && !bitmap_bit_p (local_info->duplicate_blocks,
 813                                     ein->src->index))
 814                 nonpath_count += ein->count;
 815             }
 816         }
 817       if (cur_count < path_out_count)
 818         path_out_count = cur_count;
 819       if (epath->count < min_path_count)
 820         min_path_count = epath->count;
 821     }
 822
 823   /* We computed path_out_count above assuming that this path targeted
 824      the joiner's on-path successor with the same likelihood as it
 825      reached the joiner.  However, other thread paths through the joiner
 826      may take a different path through the normal copy source block
 827      (i.e. they have a different elast), meaning that they do not
 828      contribute any counts to this path's elast.  As a result, it may
 829      turn out that this path must have more count flowing to the on-path
 830      successor of the joiner.  Essentially, all of this path's elast
 831      count must be contributed by this path and any nonpath counts
 832      (since any path through the joiner with a different elast will not
 833      include a copy of this elast in its duplicated path).
 834      So ensure that this path's path_out_count is at least the
 835      difference between elast->count and nonpath_count.  Otherwise the edge
 836      counts after threading will not be sane.  */
 837   if (local_info->need_profile_correction
 838       && has_joiner && path_out_count < elast->count - nonpath_count)
 839     {
 840       path_out_count = elast->count - nonpath_count;
 841       /* But neither can we go above the minimum count along the path
 842          we are duplicating.  This can be an issue due to profile
 843          insanities coming in to this pass.  */
 844       if (path_out_count > min_path_count)
 845         path_out_count = min_path_count;
 846     }
 847
 848   *path_in_count_ptr = path_in_count;
 849   *path_out_count_ptr = path_out_count;
 850   *path_in_freq_ptr = path_in_freq;
 851   return has_joiner;
 852 }
 853
 854
 855 /* Update the counts and frequencies for both an original path
 856    edge EPATH and its duplicate EDUP.  The duplicate source block
 857    will get a count/frequency of PATH_IN_COUNT and PATH_IN_FREQ,
 858    and the duplicate edge EDUP will have a count of PATH_OUT_COUNT.  */
 859 static void
 860 update_profile (edge epath, edge edup, profile_count path_in_count,
 861                 profile_count path_out_count, int path_in_freq)
 862 {
 863
 864   /* First update the duplicated block's count / frequency.  */
 865   if (edup)
 866     {
 867       basic_block dup_block = edup->src;
 868       gcc_assert (!dup_block->count.initialized_p ());
 869       gcc_assert (dup_block->frequency == 0);
 870       dup_block->count = path_in_count;
 871       dup_block->frequency = path_in_freq;
 872     }
 873
 874   /* Now update the original block's count and frequency in the
 875      opposite manner - remove the counts/freq that will flow
 876      into the duplicated block.  Handle underflow due to precision/
 877      rounding issues.  */
 878   epath->src->count -= path_in_count;
 879   epath->src->frequency -= path_in_freq;
 880   if (epath->src->frequency < 0)
 881     epath->src->frequency = 0;
 882
 883   /* Next update this path edge's original and duplicated counts.  We know
 884      that the duplicated path will have path_out_count flowing
 885      out of it (in the joiner case this is the count along the duplicated path
 886      out of the duplicated joiner).  This count can then be removed from the
 887      original path edge.  */
 888   if (edup)
 889     edup->count = path_out_count;
 890   epath->count -= path_out_count;
 891   /* FIXME: can epath->count be legally uninitialized here?  */
 892 }
 893
 894
 895 /* The duplicate and original joiner blocks may end up with different
 896    probabilities (different from both the original and from each other).
 897    Recompute the probabilities here once we have updated the edge
 898    counts and frequencies.  */
 899
 900 static void
 901 recompute_probabilities (basic_block bb)
 902 {
 903   edge esucc;
 904   edge_iterator ei;
 905   FOR_EACH_EDGE (esucc, ei, bb->succs)
 906     {
 907       if (!(bb->count > 0))
 908         continue;
 909
 910       /* Prevent overflow computation due to insane profiles.  */
 911       if (esucc->count < bb->count)
 912         esucc->probability = esucc->count.probability_in (bb->count);
 913       else
 914         /* Can happen with missing/guessed probabilities, since we
 915            may determine that more is flowing along duplicated
 916            path than joiner succ probabilities allowed.
 917            Counts and freqs will be insane after jump threading,
 918            at least make sure probability is sane or we will
 919            get a flow verification error.
 920            Not much we can do to make counts/freqs sane without
 921            redoing the profile estimation.  */
 922         esucc->probability = REG_BR_PROB_BASE;
 923     }
 924 }
 925
 926
 927 /* Update the counts of the original and duplicated edges from a joiner
 928    that go off path, given that we have already determined that the
 929    duplicate joiner DUP_BB has incoming count PATH_IN_COUNT and
 930    outgoing count along the path PATH_OUT_COUNT.  The original (on-)path
 931    edge from joiner is EPATH.  */
 932
 933 static void
 934 update_joiner_offpath_counts (edge epath, basic_block dup_bb,
 935                               profile_count path_in_count,
 936                               profile_count path_out_count)
 937 {
 938   /* Compute the count that currently flows off path from the joiner.
 939      In other words, the total count of joiner's out edges other than
 940      epath.  Compute this by walking the successors instead of
 941      subtracting epath's count from the joiner bb count, since there
 942      are sometimes slight insanities where the total out edge count is
 943      larger than the bb count (possibly due to rounding/truncation
 944      errors).  */
 945   profile_count total_orig_off_path_count = profile_count::zero ();
 946   edge enonpath;
 947   edge_iterator ei;
 948   FOR_EACH_EDGE (enonpath, ei, epath->src->succs)
 949     {
 950       if (enonpath == epath)
 951         continue;
 952       total_orig_off_path_count += enonpath->count;
 953     }
 954
 955   /* For the path that we are duplicating, the amount that will flow
 956      off path from the duplicated joiner is the delta between the
 957      path's cumulative in count and the portion of that count we
 958      estimated above as flowing from the joiner along the duplicated
 959      path.  */
 960   profile_count total_dup_off_path_count = path_in_count - path_out_count;
 961
 962   /* Now do the actual updates of the off-path edges.  */
 963   FOR_EACH_EDGE (enonpath, ei, epath->src->succs)
 964     {
 965       /* Look for edges going off of the threading path.  */
 966       if (enonpath == epath)
 967         continue;
 968
 969       /* Find the corresponding edge out of the duplicated joiner.  */
 970       edge enonpathdup = find_edge (dup_bb, enonpath->dest);
 971       gcc_assert (enonpathdup);
 972
 973       /* We can't use the original probability of the joiner's out
 974          edges, since the probabilities of the original branch
 975          and the duplicated branches may vary after all threading is
 976          complete.  But apportion the duplicated joiner's off-path
 977          total edge count computed earlier (total_dup_off_path_count)
 978          among the duplicated off-path edges based on their original
 979          ratio to the full off-path count (total_orig_off_path_count).
 980          */
 981       int scale = enonpath->count.probability_in (total_orig_off_path_count);
 982       /* Give the duplicated offpath edge a portion of the duplicated
 983          total.  */
 984       enonpathdup->count = total_dup_off_path_count.apply_probability (scale);
 985       /* Now update the original offpath edge count, handling underflow
 986          due to rounding errors.  */
 987       enonpath->count -= enonpathdup->count;
 988     }
 989 }
 990
 991
 992 /* Check if the paths through RD all have estimated frequencies but zero
 993    profile counts.  This is more accurate than checking the entry block
 994    for a zero profile count, since profile insanities sometimes creep in.  */
 995
 996 static bool
 997 estimated_freqs_path (struct redirection_data *rd)
 998 {
 999   edge e = rd->incoming_edges->e;
1000   vec<jump_thread_edge *> *path = THREAD_PATH (e);
1001   edge ein;
1002   edge_iterator ei;
1003   bool non_zero_freq = false;
1004   FOR_EACH_EDGE (ein, ei, e->dest->preds)
1005     {
1006       if (ein->count > 0)
1007         return false;
1008       non_zero_freq |= ein->src->frequency != 0;
1009     }
1010
1011   for (unsigned int i = 1; i < path->length (); i++)
1012     {
1013       edge epath = (*path)[i]->e;
1014       if (epath->src->count > 0)
1015         return false;
1016       non_zero_freq |= epath->src->frequency != 0;
1017       edge esucc;
1018       FOR_EACH_EDGE (esucc, ei, epath->src->succs)
1019         {
1020           if (esucc->count > 0)
1021             return false;
1022           non_zero_freq |= esucc->src->frequency != 0;
1023         }
1024     }
1025   return non_zero_freq;
1026 }
1027
1028
1029 /* Invoked for routines that have guessed frequencies and no profile
1030    counts to record the block and edge frequencies for paths through RD
1031    in the profile count fields of those blocks and edges.  This is because
1032    ssa_fix_duplicate_block_edges incrementally updates the block and
1033    edge counts as edges are redirected, and it is difficult to do that
1034    for edge frequencies which are computed on the fly from the source
1035    block frequency and probability.  When a block frequency is updated
1036    its outgoing edge frequencies are affected and become difficult to
1037    adjust.  */
1038
1039 static void
1040 freqs_to_counts_path (struct redirection_data *rd)
1041 {
1042   edge e = rd->incoming_edges->e;
1043   vec<jump_thread_edge *> *path = THREAD_PATH (e);
1044   edge ein;
1045   edge_iterator ei;
1046   FOR_EACH_EDGE (ein, ei, e->dest->preds)
1047     {
1048       /* Scale up the frequency by REG_BR_PROB_BASE, to avoid rounding
1049          errors applying the probability when the frequencies are very
1050          small.  */
1051       ein->count = profile_count::from_gcov_type
1052                 (apply_probability (ein->src->frequency * REG_BR_PROB_BASE,
1053                                       ein->probability));
1054     }
1055
1056   for (unsigned int i = 1; i < path->length (); i++)
1057     {
1058       edge epath = (*path)[i]->e;
1059       edge esucc;
1060       /* Scale up the frequency by REG_BR_PROB_BASE, to avoid rounding
1061          errors applying the edge probability when the frequencies are very
1062          small.  */
1063       epath->src->count =
1064         profile_count::from_gcov_type
1065           (epath->src->frequency * REG_BR_PROB_BASE);
1066       FOR_EACH_EDGE (esucc, ei, epath->src->succs)
1067         esucc->count =
1068            esucc->src->count.apply_probability (esucc->probability);
1069     }
1070 }
1071
1072
1073 /* For routines that have guessed frequencies and no profile counts, where we
1074    used freqs_to_counts_path to record block and edge frequencies for paths
1075    through RD, we clear the counts after completing all updates for RD.
1076    The updates in ssa_fix_duplicate_block_edges are based off the count fields,
1077    but the block frequencies and edge probabilities were updated as well,
1078    so we can simply clear the count fields.  */
1079
1080 static void
1081 clear_counts_path (struct redirection_data *rd)
1082 {
1083   edge e = rd->incoming_edges->e;
1084   vec<jump_thread_edge *> *path = THREAD_PATH (e);
1085   edge ein, esucc;
1086   edge_iterator ei;
1087   profile_count val = profile_count::uninitialized ();
1088   if (profile_status_for_fn (cfun) == PROFILE_READ)
1089     val = profile_count::zero ();
1090
1091   FOR_EACH_EDGE (ein, ei, e->dest->preds)
1092     ein->count = val;
1093
1094   /* First clear counts along original path.  */
1095   for (unsigned int i = 1; i < path->length (); i++)
1096     {
1097       edge epath = (*path)[i]->e;
1098       FOR_EACH_EDGE (esucc, ei, epath->src->succs)
1099         esucc->count = val;
1100       epath->src->count = val;
1101     }
1102   /* Also need to clear the counts along duplicated path.  */
1103   for (unsigned int i = 0; i < 2; i++)
1104     {
1105       basic_block dup = rd->dup_blocks[i];
1106       if (!dup)
1107         continue;
1108       FOR_EACH_EDGE (esucc, ei, dup->succs)
1109         esucc->count = val;
1110       dup->count = val;
1111     }
1112 }
1113
1114 /* Wire up the outgoing edges from the duplicate blocks and
1115    update any PHIs as needed.  Also update the profile counts
1116    on the original and duplicate blocks and edges.  */
1117 void
1118 ssa_fix_duplicate_block_edges (struct redirection_data *rd,
1119                                ssa_local_info_t *local_info)
1120 {
1121   bool multi_incomings = (rd->incoming_edges->next != NULL);
1122   edge e = rd->incoming_edges->e;
1123   vec<jump_thread_edge *> *path = THREAD_PATH (e);
1124   edge elast = path->last ()->e;
1125   profile_count path_in_count = profile_count::zero ();
1126   profile_count path_out_count = profile_count::zero ();
1127   int path_in_freq = 0;
1128
1129   /* This routine updates profile counts, frequencies, and probabilities
1130      incrementally. Since it is difficult to do the incremental updates
1131      using frequencies/probabilities alone, for routines without profile
1132      data we first take a snapshot of the existing block and edge frequencies
1133      by copying them into the empty profile count fields.  These counts are
1134      then used to do the incremental updates, and cleared at the end of this
1135      routine.  If the function is marked as having a profile, we still check
1136      to see if the paths through RD are using estimated frequencies because
1137      the routine had zero profile counts.  */
1138   bool do_freqs_to_counts = (profile_status_for_fn (cfun) != PROFILE_READ
1139                              || estimated_freqs_path (rd));
1140   if (do_freqs_to_counts)
1141     freqs_to_counts_path (rd);
1142
1143   /* First determine how much profile count to move from original
1144      path to the duplicate path.  This is tricky in the presence of
1145      a joiner (see comments for compute_path_counts), where some portion
1146      of the path's counts will flow off-path from the joiner.  In the
1147      non-joiner case the path_in_count and path_out_count should be the
1148      same.  */
1149   bool has_joiner = compute_path_counts (rd, local_info,
1150                                          &path_in_count, &path_out_count,
1151                                          &path_in_freq);
1152
1153   int cur_path_freq = path_in_freq;
1154   for (unsigned int count = 0, i = 1; i < path->length (); i++)
1155     {
1156       edge epath = (*path)[i]->e;
1157
1158       /* If we were threading through an joiner block, then we want
1159          to keep its control statement and redirect an outgoing edge.
1160          Else we want to remove the control statement & edges, then create
1161          a new outgoing edge.  In both cases we may need to update PHIs.  */
1162       if ((*path)[i]->type == EDGE_COPY_SRC_JOINER_BLOCK)
1163         {
1164           edge victim;
1165           edge e2;
1166
1167           gcc_assert (has_joiner);
1168
1169           /* This updates the PHIs at the destination of the duplicate
1170              block.  Pass 0 instead of i if we are threading a path which
1171              has multiple incoming edges.  */
1172           update_destination_phis (local_info->bb, rd->dup_blocks[count],
1173                                    path, multi_incomings ? 0 : i);
1174
1175           /* Find the edge from the duplicate block to the block we're
1176              threading through.  That's the edge we want to redirect.  */
1177           victim = find_edge (rd->dup_blocks[count], (*path)[i]->e->dest);
1178
1179           /* If there are no remaining blocks on the path to duplicate,
1180              then redirect VICTIM to the final destination of the jump
1181              threading path.  */
1182           if (!any_remaining_duplicated_blocks (path, i))
1183             {
1184               e2 = redirect_edge_and_branch (victim, elast->dest);
1185               /* If we redirected the edge, then we need to copy PHI arguments
1186                  at the target.  If the edge already existed (e2 != victim
1187                  case), then the PHIs in the target already have the correct
1188                  arguments.  */
1189               if (e2 == victim)
1190                 copy_phi_args (e2->dest, elast, e2,
1191                                path, multi_incomings ? 0 : i);
1192             }
1193           else
1194             {
1195               /* Redirect VICTIM to the next duplicated block in the path.  */
1196               e2 = redirect_edge_and_branch (victim, rd->dup_blocks[count + 1]);
1197
1198               /* We need to update the PHIs in the next duplicated block.  We
1199                  want the new PHI args to have the same value as they had
1200                  in the source of the next duplicate block.
1201
1202                  Thus, we need to know which edge we traversed into the
1203                  source of the duplicate.  Furthermore, we may have
1204                  traversed many edges to reach the source of the duplicate.
1205
1206                  Walk through the path starting at element I until we
1207                  hit an edge marked with EDGE_COPY_SRC_BLOCK.  We want
1208                  the edge from the prior element.  */
1209               for (unsigned int j = i + 1; j < path->length (); j++)
1210                 {
1211                   if ((*path)[j]->type == EDGE_COPY_SRC_BLOCK)
1212                     {
1213                       copy_phi_arg_into_existing_phi ((*path)[j - 1]->e, e2);
1214                       break;
1215                     }
1216                 }
1217             }
1218
1219           /* Update the counts and frequency of both the original block
1220              and path edge, and the duplicates.  The path duplicate's
1221              incoming count and frequency are the totals for all edges
1222              incoming to this jump threading path computed earlier.
1223              And we know that the duplicated path will have path_out_count
1224              flowing out of it (i.e. along the duplicated path out of the
1225              duplicated joiner).  */
1226           update_profile (epath, e2, path_in_count, path_out_count,
1227                           path_in_freq);
1228
1229           /* Next we need to update the counts of the original and duplicated
1230              edges from the joiner that go off path.  */
1231           update_joiner_offpath_counts (epath, e2->src, path_in_count,
1232                                         path_out_count);
1233
1234           /* Finally, we need to set the probabilities on the duplicated
1235              edges out of the duplicated joiner (e2->src).  The probabilities
1236              along the original path will all be updated below after we finish
1237              processing the whole path.  */
1238           recompute_probabilities (e2->src);
1239
1240           /* Record the frequency flowing to the downstream duplicated
1241              path blocks.  */
1242           cur_path_freq = EDGE_FREQUENCY (e2);
1243         }
1244       else if ((*path)[i]->type == EDGE_COPY_SRC_BLOCK)
1245         {
1246           remove_ctrl_stmt_and_useless_edges (rd->dup_blocks[count], NULL);
1247           create_edge_and_update_destination_phis (rd, rd->dup_blocks[count],
1248                                                    multi_incomings ? 0 : i);
1249           if (count == 1)
1250             single_succ_edge (rd->dup_blocks[1])->aux = NULL;
1251
1252           /* Update the counts and frequency of both the original block
1253              and path edge, and the duplicates.  Since we are now after
1254              any joiner that may have existed on the path, the count
1255              flowing along the duplicated threaded path is path_out_count.
1256              If we didn't have a joiner, then cur_path_freq was the sum
1257              of the total frequencies along all incoming edges to the
1258              thread path (path_in_freq).  If we had a joiner, it would have
1259              been updated at the end of that handling to the edge frequency
1260              along the duplicated joiner path edge.  */
1261           update_profile (epath, EDGE_SUCC (rd->dup_blocks[count], 0),
1262                           path_out_count, path_out_count,
1263                           cur_path_freq);
1264         }
1265       else
1266         {
1267           /* No copy case.  In this case we don't have an equivalent block
1268              on the duplicated thread path to update, but we do need
1269              to remove the portion of the counts/freqs that were moved
1270              to the duplicated path from the counts/freqs flowing through
1271              this block on the original path.  Since all the no-copy edges
1272              are after any joiner, the removed count is the same as
1273              path_out_count.
1274
1275              If we didn't have a joiner, then cur_path_freq was the sum
1276              of the total frequencies along all incoming edges to the
1277              thread path (path_in_freq).  If we had a joiner, it would have
1278              been updated at the end of that handling to the edge frequency
1279              along the duplicated joiner path edge.  */
1280            update_profile (epath, NULL, path_out_count, path_out_count,
1281                            cur_path_freq);
1282         }
1283
1284       /* Increment the index into the duplicated path when we processed
1285          a duplicated block.  */
1286       if ((*path)[i]->type == EDGE_COPY_SRC_JOINER_BLOCK
1287           || (*path)[i]->type == EDGE_COPY_SRC_BLOCK)
1288         {
1289           count++;
1290         }
1291     }
1292
1293   /* Now walk orig blocks and update their probabilities, since the
1294      counts and freqs should be updated properly by above loop.  */
1295   for (unsigned int i = 1; i < path->length (); i++)
1296     {
1297       edge epath = (*path)[i]->e;
1298       recompute_probabilities (epath->src);
1299     }
1300
1301   /* Done with all profile and frequency updates, clear counts if they
1302      were copied.  */
1303   if (do_freqs_to_counts)
1304     clear_counts_path (rd);
1305 }
1306
1307 /* Hash table traversal callback routine to create duplicate blocks.  */
1308
1309 int
1310 ssa_create_duplicates (struct redirection_data **slot,
1311                        ssa_local_info_t *local_info)
1312 {
1313   struct redirection_data *rd = *slot;
1314
1315   /* The second duplicated block in a jump threading path is specific
1316      to the path.  So it gets stored in RD rather than in LOCAL_DATA.
1317
1318      Each time we're called, we have to look through the path and see
1319      if a second block needs to be duplicated.
1320
1321      Note the search starts with the third edge on the path.  The first
1322      edge is the incoming edge, the second edge always has its source
1323      duplicated.  Thus we start our search with the third edge.  */
1324   vec<jump_thread_edge *> *path = rd->path;
1325   for (unsigned int i = 2; i < path->length (); i++)
1326     {
1327       if ((*path)[i]->type == EDGE_COPY_SRC_BLOCK
1328           || (*path)[i]->type == EDGE_COPY_SRC_JOINER_BLOCK)
1329         {
1330           create_block_for_threading ((*path)[i]->e->src, rd, 1,
1331                                       &local_info->duplicate_blocks);
1332           break;
1333         }
1334     }
1335
1336   /* Create a template block if we have not done so already.  Otherwise
1337      use the template to create a new block.  */
1338   if (local_info->template_block == NULL)
1339     {
1340       create_block_for_threading ((*path)[1]->e->src, rd, 0,
1341                                   &local_info->duplicate_blocks);
1342       local_info->template_block = rd->dup_blocks[0];
1343
1344       /* We do not create any outgoing edges for the template.  We will
1345          take care of that in a later traversal.  That way we do not
1346          create edges that are going to just be deleted.  */
1347     }
1348   else
1349     {
1350       create_block_for_threading (local_info->template_block, rd, 0,
1351                                   &local_info->duplicate_blocks);
1352
1353       /* Go ahead and wire up outgoing edges and update PHIs for the duplicate
1354          block.   */
1355       ssa_fix_duplicate_block_edges (rd, local_info);
1356     }
1357
1358   /* Keep walking the hash table.  */
1359   return 1;
1360 }
1361
1362 /* We did not create any outgoing edges for the template block during
1363    block creation.  This hash table traversal callback creates the
1364    outgoing edge for the template block.  */
1365
1366 inline int
1367 ssa_fixup_template_block (struct redirection_data **slot,
1368                           ssa_local_info_t *local_info)
1369 {
1370   struct redirection_data *rd = *slot;
1371
1372   /* If this is the template block halt the traversal after updating
1373      it appropriately.
1374
1375      If we were threading through an joiner block, then we want
1376      to keep its control statement and redirect an outgoing edge.
1377      Else we want to remove the control statement & edges, then create
1378      a new outgoing edge.  In both cases we may need to update PHIs.  */
1379   if (rd->dup_blocks[0] && rd->dup_blocks[0] == local_info->template_block)
1380     {
1381       ssa_fix_duplicate_block_edges (rd, local_info);
1382       return 0;
1383     }
1384
1385   return 1;
1386 }
1387
1388 /* Hash table traversal callback to redirect each incoming edge
1389    associated with this hash table element to its new destination.  */
1390
1391 int
1392 ssa_redirect_edges (struct redirection_data **slot,
1393                     ssa_local_info_t *local_info)
1394 {
1395   struct redirection_data *rd = *slot;
1396   struct el *next, *el;
1397
1398   /* Walk over all the incoming edges associated with this hash table
1399      entry.  */
1400   for (el = rd->incoming_edges; el; el = next)
1401     {
1402       edge e = el->e;
1403       vec<jump_thread_edge *> *path = THREAD_PATH (e);
1404
1405       /* Go ahead and free this element from the list.  Doing this now
1406          avoids the need for another list walk when we destroy the hash
1407          table.  */
1408       next = el->next;
1409       free (el);
1410
1411       thread_stats.num_threaded_edges++;
1412
1413       if (rd->dup_blocks[0])
1414         {
1415           edge e2;
1416
1417           if (dump_file && (dump_flags & TDF_DETAILS))
1418             fprintf (dump_file, "  Threaded jump %d --> %d to %d\n",
1419                      e->src->index, e->dest->index, rd->dup_blocks[0]->index);
1420
1421           /* Redirect the incoming edge (possibly to the joiner block) to the
1422              appropriate duplicate block.  */
1423           e2 = redirect_edge_and_branch (e, rd->dup_blocks[0]);
1424           gcc_assert (e == e2);
1425           flush_pending_stmts (e2);
1426         }
1427
1428       /* Go ahead and clear E->aux.  It's not needed anymore and failure
1429          to clear it will cause all kinds of unpleasant problems later.  */
1430       delete_jump_thread_path (path);
1431       e->aux = NULL;
1432
1433     }
1434
1435   /* Indicate that we actually threaded one or more jumps.  */
1436   if (rd->incoming_edges)
1437     local_info->jumps_threaded = true;
1438
1439   return 1;
1440 }
1441
1442 /* Return true if this block has no executable statements other than
1443    a simple ctrl flow instruction.  When the number of outgoing edges
1444    is one, this is equivalent to a "forwarder" block.  */
1445
1446 static bool
1447 redirection_block_p (basic_block bb)
1448 {
1449   gimple_stmt_iterator gsi;
1450
1451   /* Advance to the first executable statement.  */
1452   gsi = gsi_start_bb (bb);
1453   while (!gsi_end_p (gsi)
1454          && (gimple_code (gsi_stmt (gsi)) == GIMPLE_LABEL
1455              || is_gimple_debug (gsi_stmt (gsi))
1456              || gimple_nop_p (gsi_stmt (gsi))
1457              || gimple_clobber_p (gsi_stmt (gsi))))
1458     gsi_next (&gsi);
1459
1460   /* Check if this is an empty block.  */
1461   if (gsi_end_p (gsi))
1462     return true;
1463
1464   /* Test that we've reached the terminating control statement.  */
1465   return gsi_stmt (gsi)
1466          && (gimple_code (gsi_stmt (gsi)) == GIMPLE_COND
1467              || gimple_code (gsi_stmt (gsi)) == GIMPLE_GOTO
1468              || gimple_code (gsi_stmt (gsi)) == GIMPLE_SWITCH);
1469 }
1470
1471 /* BB is a block which ends with a COND_EXPR or SWITCH_EXPR and when BB
1472    is reached via one or more specific incoming edges, we know which
1473    outgoing edge from BB will be traversed.
1474
1475    We want to redirect those incoming edges to the target of the
1476    appropriate outgoing edge.  Doing so avoids a conditional branch
1477    and may expose new optimization opportunities.  Note that we have
1478    to update dominator tree and SSA graph after such changes.
1479
1480    The key to keeping the SSA graph update manageable is to duplicate
1481    the side effects occurring in BB so that those side effects still
1482    occur on the paths which bypass BB after redirecting edges.
1483
1484    We accomplish this by creating duplicates of BB and arranging for
1485    the duplicates to unconditionally pass control to one specific
1486    successor of BB.  We then revector the incoming edges into BB to
1487    the appropriate duplicate of BB.
1488
1489    If NOLOOP_ONLY is true, we only perform the threading as long as it
1490    does not affect the structure of the loops in a nontrivial way.
1491
1492    If JOINERS is true, then thread through joiner blocks as well.  */
1493
1494 static bool
1495 thread_block_1 (basic_block bb, bool noloop_only, bool joiners)
1496 {
1497   /* E is an incoming edge into BB that we may or may not want to
1498      redirect to a duplicate of BB.  */
1499   edge e, e2;
1500   edge_iterator ei;
1501   ssa_local_info_t local_info;
1502
1503   local_info.duplicate_blocks = BITMAP_ALLOC (NULL);
1504   local_info.need_profile_correction = false;
1505
1506   /* To avoid scanning a linear array for the element we need we instead
1507      use a hash table.  For normal code there should be no noticeable
1508      difference.  However, if we have a block with a large number of
1509      incoming and outgoing edges such linear searches can get expensive.  */
1510   redirection_data
1511     = new hash_table<struct redirection_data> (EDGE_COUNT (bb->succs));
1512
1513   /* Record each unique threaded destination into a hash table for
1514      efficient lookups.  */
1515   edge last = NULL;
1516   FOR_EACH_EDGE (e, ei, bb->preds)
1517     {
1518       if (e->aux == NULL)
1519         continue;
1520
1521       vec<jump_thread_edge *> *path = THREAD_PATH (e);
1522
1523       if (((*path)[1]->type == EDGE_COPY_SRC_JOINER_BLOCK && !joiners)
1524           || ((*path)[1]->type == EDGE_COPY_SRC_BLOCK && joiners))
1525         continue;
1526
1527       e2 = path->last ()->e;
1528       if (!e2 || noloop_only)
1529         {
1530           /* If NOLOOP_ONLY is true, we only allow threading through the
1531              header of a loop to exit edges.  */
1532
1533           /* One case occurs when there was loop header buried in a jump
1534              threading path that crosses loop boundaries.  We do not try
1535              and thread this elsewhere, so just cancel the jump threading
1536              request by clearing the AUX field now.  */
1537           if (bb->loop_father != e2->src->loop_father
1538               && !loop_exit_edge_p (e2->src->loop_father, e2))
1539             {
1540               /* Since this case is not handled by our special code
1541                  to thread through a loop header, we must explicitly
1542                  cancel the threading request here.  */
1543               delete_jump_thread_path (path);
1544               e->aux = NULL;
1545               continue;
1546             }
1547
1548           /* Another case occurs when trying to thread through our
1549              own loop header, possibly from inside the loop.  We will
1550              thread these later.  */
1551           unsigned int i;
1552           for (i = 1; i < path->length (); i++)
1553             {
1554               if ((*path)[i]->e->src == bb->loop_father->header
1555                   && (!loop_exit_edge_p (bb->loop_father, e2)
1556                       || (*path)[1]->type == EDGE_COPY_SRC_JOINER_BLOCK))
1557                 break;
1558             }
1559
1560           if (i != path->length ())
1561             continue;
1562         }
1563
1564       /* Insert the outgoing edge into the hash table if it is not
1565          already in the hash table.  */
1566       lookup_redirection_data (e, INSERT);
1567
1568       /* When we have thread paths through a common joiner with different
1569          final destinations, then we may need corrections to deal with
1570          profile insanities.  See the big comment before compute_path_counts.  */
1571       if ((*path)[1]->type == EDGE_COPY_SRC_JOINER_BLOCK)
1572         {
1573           if (!last)
1574             last = e2;
1575           else if (e2 != last)
1576             local_info.need_profile_correction = true;
1577         }
1578     }
1579
1580   /* We do not update dominance info.  */
1581   free_dominance_info (CDI_DOMINATORS);
1582
1583   /* We know we only thread through the loop header to loop exits.
1584      Let the basic block duplication hook know we are not creating
1585      a multiple entry loop.  */
1586   if (noloop_only
1587       && bb == bb->loop_father->header)
1588     set_loop_copy (bb->loop_father, loop_outer (bb->loop_father));
1589
1590   /* Now create duplicates of BB.
1591
1592      Note that for a block with a high outgoing degree we can waste
1593      a lot of time and memory creating and destroying useless edges.
1594
1595      So we first duplicate BB and remove the control structure at the
1596      tail of the duplicate as well as all outgoing edges from the
1597      duplicate.  We then use that duplicate block as a template for
1598      the rest of the duplicates.  */
1599   local_info.template_block = NULL;
1600   local_info.bb = bb;
1601   local_info.jumps_threaded = false;
1602   redirection_data->traverse <ssa_local_info_t *, ssa_create_duplicates>
1603                             (&local_info);
1604
1605   /* The template does not have an outgoing edge.  Create that outgoing
1606      edge and update PHI nodes as the edge's target as necessary.
1607
1608      We do this after creating all the duplicates to avoid creating
1609      unnecessary edges.  */
1610   redirection_data->traverse <ssa_local_info_t *, ssa_fixup_template_block>
1611                             (&local_info);
1612
1613   /* The hash table traversals above created the duplicate blocks (and the
1614      statements within the duplicate blocks).  This loop creates PHI nodes for
1615      the duplicated blocks and redirects the incoming edges into BB to reach
1616      the duplicates of BB.  */
1617   redirection_data->traverse <ssa_local_info_t *, ssa_redirect_edges>
1618                             (&local_info);
1619
1620   /* Done with this block.  Clear REDIRECTION_DATA.  */
1621   delete redirection_data;
1622   redirection_data = NULL;
1623
1624   if (noloop_only
1625       && bb == bb->loop_father->header)
1626     set_loop_copy (bb->loop_father, NULL);
1627
1628   BITMAP_FREE (local_info.duplicate_blocks);
1629   local_info.duplicate_blocks = NULL;
1630
1631   /* Indicate to our caller whether or not any jumps were threaded.  */
1632   return local_info.jumps_threaded;
1633 }
1634
1635 /* Wrapper for thread_block_1 so that we can first handle jump
1636    thread paths which do not involve copying joiner blocks, then
1637    handle jump thread paths which have joiner blocks.
1638
1639    By doing things this way we can be as aggressive as possible and
1640    not worry that copying a joiner block will create a jump threading
1641    opportunity.  */
1642
1643 static bool
1644 thread_block (basic_block bb, bool noloop_only)
1645 {
1646   bool retval;
1647   retval = thread_block_1 (bb, noloop_only, false);
1648   retval |= thread_block_1 (bb, noloop_only, true);
1649   return retval;
1650 }
1651
1652 /* Callback for dfs_enumerate_from.  Returns true if BB is different
1653    from STOP and DBDS_CE_STOP.  */
1654
1655 static basic_block dbds_ce_stop;
1656 static bool
1657 dbds_continue_enumeration_p (const_basic_block bb, const void *stop)
1658 {
1659   return (bb != (const_basic_block) stop
1660           && bb != dbds_ce_stop);
1661 }
1662
1663 /* Evaluates the dominance relationship of latch of the LOOP and BB, and
1664    returns the state.  */
1665
1666 enum bb_dom_status
1667 determine_bb_domination_status (struct loop *loop, basic_block bb)
1668 {
1669   basic_block *bblocks;
1670   unsigned nblocks, i;
1671   bool bb_reachable = false;
1672   edge_iterator ei;
1673   edge e;
1674
1675   /* This function assumes BB is a successor of LOOP->header.
1676      If that is not the case return DOMST_NONDOMINATING which
1677      is always safe.  */
1678     {
1679       bool ok = false;
1680
1681       FOR_EACH_EDGE (e, ei, bb->preds)
1682         {
1683           if (e->src == loop->header)
1684             {
1685               ok = true;
1686               break;
1687             }
1688         }
1689
1690       if (!ok)
1691         return DOMST_NONDOMINATING;
1692     }
1693
1694   if (bb == loop->latch)
1695     return DOMST_DOMINATING;
1696
1697   /* Check that BB dominates LOOP->latch, and that it is back-reachable
1698      from it.  */
1699
1700   bblocks = XCNEWVEC (basic_block, loop->num_nodes);
1701   dbds_ce_stop = loop->header;
1702   nblocks = dfs_enumerate_from (loop->latch, 1, dbds_continue_enumeration_p,
1703                                 bblocks, loop->num_nodes, bb);
1704   for (i = 0; i < nblocks; i++)
1705     FOR_EACH_EDGE (e, ei, bblocks[i]->preds)
1706       {
1707         if (e->src == loop->header)
1708           {
1709             free (bblocks);
1710             return DOMST_NONDOMINATING;
1711           }
1712         if (e->src == bb)
1713           bb_reachable = true;
1714       }
1715
1716   free (bblocks);
1717   return (bb_reachable ? DOMST_DOMINATING : DOMST_LOOP_BROKEN);
1718 }
1719
1720 /* Thread jumps through the header of LOOP.  Returns true if cfg changes.
1721    If MAY_PEEL_LOOP_HEADERS is false, we avoid threading from entry edges
1722    to the inside of the loop.  */
1723
1724 static bool
1725 thread_through_loop_header (struct loop *loop, bool may_peel_loop_headers)
1726 {
1727   basic_block header = loop->header;
1728   edge e, tgt_edge, latch = loop_latch_edge (loop);
1729   edge_iterator ei;
1730   basic_block tgt_bb, atgt_bb;
1731   enum bb_dom_status domst;
1732
1733   /* We have already threaded through headers to exits, so all the threading
1734      requests now are to the inside of the loop.  We need to avoid creating
1735      irreducible regions (i.e., loops with more than one entry block), and
1736      also loop with several latch edges, or new subloops of the loop (although
1737      there are cases where it might be appropriate, it is difficult to decide,
1738      and doing it wrongly may confuse other optimizers).
1739
1740      We could handle more general cases here.  However, the intention is to
1741      preserve some information about the loop, which is impossible if its
1742      structure changes significantly, in a way that is not well understood.
1743      Thus we only handle few important special cases, in which also updating
1744      of the loop-carried information should be feasible:
1745
1746      1) Propagation of latch edge to a block that dominates the latch block
1747         of a loop.  This aims to handle the following idiom:
1748
1749         first = 1;
1750         while (1)
1751           {
1752             if (first)
1753               initialize;
1754             first = 0;
1755             body;
1756           }
1757
1758         After threading the latch edge, this becomes
1759
1760         first = 1;
1761         if (first)
1762           initialize;
1763         while (1)
1764           {
1765             first = 0;
1766             body;
1767           }
1768
1769         The original header of the loop is moved out of it, and we may thread
1770         the remaining edges through it without further constraints.
1771
1772      2) All entry edges are propagated to a single basic block that dominates
1773         the latch block of the loop.  This aims to handle the following idiom
1774         (normally created for "for" loops):
1775
1776         i = 0;
1777         while (1)
1778           {
1779             if (i >= 100)
1780               break;
1781             body;
1782             i++;
1783           }
1784
1785         This becomes
1786
1787         i = 0;
1788         while (1)
1789           {
1790             body;
1791             i++;
1792             if (i >= 100)
1793               break;
1794           }
1795      */
1796
1797   /* Threading through the header won't improve the code if the header has just
1798      one successor.  */
1799   if (single_succ_p (header))
1800     goto fail;
1801
1802   if (!may_peel_loop_headers && !redirection_block_p (loop->header))
1803     goto fail;
1804   else
1805     {
1806       tgt_bb = NULL;
1807       tgt_edge = NULL;
1808       FOR_EACH_EDGE (e, ei, header->preds)
1809         {
1810           if (!e->aux)
1811             {
1812               if (e == latch)
1813                 continue;
1814
1815               /* If latch is not threaded, and there is a header
1816                  edge that is not threaded, we would create loop
1817                  with multiple entries.  */
1818               goto fail;
1819             }
1820
1821           vec<jump_thread_edge *> *path = THREAD_PATH (e);
1822
1823           if ((*path)[1]->type == EDGE_COPY_SRC_JOINER_BLOCK)
1824             goto fail;
1825           tgt_edge = (*path)[1]->e;
1826           atgt_bb = tgt_edge->dest;
1827           if (!tgt_bb)
1828             tgt_bb = atgt_bb;
1829           /* Two targets of threading would make us create loop
1830              with multiple entries.  */
1831           else if (tgt_bb != atgt_bb)
1832             goto fail;
1833         }
1834
1835       if (!tgt_bb)
1836         {
1837           /* There are no threading requests.  */
1838           return false;
1839         }
1840
1841       /* Redirecting to empty loop latch is useless.  */
1842       if (tgt_bb == loop->latch
1843           && empty_block_p (loop->latch))
1844         goto fail;
1845     }
1846
1847   /* The target block must dominate the loop latch, otherwise we would be
1848      creating a subloop.  */
1849   domst = determine_bb_domination_status (loop, tgt_bb);
1850   if (domst == DOMST_NONDOMINATING)
1851     goto fail;
1852   if (domst == DOMST_LOOP_BROKEN)
1853     {
1854       /* If the loop ceased to exist, mark it as such, and thread through its
1855          original header.  */
1856       mark_loop_for_removal (loop);
1857       return thread_block (header, false);
1858     }
1859
1860   if (tgt_bb->loop_father->header == tgt_bb)
1861     {
1862       /* If the target of the threading is a header of a subloop, we need
1863          to create a preheader for it, so that the headers of the two loops
1864          do not merge.  */
1865       if (EDGE_COUNT (tgt_bb->preds) > 2)
1866         {
1867           tgt_bb = create_preheader (tgt_bb->loop_father, 0);
1868           gcc_assert (tgt_bb != NULL);
1869         }
1870       else
1871         tgt_bb = split_edge (tgt_edge);
1872     }
1873
1874   basic_block new_preheader;
1875
1876   /* Now consider the case entry edges are redirected to the new entry
1877      block.  Remember one entry edge, so that we can find the new
1878      preheader (its destination after threading).  */
1879   FOR_EACH_EDGE (e, ei, header->preds)
1880     {
1881       if (e->aux)
1882         break;
1883     }
1884
1885   /* The duplicate of the header is the new preheader of the loop.  Ensure
1886      that it is placed correctly in the loop hierarchy.  */
1887   set_loop_copy (loop, loop_outer (loop));
1888
1889   thread_block (header, false);
1890   set_loop_copy (loop, NULL);
1891   new_preheader = e->dest;
1892
1893   /* Create the new latch block.  This is always necessary, as the latch
1894      must have only a single successor, but the original header had at
1895      least two successors.  */
1896   loop->latch = NULL;
1897   mfb_kj_edge = single_succ_edge (new_preheader);
1898   loop->header = mfb_kj_edge->dest;
1899   latch = make_forwarder_block (tgt_bb, mfb_keep_just, NULL);
1900   loop->header = latch->dest;
1901   loop->latch = latch->src;
1902   return true;
1903
1904 fail:
1905   /* We failed to thread anything.  Cancel the requests.  */
1906   FOR_EACH_EDGE (e, ei, header->preds)
1907     {
1908       vec<jump_thread_edge *> *path = THREAD_PATH (e);
1909
1910       if (path)
1911         {
1912           delete_jump_thread_path (path);
1913           e->aux = NULL;
1914         }
1915     }
1916   return false;
1917 }
1918
1919 /* E1 and E2 are edges into the same basic block.  Return TRUE if the
1920    PHI arguments associated with those edges are equal or there are no
1921    PHI arguments, otherwise return FALSE.  */
1922
1923 static bool
1924 phi_args_equal_on_edges (edge e1, edge e2)
1925 {
1926   gphi_iterator gsi;
1927   int indx1 = e1->dest_idx;
1928   int indx2 = e2->dest_idx;
1929
1930   for (gsi = gsi_start_phis (e1->dest); !gsi_end_p (gsi); gsi_next (&gsi))
1931     {
1932       gphi *phi = gsi.phi ();
1933
1934       if (!operand_equal_p (gimple_phi_arg_def (phi, indx1),
1935                             gimple_phi_arg_def (phi, indx2), 0))
1936         return false;
1937     }
1938   return true;
1939 }
1940
1941 /* Walk through the registered jump threads and convert them into a
1942    form convenient for this pass.
1943
1944    Any block which has incoming edges threaded to outgoing edges
1945    will have its entry in THREADED_BLOCK set.
1946
1947    Any threaded edge will have its new outgoing edge stored in the
1948    original edge's AUX field.
1949
1950    This form avoids the need to walk all the edges in the CFG to
1951    discover blocks which need processing and avoids unnecessary
1952    hash table lookups to map from threaded edge to new target.  */
1953
1954 static void
1955 mark_threaded_blocks (bitmap threaded_blocks)
1956 {
1957   unsigned int i;
1958   bitmap_iterator bi;
1959   auto_bitmap tmp;
1960   basic_block bb;
1961   edge e;
1962   edge_iterator ei;
1963
1964   /* It is possible to have jump threads in which one is a subpath
1965      of the other.  ie, (A, B), (B, C), (C, D) where B is a joiner
1966      block and (B, C), (C, D) where no joiner block exists.
1967
1968      When this occurs ignore the jump thread request with the joiner
1969      block.  It's totally subsumed by the simpler jump thread request.
1970
1971      This results in less block copying, simpler CFGs.  More importantly,
1972      when we duplicate the joiner block, B, in this case we will create
1973      a new threading opportunity that we wouldn't be able to optimize
1974      until the next jump threading iteration.
1975
1976      So first convert the jump thread requests which do not require a
1977      joiner block.  */
1978   for (i = 0; i < paths.length (); i++)
1979     {
1980       vec<jump_thread_edge *> *path = paths[i];
1981
1982       if ((*path)[1]->type != EDGE_COPY_SRC_JOINER_BLOCK)
1983         {
1984           edge e = (*path)[0]->e;
1985           e->aux = (void *)path;
1986           bitmap_set_bit (tmp, e->dest->index);
1987         }
1988     }
1989
1990   /* Now iterate again, converting cases where we want to thread
1991      through a joiner block, but only if no other edge on the path
1992      already has a jump thread attached to it.  We do this in two passes,
1993      to avoid situations where the order in the paths vec can hide overlapping
1994      threads (the path is recorded on the incoming edge, so we would miss
1995      cases where the second path starts at a downstream edge on the same
1996      path).  First record all joiner paths, deleting any in the unexpected
1997      case where there is already a path for that incoming edge.  */
1998   for (i = 0; i < paths.length ();)
1999     {
2000       vec<jump_thread_edge *> *path = paths[i];
2001
2002       if ((*path)[1]->type == EDGE_COPY_SRC_JOINER_BLOCK)
2003         {
2004           /* Attach the path to the starting edge if none is yet recorded.  */
2005           if ((*path)[0]->e->aux == NULL)
2006             {
2007               (*path)[0]->e->aux = path;
2008               i++;
2009             }
2010           else
2011             {
2012               paths.unordered_remove (i);
2013               if (dump_file && (dump_flags & TDF_DETAILS))
2014                 dump_jump_thread_path (dump_file, *path, false);
2015               delete_jump_thread_path (path);
2016             }
2017         }
2018       else
2019         {
2020           i++;
2021         }
2022     }
2023
2024   /* Second, look for paths that have any other jump thread attached to
2025      them, and either finish converting them or cancel them.  */
2026   for (i = 0; i < paths.length ();)
2027     {
2028       vec<jump_thread_edge *> *path = paths[i];
2029       edge e = (*path)[0]->e;
2030
2031       if ((*path)[1]->type == EDGE_COPY_SRC_JOINER_BLOCK && e->aux == path)
2032         {
2033           unsigned int j;
2034           for (j = 1; j < path->length (); j++)
2035             if ((*path)[j]->e->aux != NULL)
2036               break;
2037
2038           /* If we iterated through the entire path without exiting the loop,
2039              then we are good to go, record it.  */
2040           if (j == path->length ())
2041             {
2042               bitmap_set_bit (tmp, e->dest->index);
2043               i++;
2044             }
2045           else
2046             {
2047               e->aux = NULL;
2048               paths.unordered_remove (i);
2049               if (dump_file && (dump_flags & TDF_DETAILS))
2050                 dump_jump_thread_path (dump_file, *path, false);
2051               delete_jump_thread_path (path);
2052             }
2053         }
2054       else
2055         {
2056           i++;
2057         }
2058     }
2059
2060   /* If optimizing for size, only thread through block if we don't have
2061      to duplicate it or it's an otherwise empty redirection block.  */
2062   if (optimize_function_for_size_p (cfun))
2063     {
2064       EXECUTE_IF_SET_IN_BITMAP (tmp, 0, i, bi)
2065         {
2066           bb = BASIC_BLOCK_FOR_FN (cfun, i);
2067           if (EDGE_COUNT (bb->preds) > 1
2068               && !redirection_block_p (bb))
2069             {
2070               FOR_EACH_EDGE (e, ei, bb->preds)
2071                 {
2072                   if (e->aux)
2073                     {
2074                       vec<jump_thread_edge *> *path = THREAD_PATH (e);
2075                       delete_jump_thread_path (path);
2076                       e->aux = NULL;
2077                     }
2078                 }
2079             }
2080           else
2081             bitmap_set_bit (threaded_blocks, i);
2082         }
2083     }
2084   else
2085     bitmap_copy (threaded_blocks, tmp);
2086
2087   /* If we have a joiner block (J) which has two successors S1 and S2 and
2088      we are threading though S1 and the final destination of the thread
2089      is S2, then we must verify that any PHI nodes in S2 have the same
2090      PHI arguments for the edge J->S2 and J->S1->...->S2.
2091
2092      We used to detect this prior to registering the jump thread, but
2093      that prohibits propagation of edge equivalences into non-dominated
2094      PHI nodes as the equivalency test might occur before propagation.
2095
2096      This must also occur after we truncate any jump threading paths
2097      as this scenario may only show up after truncation.
2098
2099      This works for now, but will need improvement as part of the FSA
2100      optimization.
2101
2102      Note since we've moved the thread request data to the edges,
2103      we have to iterate on those rather than the threaded_edges vector.  */
2104   EXECUTE_IF_SET_IN_BITMAP (tmp, 0, i, bi)
2105     {
2106       bb = BASIC_BLOCK_FOR_FN (cfun, i);
2107       FOR_EACH_EDGE (e, ei, bb->preds)
2108         {
2109           if (e->aux)
2110             {
2111               vec<jump_thread_edge *> *path = THREAD_PATH (e);
2112               bool have_joiner = ((*path)[1]->type == EDGE_COPY_SRC_JOINER_BLOCK);
2113
2114               if (have_joiner)
2115                 {
2116                   basic_block joiner = e->dest;
2117                   edge final_edge = path->last ()->e;
2118                   basic_block final_dest = final_edge->dest;
2119                   edge e2 = find_edge (joiner, final_dest);
2120
2121                   if (e2 && !phi_args_equal_on_edges (e2, final_edge))
2122                     {
2123                       delete_jump_thread_path (path);
2124                       e->aux = NULL;
2125                     }
2126                 }
2127             }
2128         }
2129     }
2130
2131   /* Look for jump threading paths which cross multiple loop headers.
2132
2133      The code to thread through loop headers will change the CFG in ways
2134      that invalidate the cached loop iteration information.  So we must
2135      detect that case and wipe the cached information.  */
2136   EXECUTE_IF_SET_IN_BITMAP (tmp, 0, i, bi)
2137     {
2138       basic_block bb = BASIC_BLOCK_FOR_FN (cfun, i);
2139       FOR_EACH_EDGE (e, ei, bb->preds)
2140         {
2141           if (e->aux)
2142             {
2143               vec<jump_thread_edge *> *path = THREAD_PATH (e);
2144
2145               for (unsigned int i = 0, crossed_headers = 0;
2146                    i < path->length ();
2147                    i++)
2148                 {
2149                   basic_block dest = (*path)[i]->e->dest;
2150                   basic_block src = (*path)[i]->e->src;
2151                   /* If we enter a loop.  */
2152                   if (flow_loop_nested_p (src->loop_father, dest->loop_father))
2153                     ++crossed_headers;
2154                   /* If we step from a block outside an irreducible region
2155                      to a block inside an irreducible region, then we have
2156                      crossed into a loop.  */
2157                   else if (! (src->flags & BB_IRREDUCIBLE_LOOP)
2158                            && (dest->flags & BB_IRREDUCIBLE_LOOP))
2159                       ++crossed_headers;
2160                   if (crossed_headers > 1)
2161                     {
2162                       vect_free_loop_info_assumptions
2163                         ((*path)[path->length () - 1]->e->dest->loop_father);
2164                       break;
2165                     }
2166                 }
2167             }
2168         }
2169     }
2170 }
2171
2172
2173 /* Verify that the REGION is a valid jump thread.  A jump thread is a special
2174    case of SEME Single Entry Multiple Exits region in which all nodes in the
2175    REGION have exactly one incoming edge.  The only exception is the first block
2176    that may not have been connected to the rest of the cfg yet.  */
2177
2178 DEBUG_FUNCTION void
2179 verify_jump_thread (basic_block *region, unsigned n_region)
2180 {
2181   for (unsigned i = 0; i < n_region; i++)
2182     gcc_assert (EDGE_COUNT (region[i]->preds) <= 1);
2183 }
2184
2185 /* Return true when BB is one of the first N items in BBS.  */
2186
2187 static inline bool
2188 bb_in_bbs (basic_block bb, basic_block *bbs, int n)
2189 {
2190   for (int i = 0; i < n; i++)
2191     if (bb == bbs[i])
2192       return true;
2193
2194   return false;
2195 }
2196
2197 /* Duplicates a jump-thread path of N_REGION basic blocks.
2198    The ENTRY edge is redirected to the duplicate of the region.
2199
2200    Remove the last conditional statement in the last basic block in the REGION,
2201    and create a single fallthru edge pointing to the same destination as the
2202    EXIT edge.
2203
2204    The new basic blocks are stored to REGION_COPY in the same order as they had
2205    in REGION, provided that REGION_COPY is not NULL.
2206
2207    Returns false if it is unable to copy the region, true otherwise.  */
2208
2209 static bool
2210 duplicate_thread_path (edge entry, edge exit,
2211                        basic_block *region, unsigned n_region,
2212                        basic_block *region_copy)
2213 {
2214   unsigned i;
2215   bool free_region_copy = false;
2216   struct loop *loop = entry->dest->loop_father;
2217   edge exit_copy;
2218   edge redirected;
2219   int curr_freq;
2220   profile_count curr_count;
2221
2222   if (!can_copy_bbs_p (region, n_region))
2223     return false;
2224
2225   /* Some sanity checking.  Note that we do not check for all possible
2226      missuses of the functions.  I.e. if you ask to copy something weird,
2227      it will work, but the state of structures probably will not be
2228      correct.  */
2229   for (i = 0; i < n_region; i++)
2230     {
2231       /* We do not handle subloops, i.e. all the blocks must belong to the
2232          same loop.  */
2233       if (region[i]->loop_father != loop)
2234         return false;
2235     }
2236
2237   initialize_original_copy_tables ();
2238
2239   set_loop_copy (loop, loop);
2240
2241   if (!region_copy)
2242     {
2243       region_copy = XNEWVEC (basic_block, n_region);
2244       free_region_copy = true;
2245     }
2246
2247   copy_bbs (region, n_region, region_copy, &exit, 1, &exit_copy, loop,
2248             split_edge_bb_loc (entry), false);
2249
2250   /* Fix up: copy_bbs redirects all edges pointing to copied blocks.  The
2251      following code ensures that all the edges exiting the jump-thread path are
2252      redirected back to the original code: these edges are exceptions
2253      invalidating the property that is propagated by executing all the blocks of
2254      the jump-thread path in order.  */
2255
2256   curr_count = entry->count;
2257   curr_freq = EDGE_FREQUENCY (entry);
2258
2259   for (i = 0; i < n_region; i++)
2260     {
2261       edge e;
2262       edge_iterator ei;
2263       basic_block bb = region_copy[i];
2264
2265       /* Watch inconsistent profile.  */
2266       if (curr_count > region[i]->count)
2267         curr_count = region[i]->count;
2268       if (curr_freq > region[i]->frequency)
2269         curr_freq = region[i]->frequency;
2270       /* Scale current BB.  */
2271       if (region[i]->count > 0 && curr_count.initialized_p ())
2272         {
2273           /* In the middle of the path we only scale the frequencies.
2274              In last BB we need to update probabilities of outgoing edges
2275              because we know which one is taken at the threaded path.  */
2276           if (i + 1 != n_region)
2277             scale_bbs_frequencies_profile_count (region + i, 1,
2278                                                  region[i]->count - curr_count,
2279                                                  region[i]->count);
2280           else
2281             update_bb_profile_for_threading (region[i],
2282                                              curr_freq, curr_count,
2283                                              exit);
2284           scale_bbs_frequencies_profile_count (region_copy + i, 1, curr_count,
2285                                                region_copy[i]->count);
2286         }
2287       else if (region[i]->frequency)
2288         {
2289           if (i + 1 != n_region)
2290             scale_bbs_frequencies_int (region + i, 1,
2291                                        region[i]->frequency - curr_freq,
2292                                        region[i]->frequency);
2293           else
2294             update_bb_profile_for_threading (region[i],
2295                                              curr_freq, curr_count,
2296                                              exit);
2297           scale_bbs_frequencies_int (region_copy + i, 1, curr_freq,
2298                                      region_copy[i]->frequency);
2299         }
2300
2301       if (single_succ_p (bb))
2302         {
2303           /* Make sure the successor is the next node in the path.  */
2304           gcc_assert (i + 1 == n_region
2305                       || region_copy[i + 1] == single_succ_edge (bb)->dest);
2306           if (i + 1 != n_region)
2307             {
2308               curr_freq = EDGE_FREQUENCY (single_succ_edge (bb));
2309               curr_count = single_succ_edge (bb)->count;
2310             }
2311           continue;
2312         }
2313
2314       /* Special case the last block on the path: make sure that it does not
2315          jump back on the copied path, including back to itself.  */
2316       if (i + 1 == n_region)
2317         {
2318           FOR_EACH_EDGE (e, ei, bb->succs)
2319             if (bb_in_bbs (e->dest, region_copy, n_region))
2320               {
2321                 basic_block orig = get_bb_original (e->dest);
2322                 if (orig)
2323                   redirect_edge_and_branch_force (e, orig);
2324               }
2325           continue;
2326         }
2327
2328       /* Redirect all other edges jumping to non-adjacent blocks back to the
2329          original code.  */
2330       FOR_EACH_EDGE (e, ei, bb->succs)
2331         if (region_copy[i + 1] != e->dest)
2332           {
2333             basic_block orig = get_bb_original (e->dest);
2334             if (orig)
2335               redirect_edge_and_branch_force (e, orig);
2336           }
2337         else
2338           {
2339             curr_freq = EDGE_FREQUENCY (e);
2340             curr_count = e->count;
2341           }
2342     }
2343
2344
2345   if (flag_checking)
2346     verify_jump_thread (region_copy, n_region);
2347
2348   /* Remove the last branch in the jump thread path.  */
2349   remove_ctrl_stmt_and_useless_edges (region_copy[n_region - 1], exit->dest);
2350
2351   /* And fixup the flags on the single remaining edge.  */
2352   edge fix_e = find_edge (region_copy[n_region - 1], exit->dest);
2353   fix_e->flags &= ~(EDGE_TRUE_VALUE | EDGE_FALSE_VALUE | EDGE_ABNORMAL);
2354   fix_e->flags |= EDGE_FALLTHRU;
2355
2356   edge e = make_edge (region_copy[n_region - 1], exit->dest, EDGE_FALLTHRU);
2357
2358   if (e)
2359     {
2360       rescan_loop_exit (e, true, false);
2361       e->probability = REG_BR_PROB_BASE;
2362       e->count = region_copy[n_region - 1]->count;
2363     }
2364
2365   /* Redirect the entry and add the phi node arguments.  */
2366   if (entry->dest == loop->header)
2367     mark_loop_for_removal (loop);
2368   redirected = redirect_edge_and_branch (entry, get_bb_copy (entry->dest));
2369   gcc_assert (redirected != NULL);
2370   flush_pending_stmts (entry);
2371
2372   /* Add the other PHI node arguments.  */
2373   add_phi_args_after_copy (region_copy, n_region, NULL);
2374
2375   if (free_region_copy)
2376     free (region_copy);
2377
2378   free_original_copy_tables ();
2379   return true;
2380 }
2381
2382 /* Return true when PATH is a valid jump-thread path.  */
2383
2384 static bool
2385 valid_jump_thread_path (vec<jump_thread_edge *> *path)
2386 {
2387   unsigned len = path->length ();
2388
2389   /* Check that the path is connected.  */
2390   for (unsigned int j = 0; j < len - 1; j++)
2391     {
2392       edge e = (*path)[j]->e;
2393       if (e->dest != (*path)[j+1]->e->src)
2394         return false;
2395     }
2396   return true;
2397 }
2398
2399 /* Remove any queued jump threads that include edge E.
2400
2401    We don't actually remove them here, just record the edges into ax
2402    hash table.  That way we can do the search once per iteration of
2403    DOM/VRP rather than for every case where DOM optimizes away a COND_EXPR.  */
2404
2405 void
2406 remove_jump_threads_including (edge_def *e)
2407 {
2408   if (!paths.exists ())
2409     return;
2410
2411   if (!removed_edges)
2412     removed_edges = new hash_table<struct removed_edges> (17);
2413
2414   edge *slot = removed_edges->find_slot (e, INSERT);
2415   *slot = e;
2416 }
2417
2418 /* Walk through all blocks and thread incoming edges to the appropriate
2419    outgoing edge for each edge pair recorded in THREADED_EDGES.
2420
2421    It is the caller's responsibility to fix the dominance information
2422    and rewrite duplicated SSA_NAMEs back into SSA form.
2423
2424    If MAY_PEEL_LOOP_HEADERS is false, we avoid threading edges through
2425    loop headers if it does not simplify the loop.
2426
2427    Returns true if one or more edges were threaded, false otherwise.  */
2428
2429 bool
2430 thread_through_all_blocks (bool may_peel_loop_headers)
2431 {
2432   bool retval = false;
2433   unsigned int i;
2434   bitmap_iterator bi;
2435   struct loop *loop;
2436   auto_bitmap threaded_blocks;
2437
2438   if (!paths.exists ())
2439     {
2440       retval = false;
2441       goto out;
2442     }
2443
2444   memset (&thread_stats, 0, sizeof (thread_stats));
2445
2446   /* Remove any paths that referenced removed edges.  */
2447   if (removed_edges)
2448     for (i = 0; i < paths.length (); )
2449       {
2450         unsigned int j;
2451         vec<jump_thread_edge *> *path = paths[i];
2452
2453         for (j = 0; j < path->length (); j++)
2454           {
2455             edge e = (*path)[j]->e;
2456             if (removed_edges->find_slot (e, NO_INSERT))
2457               break;
2458           }
2459
2460         if (j != path->length ())
2461           {
2462             delete_jump_thread_path (path);
2463             paths.unordered_remove (i);
2464             continue;
2465           }
2466         i++;
2467       }
2468
2469   /* Jump-thread all FSM threads before other jump-threads.  */
2470   for (i = 0; i < paths.length ();)
2471     {
2472       vec<jump_thread_edge *> *path = paths[i];
2473       edge entry = (*path)[0]->e;
2474
2475       /* Only code-generate FSM jump-threads in this loop.  */
2476       if ((*path)[0]->type != EDGE_FSM_THREAD)
2477         {
2478           i++;
2479           continue;
2480         }
2481
2482       /* Do not jump-thread twice from the same block.  */
2483       if (bitmap_bit_p (threaded_blocks, entry->src->index)
2484           /* We may not want to realize this jump thread path
2485              for various reasons.  So check it first.  */
2486           || !valid_jump_thread_path (path))
2487         {
2488           /* Remove invalid FSM jump-thread paths.  */
2489           delete_jump_thread_path (path);
2490           paths.unordered_remove (i);
2491           continue;
2492         }
2493
2494       unsigned len = path->length ();
2495       edge exit = (*path)[len - 1]->e;
2496       basic_block *region = XNEWVEC (basic_block, len - 1);
2497
2498       for (unsigned int j = 0; j < len - 1; j++)
2499         region[j] = (*path)[j]->e->dest;
2500
2501       if (duplicate_thread_path (entry, exit, region, len - 1, NULL))
2502         {
2503           /* We do not update dominance info.  */
2504           free_dominance_info (CDI_DOMINATORS);
2505           bitmap_set_bit (threaded_blocks, entry->src->index);
2506           retval = true;
2507           thread_stats.num_threaded_edges++;
2508         }
2509
2510       delete_jump_thread_path (path);
2511       paths.unordered_remove (i);
2512       free (region);
2513     }
2514
2515   /* Remove from PATHS all the jump-threads starting with an edge already
2516      jump-threaded.  */
2517   for (i = 0; i < paths.length ();)
2518     {
2519       vec<jump_thread_edge *> *path = paths[i];
2520       edge entry = (*path)[0]->e;
2521
2522       /* Do not jump-thread twice from the same block.  */
2523       if (bitmap_bit_p (threaded_blocks, entry->src->index))
2524         {
2525           delete_jump_thread_path (path);
2526           paths.unordered_remove (i);
2527         }
2528       else
2529         i++;
2530     }
2531
2532   bitmap_clear (threaded_blocks);
2533
2534   mark_threaded_blocks (threaded_blocks);
2535
2536   initialize_original_copy_tables ();
2537
2538   /* First perform the threading requests that do not affect
2539      loop structure.  */
2540   EXECUTE_IF_SET_IN_BITMAP (threaded_blocks, 0, i, bi)
2541     {
2542       basic_block bb = BASIC_BLOCK_FOR_FN (cfun, i);
2543
2544       if (EDGE_COUNT (bb->preds) > 0)
2545         retval |= thread_block (bb, true);
2546     }
2547
2548   /* Then perform the threading through loop headers.  We start with the
2549      innermost loop, so that the changes in cfg we perform won't affect
2550      further threading.  */
2551   FOR_EACH_LOOP (loop, LI_FROM_INNERMOST)
2552     {
2553       if (!loop->header
2554           || !bitmap_bit_p (threaded_blocks, loop->header->index))
2555         continue;
2556
2557       retval |= thread_through_loop_header (loop, may_peel_loop_headers);
2558     }
2559
2560   /* All jump threading paths should have been resolved at this
2561      point.  Verify that is the case.  */
2562   basic_block bb;
2563   FOR_EACH_BB_FN (bb, cfun)
2564     {
2565       edge_iterator ei;
2566       edge e;
2567       FOR_EACH_EDGE (e, ei, bb->preds)
2568         gcc_assert (e->aux == NULL);
2569     }
2570
2571   statistics_counter_event (cfun, "Jumps threaded",
2572                             thread_stats.num_threaded_edges);
2573
2574   free_original_copy_tables ();
2575
2576   paths.release ();
2577
2578   if (retval)
2579     loops_state_set (LOOPS_NEED_FIXUP);
2580
2581  out:
2582   delete removed_edges;
2583   removed_edges = NULL;
2584   return retval;
2585 }
2586
2587 /* Delete the jump threading path PATH.  We have to explcitly delete
2588    each entry in the vector, then the container.  */
2589
2590 void
2591 delete_jump_thread_path (vec<jump_thread_edge *> *path)
2592 {
2593   for (unsigned int i = 0; i < path->length (); i++)
2594     delete (*path)[i];
2595   path->release();
2596   delete path;
2597 }
2598
2599 /* Register a jump threading opportunity.  We queue up all the jump
2600    threading opportunities discovered by a pass and update the CFG
2601    and SSA form all at once.
2602
2603    E is the edge we can thread, E2 is the new target edge, i.e., we
2604    are effectively recording that E->dest can be changed to E2->dest
2605    after fixing the SSA graph.  */
2606
2607 void
2608 register_jump_thread (vec<jump_thread_edge *> *path)
2609 {
2610   if (!dbg_cnt (registered_jump_thread))
2611     {
2612       delete_jump_thread_path (path);
2613       return;
2614     }
2615
2616   /* First make sure there are no NULL outgoing edges on the jump threading
2617      path.  That can happen for jumping to a constant address.  */
2618   for (unsigned int i = 0; i < path->length (); i++)
2619     {
2620       if ((*path)[i]->e == NULL)
2621         {
2622           if (dump_file && (dump_flags & TDF_DETAILS))
2623             {
2624               fprintf (dump_file,
2625                        "Found NULL edge in jump threading path.  Cancelling jump thread:\n");
2626               dump_jump_thread_path (dump_file, *path, false);
2627             }
2628
2629           delete_jump_thread_path (path);
2630           return;
2631         }
2632
2633       /* Only the FSM threader is allowed to thread across
2634          backedges in the CFG.  */
2635       if (flag_checking
2636           && (*path)[0]->type != EDGE_FSM_THREAD)
2637         gcc_assert (((*path)[i]->e->flags & EDGE_DFS_BACK) == 0);
2638     }
2639
2640   if (dump_file && (dump_flags & TDF_DETAILS))
2641     dump_jump_thread_path (dump_file, *path, true);
2642
2643   if (!paths.exists ())
2644     paths.create (5);
2645
2646   paths.safe_push (path);
2647 }