gcc/tree-ssa-loop-split.cc

   1 /* Loop splitting.
   2    Copyright (C) 2015-2023 Free Software Foundation, Inc.
   3
   4 This file is part of GCC.
   5
   6 GCC is free software; you can redistribute it and/or modify it
   7 under the terms of the GNU General Public License as published by the
   8 Free Software Foundation; either version 3, or (at your option) any
   9 later version.
  10
  11 GCC is distributed in the hope that it will be useful, but WITHOUT
  12 ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  13 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  14 for more details.
  15
  16 You should have received a copy of the GNU General Public License
  17 along with GCC; see the file COPYING3.  If not see
  18 <http://www.gnu.org/licenses/>.  */
  19
  20 #include "config.h"
  21 #include "system.h"
  22 #include "coretypes.h"
  23 #include "backend.h"
  24 #include "tree.h"
  25 #include "gimple.h"
  26 #include "tree-pass.h"
  27 #include "ssa.h"
  28 #include "fold-const.h"
  29 #include "tree-cfg.h"
  30 #include "tree-ssa.h"
  31 #include "tree-ssa-loop-niter.h"
  32 #include "tree-ssa-loop.h"
  33 #include "tree-ssa-loop-manip.h"
  34 #include "tree-into-ssa.h"
  35 #include "tree-inline.h"
  36 #include "tree-cfgcleanup.h"
  37 #include "cfgloop.h"
  38 #include "tree-scalar-evolution.h"
  39 #include "gimple-iterator.h"
  40 #include "gimple-pretty-print.h"
  41 #include "cfghooks.h"
  42 #include "gimple-fold.h"
  43 #include "gimplify-me.h"
  44
  45 /* This file implements two kinds of loop splitting.
  46
  47    One transformation of loops like:
  48
  49    for (i = 0; i < 100; i++)
  50      {
  51        if (i < 50)
  52          A;
  53        else
  54          B;
  55      }
  56
  57    into:
  58
  59    for (i = 0; i < 50; i++)
  60      {
  61        A;
  62      }
  63    for (; i < 100; i++)
  64      {
  65        B;
  66      }
  67
  68    */
  69
  70 /* Return true when BB inside LOOP is a potential iteration space
  71    split point, i.e. ends with a condition like "IV < comp", which
  72    is true on one side of the iteration space and false on the other,
  73    and the split point can be computed.  If so, also return the border
  74    point in *BORDER and the comparison induction variable in IV.  */
  75
  76 static tree
  77 split_at_bb_p (class loop *loop, basic_block bb, tree *border, affine_iv *iv)
  78 {
  79   gimple *last;
  80   gcond *stmt;
  81   affine_iv iv2;
  82
  83   /* BB must end in a simple conditional jump.  */
  84   last = last_stmt (bb);
  85   if (!last || gimple_code (last) != GIMPLE_COND)
  86     return NULL_TREE;
  87   stmt = as_a <gcond *> (last);
  88
  89   enum tree_code code = gimple_cond_code (stmt);
  90
  91   /* Only handle relational comparisons, for equality and non-equality
  92      we'd have to split the loop into two loops and a middle statement.  */
  93   switch (code)
  94     {
  95       case LT_EXPR:
  96       case LE_EXPR:
  97       case GT_EXPR:
  98       case GE_EXPR:
  99         break;
 100       default:
 101         return NULL_TREE;
 102     }
 103
 104   if (loop_exits_from_bb_p (loop, bb))
 105     return NULL_TREE;
 106
 107   tree op0 = gimple_cond_lhs (stmt);
 108   tree op1 = gimple_cond_rhs (stmt);
 109   class loop *useloop = loop_containing_stmt (stmt);
 110
 111   if (!simple_iv (loop, useloop, op0, iv, false))
 112     return NULL_TREE;
 113   if (!simple_iv (loop, useloop, op1, &iv2, false))
 114     return NULL_TREE;
 115
 116   /* Make it so that the first argument of the condition is
 117      the looping one.  */
 118   if (!integer_zerop (iv2.step))
 119     {
 120       std::swap (op0, op1);
 121       std::swap (*iv, iv2);
 122       code = swap_tree_comparison (code);
 123       gimple_cond_set_condition (stmt, code, op0, op1);
 124       update_stmt (stmt);
 125     }
 126   else if (integer_zerop (iv->step))
 127     return NULL_TREE;
 128   if (!integer_zerop (iv2.step))
 129     return NULL_TREE;
 130   if (!iv->no_overflow)
 131     return NULL_TREE;
 132
 133   if (dump_file && (dump_flags & TDF_DETAILS))
 134     {
 135       fprintf (dump_file, "Found potential split point: ");
 136       print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
 137       fprintf (dump_file, " { ");
 138       print_generic_expr (dump_file, iv->base, TDF_SLIM);
 139       fprintf (dump_file, " + I*");
 140       print_generic_expr (dump_file, iv->step, TDF_SLIM);
 141       fprintf (dump_file, " } %s ", get_tree_code_name (code));
 142       print_generic_expr (dump_file, iv2.base, TDF_SLIM);
 143       fprintf (dump_file, "\n");
 144     }
 145
 146   *border = iv2.base;
 147   return op0;
 148 }
 149
 150 /* Given a GUARD conditional stmt inside LOOP, which we want to make always
 151    true or false depending on INITIAL_TRUE, and adjusted values NEXTVAL
 152    (a post-increment IV) and NEWBOUND (the comparator) adjust the loop
 153    exit test statement to loop back only if the GUARD statement will
 154    also be true/false in the next iteration.  */
 155
 156 static void
 157 patch_loop_exit (class loop *loop, gcond *guard, tree nextval, tree newbound,
 158                  bool initial_true)
 159 {
 160   edge exit = single_exit (loop);
 161   gcond *stmt = as_a <gcond *> (last_stmt (exit->src));
 162   gimple_cond_set_condition (stmt, gimple_cond_code (guard),
 163                              nextval, newbound);
 164   update_stmt (stmt);
 165
 166   edge stay = EDGE_SUCC (exit->src, EDGE_SUCC (exit->src, 0) == exit);
 167
 168   exit->flags &= ~(EDGE_TRUE_VALUE | EDGE_FALSE_VALUE);
 169   stay->flags &= ~(EDGE_TRUE_VALUE | EDGE_FALSE_VALUE);
 170
 171   if (initial_true)
 172     {
 173       exit->flags |= EDGE_FALSE_VALUE;
 174       stay->flags |= EDGE_TRUE_VALUE;
 175     }
 176   else
 177     {
 178       exit->flags |= EDGE_TRUE_VALUE;
 179       stay->flags |= EDGE_FALSE_VALUE;
 180     }
 181 }
 182
 183 /* Give an induction variable GUARD_IV, and its affine descriptor IV,
 184    find the loop phi node in LOOP defining it directly, or create
 185    such phi node.  Return that phi node.  */
 186
 187 static gphi *
 188 find_or_create_guard_phi (class loop *loop, tree guard_iv, affine_iv * /*iv*/)
 189 {
 190   gimple *def = SSA_NAME_DEF_STMT (guard_iv);
 191   gphi *phi;
 192   if ((phi = dyn_cast <gphi *> (def))
 193       && gimple_bb (phi) == loop->header)
 194     return phi;
 195
 196   /* XXX Create the PHI instead.  */
 197   return NULL;
 198 }
 199
 200 /* Returns true if the exit values of all loop phi nodes can be
 201    determined easily (i.e. that connect_loop_phis can determine them).  */
 202
 203 static bool
 204 easy_exit_values (class loop *loop)
 205 {
 206   edge exit = single_exit (loop);
 207   edge latch = loop_latch_edge (loop);
 208   gphi_iterator psi;
 209
 210   /* Currently we regard the exit values as easy if they are the same
 211      as the value over the backedge.  Which is the case if the definition
 212      of the backedge value dominates the exit edge.  */
 213   for (psi = gsi_start_phis (loop->header); !gsi_end_p (psi); gsi_next (&psi))
 214     {
 215       gphi *phi = psi.phi ();
 216       tree next = PHI_ARG_DEF_FROM_EDGE (phi, latch);
 217       basic_block bb;
 218       if (TREE_CODE (next) == SSA_NAME
 219           && (bb = gimple_bb (SSA_NAME_DEF_STMT (next)))
 220           && !dominated_by_p (CDI_DOMINATORS, exit->src, bb))
 221         return false;
 222     }
 223
 224   return true;
 225 }
 226
 227 /* This function updates the SSA form after connect_loops made a new
 228    edge NEW_E leading from LOOP1 exit to LOOP2 (via in intermediate
 229    conditional).  I.e. the second loop can now be entered either
 230    via the original entry or via NEW_E, so the entry values of LOOP2
 231    phi nodes are either the original ones or those at the exit
 232    of LOOP1.  Insert new phi nodes in LOOP2 pre-header reflecting
 233    this.  The loops need to fulfill easy_exit_values().  */
 234
 235 static void
 236 connect_loop_phis (class loop *loop1, class loop *loop2, edge new_e)
 237 {
 238   basic_block rest = loop_preheader_edge (loop2)->src;
 239   gcc_assert (new_e->dest == rest);
 240   edge skip_first = EDGE_PRED (rest, EDGE_PRED (rest, 0) == new_e);
 241
 242   edge firste = loop_preheader_edge (loop1);
 243   edge seconde = loop_preheader_edge (loop2);
 244   edge firstn = loop_latch_edge (loop1);
 245   gphi_iterator psi_first, psi_second;
 246   for (psi_first = gsi_start_phis (loop1->header),
 247        psi_second = gsi_start_phis (loop2->header);
 248        !gsi_end_p (psi_first);
 249        gsi_next (&psi_first), gsi_next (&psi_second))
 250     {
 251       tree init, next, new_init;
 252       use_operand_p op;
 253       gphi *phi_first = psi_first.phi ();
 254       gphi *phi_second = psi_second.phi ();
 255
 256       init = PHI_ARG_DEF_FROM_EDGE (phi_first, firste);
 257       next = PHI_ARG_DEF_FROM_EDGE (phi_first, firstn);
 258       op = PHI_ARG_DEF_PTR_FROM_EDGE (phi_second, seconde);
 259       gcc_assert (operand_equal_for_phi_arg_p (init, USE_FROM_PTR (op)));
 260
 261       /* Prefer using original variable as a base for the new ssa name.
 262          This is necessary for virtual ops, and useful in order to avoid
 263          losing debug info for real ops.  */
 264       if (TREE_CODE (next) == SSA_NAME
 265           && useless_type_conversion_p (TREE_TYPE (next),
 266                                         TREE_TYPE (init)))
 267         new_init = copy_ssa_name (next);
 268       else if (TREE_CODE (init) == SSA_NAME
 269                && useless_type_conversion_p (TREE_TYPE (init),
 270                                              TREE_TYPE (next)))
 271         new_init = copy_ssa_name (init);
 272       else if (useless_type_conversion_p (TREE_TYPE (next),
 273                                           TREE_TYPE (init)))
 274         new_init = make_temp_ssa_name (TREE_TYPE (next), NULL,
 275                                        "unrinittmp");
 276       else
 277         new_init = make_temp_ssa_name (TREE_TYPE (init), NULL,
 278                                        "unrinittmp");
 279
 280       gphi * newphi = create_phi_node (new_init, rest);
 281       add_phi_arg (newphi, init, skip_first, UNKNOWN_LOCATION);
 282       add_phi_arg (newphi, next, new_e, UNKNOWN_LOCATION);
 283       SET_USE (op, new_init);
 284     }
 285 }
 286
 287 /* The two loops LOOP1 and LOOP2 were just created by loop versioning,
 288    they are still equivalent and placed in two arms of a diamond, like so:
 289
 290                .------if (cond)------.
 291                v                     v
 292              pre1                   pre2
 293               |                      |
 294         .--->h1                     h2<----.
 295         |     |                      |     |
 296         |    ex1---.            .---ex2    |
 297         |    /     |            |     \    |
 298         '---l1     X            |     l2---'
 299                    |            |
 300                    |            |
 301                    '--->join<---'
 302
 303    This function transforms the program such that LOOP1 is conditionally
 304    falling through to LOOP2, or skipping it.  This is done by splitting
 305    the ex1->join edge at X in the diagram above, and inserting a condition
 306    whose one arm goes to pre2, resulting in this situation:
 307
 308                .------if (cond)------.
 309                v                     v
 310              pre1       .---------->pre2
 311               |         |            |
 312         .--->h1         |           h2<----.
 313         |     |         |            |     |
 314         |    ex1---.    |       .---ex2    |
 315         |    /     v    |       |     \    |
 316         '---l1   skip---'       |     l2---'
 317                    |            |
 318                    |            |
 319                    '--->join<---'
 320
 321
 322    The condition used is the exit condition of LOOP1, which effectively means
 323    that when the first loop exits (for whatever reason) but the real original
 324    exit expression is still false the second loop will be entered.
 325    The function returns the new edge cond->pre2.
 326
 327    This doesn't update the SSA form, see connect_loop_phis for that.  */
 328
 329 static edge
 330 connect_loops (class loop *loop1, class loop *loop2)
 331 {
 332   edge exit = single_exit (loop1);
 333   basic_block skip_bb = split_edge (exit);
 334   gcond *skip_stmt;
 335   gimple_stmt_iterator gsi;
 336   edge new_e, skip_e;
 337
 338   gimple *stmt = last_stmt (exit->src);
 339   skip_stmt = gimple_build_cond (gimple_cond_code (stmt),
 340                                  gimple_cond_lhs (stmt),
 341                                  gimple_cond_rhs (stmt),
 342                                  NULL_TREE, NULL_TREE);
 343   gsi = gsi_last_bb (skip_bb);
 344   gsi_insert_after (&gsi, skip_stmt, GSI_NEW_STMT);
 345
 346   skip_e = EDGE_SUCC (skip_bb, 0);
 347   skip_e->flags &= ~EDGE_FALLTHRU;
 348   new_e = make_edge (skip_bb, loop_preheader_edge (loop2)->src, 0);
 349   if (exit->flags & EDGE_TRUE_VALUE)
 350     {
 351       skip_e->flags |= EDGE_TRUE_VALUE;
 352       new_e->flags |= EDGE_FALSE_VALUE;
 353     }
 354   else
 355     {
 356       skip_e->flags |= EDGE_FALSE_VALUE;
 357       new_e->flags |= EDGE_TRUE_VALUE;
 358     }
 359
 360   new_e->probability = profile_probability::likely ();
 361   skip_e->probability = new_e->probability.invert ();
 362
 363   return new_e;
 364 }
 365
 366 /* This returns the new bound for iterations given the original iteration
 367    space in NITER, an arbitrary new bound BORDER, assumed to be some
 368    comparison value with a different IV, the initial value GUARD_INIT of
 369    that other IV, and the comparison code GUARD_CODE that compares
 370    that other IV with BORDER.  We return an SSA name, and place any
 371    necessary statements for that computation into *STMTS.
 372
 373    For example for such a loop:
 374
 375      for (i = beg, j = guard_init; i < end; i++, j++)
 376        if (j < border)  // this is supposed to be true/false
 377          ...
 378
 379    we want to return a new bound (on j) that makes the loop iterate
 380    as long as the condition j < border stays true.  We also don't want
 381    to iterate more often than the original loop, so we have to introduce
 382    some cut-off as well (via min/max), effectively resulting in:
 383
 384      newend = min (end+guard_init-beg, border)
 385      for (i = beg; j = guard_init; j < newend; i++, j++)
 386        if (j < c)
 387          ...
 388
 389    Depending on the direction of the IVs and if the exit tests
 390    are strict or non-strict we need to use MIN or MAX,
 391    and add or subtract 1.  This routine computes newend above.  */
 392
 393 static tree
 394 compute_new_first_bound (gimple_seq *stmts, class tree_niter_desc *niter,
 395                          tree border,
 396                          enum tree_code guard_code, tree guard_init)
 397 {
 398   /* The niter structure contains the after-increment IV, we need
 399      the loop-enter base, so subtract STEP once.  */
 400   tree controlbase = force_gimple_operand (niter->control.base,
 401                                            stmts, true, NULL_TREE);
 402   tree controlstep = niter->control.step;
 403   tree enddiff;
 404   if (POINTER_TYPE_P (TREE_TYPE (controlbase)))
 405     {
 406       controlstep = gimple_build (stmts, NEGATE_EXPR,
 407                                   TREE_TYPE (controlstep), controlstep);
 408       enddiff = gimple_build (stmts, POINTER_PLUS_EXPR,
 409                               TREE_TYPE (controlbase),
 410                               controlbase, controlstep);
 411     }
 412   else
 413     enddiff = gimple_build (stmts, MINUS_EXPR,
 414                             TREE_TYPE (controlbase),
 415                             controlbase, controlstep);
 416
 417   /* Compute end-beg.  */
 418   gimple_seq stmts2;
 419   tree end = force_gimple_operand (niter->bound, &stmts2,
 420                                         true, NULL_TREE);
 421   gimple_seq_add_seq_without_update (stmts, stmts2);
 422   if (POINTER_TYPE_P (TREE_TYPE (enddiff)))
 423     {
 424       tree tem = gimple_convert (stmts, sizetype, enddiff);
 425       tem = gimple_build (stmts, NEGATE_EXPR, sizetype, tem);
 426       enddiff = gimple_build (stmts, POINTER_PLUS_EXPR,
 427                               TREE_TYPE (enddiff),
 428                               end, tem);
 429     }
 430   else
 431     enddiff = gimple_build (stmts, MINUS_EXPR, TREE_TYPE (enddiff),
 432                             end, enddiff);
 433
 434   /* Compute guard_init + (end-beg).  */
 435   tree newbound;
 436   enddiff = gimple_convert (stmts, TREE_TYPE (guard_init), enddiff);
 437   if (POINTER_TYPE_P (TREE_TYPE (guard_init)))
 438     {
 439       enddiff = gimple_convert (stmts, sizetype, enddiff);
 440       newbound = gimple_build (stmts, POINTER_PLUS_EXPR,
 441                                TREE_TYPE (guard_init),
 442                                guard_init, enddiff);
 443     }
 444   else
 445     newbound = gimple_build (stmts, PLUS_EXPR, TREE_TYPE (guard_init),
 446                              guard_init, enddiff);
 447
 448   /* Depending on the direction of the IVs the new bound for the first
 449      loop is the minimum or maximum of old bound and border.
 450      Also, if the guard condition isn't strictly less or greater,
 451      we need to adjust the bound.  */
 452   int addbound = 0;
 453   enum tree_code minmax;
 454   if (niter->cmp == LT_EXPR)
 455     {
 456       /* GT and LE are the same, inverted.  */
 457       if (guard_code == GT_EXPR || guard_code == LE_EXPR)
 458         addbound = -1;
 459       minmax = MIN_EXPR;
 460     }
 461   else
 462     {
 463       gcc_assert (niter->cmp == GT_EXPR);
 464       if (guard_code == GE_EXPR || guard_code == LT_EXPR)
 465         addbound = 1;
 466       minmax = MAX_EXPR;
 467     }
 468
 469   if (addbound)
 470     {
 471       tree type2 = TREE_TYPE (newbound);
 472       if (POINTER_TYPE_P (type2))
 473         type2 = sizetype;
 474       newbound = gimple_build (stmts,
 475                                POINTER_TYPE_P (TREE_TYPE (newbound))
 476                                ? POINTER_PLUS_EXPR : PLUS_EXPR,
 477                                TREE_TYPE (newbound),
 478                                newbound,
 479                                build_int_cst (type2, addbound));
 480     }
 481
 482   tree newend = gimple_build (stmts, minmax, TREE_TYPE (border),
 483                               border, newbound);
 484   return newend;
 485 }
 486
 487 /* Fix the two loop's bb count after split based on the split edge probability,
 488    don't adjust the bbs dominated by true branches of that loop to avoid
 489    dropping 1s down.  */
 490 static void
 491 fix_loop_bb_probability (class loop *loop1, class loop *loop2, edge true_edge,
 492                          edge false_edge)
 493 {
 494   /* Proportion first loop's bb counts except those dominated by true
 495      branch to avoid drop 1s down.  */
 496   basic_block *bbs1, *bbs2;
 497   bbs1 = get_loop_body (loop1);
 498   unsigned j;
 499   for (j = 0; j < loop1->num_nodes; j++)
 500     if (bbs1[j] == loop1->latch
 501         || !dominated_by_p (CDI_DOMINATORS, bbs1[j], true_edge->dest))
 502       bbs1[j]->count
 503         = bbs1[j]->count.apply_probability (true_edge->probability);
 504   free (bbs1);
 505
 506   /* Proportion second loop's bb counts except those dominated by false
 507      branch to avoid drop 1s down.  */
 508   basic_block bbi_copy = get_bb_copy (false_edge->dest);
 509   bbs2 = get_loop_body (loop2);
 510   for (j = 0; j < loop2->num_nodes; j++)
 511     if (bbs2[j] == loop2->latch
 512         || !dominated_by_p (CDI_DOMINATORS, bbs2[j], bbi_copy))
 513       bbs2[j]->count
 514         = bbs2[j]->count.apply_probability (true_edge->probability.invert ());
 515   free (bbs2);
 516 }
 517
 518 /* Checks if LOOP contains an conditional block whose condition
 519    depends on which side in the iteration space it is, and if so
 520    splits the iteration space into two loops.  Returns true if the
 521    loop was split.  NITER must contain the iteration descriptor for the
 522    single exit of LOOP.  */
 523
 524 static bool
 525 split_loop (class loop *loop1)
 526 {
 527   class tree_niter_desc niter;
 528   basic_block *bbs;
 529   unsigned i;
 530   bool changed = false;
 531   tree guard_iv;
 532   tree border = NULL_TREE;
 533   affine_iv iv;
 534   edge exit1;
 535
 536   if (!(exit1 = single_exit (loop1))
 537       || EDGE_COUNT (exit1->src->succs) != 2
 538       /* ??? We could handle non-empty latches when we split the latch edge
 539          (not the exit edge), and put the new exit condition in the new block.
 540          OTOH this executes some code unconditionally that might have been
 541          skipped by the original exit before.  */
 542       || !empty_block_p (loop1->latch)
 543       || !easy_exit_values (loop1)
 544       || !number_of_iterations_exit (loop1, exit1, &niter, false, true)
 545       || niter.cmp == ERROR_MARK
 546       /* We can't yet handle loops controlled by a != predicate.  */
 547       || niter.cmp == NE_EXPR)
 548     return false;
 549
 550   bbs = get_loop_body (loop1);
 551
 552   if (!can_copy_bbs_p (bbs, loop1->num_nodes))
 553     {
 554       free (bbs);
 555       return false;
 556     }
 557
 558   /* Find a splitting opportunity.  */
 559   for (i = 0; i < loop1->num_nodes; i++)
 560     if ((guard_iv = split_at_bb_p (loop1, bbs[i], &border, &iv)))
 561       {
 562         /* Handling opposite steps is not implemented yet.  Neither
 563            is handling different step sizes.  */
 564         if ((tree_int_cst_sign_bit (iv.step)
 565              != tree_int_cst_sign_bit (niter.control.step))
 566             || !tree_int_cst_equal (iv.step, niter.control.step))
 567           continue;
 568
 569         /* Find a loop PHI node that defines guard_iv directly,
 570            or create one doing that.  */
 571         gphi *phi = find_or_create_guard_phi (loop1, guard_iv, &iv);
 572         if (!phi)
 573           continue;
 574         gcond *guard_stmt = as_a<gcond *> (last_stmt (bbs[i]));
 575         tree guard_init = PHI_ARG_DEF_FROM_EDGE (phi,
 576                                                  loop_preheader_edge (loop1));
 577         enum tree_code guard_code = gimple_cond_code (guard_stmt);
 578
 579         /* Loop splitting is implemented by versioning the loop, placing
 580            the new loop after the old loop, make the first loop iterate
 581            as long as the conditional stays true (or false) and let the
 582            second (new) loop handle the rest of the iterations.
 583
 584            First we need to determine if the condition will start being true
 585            or false in the first loop.  */
 586         bool initial_true;
 587         switch (guard_code)
 588           {
 589             case LT_EXPR:
 590             case LE_EXPR:
 591               initial_true = !tree_int_cst_sign_bit (iv.step);
 592               break;
 593             case GT_EXPR:
 594             case GE_EXPR:
 595               initial_true = tree_int_cst_sign_bit (iv.step);
 596               break;
 597             default:
 598               gcc_unreachable ();
 599           }
 600
 601         /* Build a condition that will skip the first loop when the
 602            guard condition won't ever be true (or false).  */
 603         gimple_seq stmts2;
 604         border = force_gimple_operand (border, &stmts2, true, NULL_TREE);
 605         if (stmts2)
 606           gsi_insert_seq_on_edge_immediate (loop_preheader_edge (loop1),
 607                                             stmts2);
 608         tree cond = build2 (guard_code, boolean_type_node, guard_init, border);
 609         if (!initial_true)
 610           cond = fold_build1 (TRUTH_NOT_EXPR, boolean_type_node, cond);
 611
 612         edge true_edge, false_edge;
 613         extract_true_false_edges_from_block (bbs[i], &true_edge, &false_edge);
 614
 615         /* Now version the loop, placing loop2 after loop1 connecting
 616            them, and fix up SSA form for that.  */
 617         initialize_original_copy_tables ();
 618         basic_block cond_bb;
 619
 620         class loop *loop2 = loop_version (loop1, cond, &cond_bb,
 621                                           true_edge->probability,
 622                                           true_edge->probability.invert (),
 623                                           profile_probability::always (),
 624                                           profile_probability::always (),
 625                                           true);
 626         gcc_assert (loop2);
 627
 628         edge new_e = connect_loops (loop1, loop2);
 629         connect_loop_phis (loop1, loop2, new_e);
 630
 631         /* The iterations of the second loop is now already
 632            exactly those that the first loop didn't do, but the
 633            iteration space of the first loop is still the original one.
 634            Compute the new bound for the guarding IV and patch the
 635            loop exit to use it instead of original IV and bound.  */
 636         gimple_seq stmts = NULL;
 637         tree newend = compute_new_first_bound (&stmts, &niter, border,
 638                                                guard_code, guard_init);
 639         if (stmts)
 640           gsi_insert_seq_on_edge_immediate (loop_preheader_edge (loop1),
 641                                             stmts);
 642         tree guard_next = PHI_ARG_DEF_FROM_EDGE (phi, loop_latch_edge (loop1));
 643         patch_loop_exit (loop1, guard_stmt, guard_next, newend, initial_true);
 644
 645         fix_loop_bb_probability (loop1, loop2, true_edge, false_edge);
 646
 647         /* Fix first loop's exit probability after scaling.  */
 648         edge exit_to_latch1;
 649         if (EDGE_SUCC (exit1->src, 0) == exit1)
 650           exit_to_latch1 = EDGE_SUCC (exit1->src, 1);
 651         else
 652           exit_to_latch1 = EDGE_SUCC (exit1->src, 0);
 653         exit_to_latch1->probability *= true_edge->probability;
 654         exit1->probability = exit_to_latch1->probability.invert ();
 655
 656         /* Finally patch out the two copies of the condition to be always
 657            true/false (or opposite).  */
 658         gcond *force_true = as_a<gcond *> (last_stmt (bbs[i]));
 659         gcond *force_false = as_a<gcond *> (last_stmt (get_bb_copy (bbs[i])));
 660         if (!initial_true)
 661           std::swap (force_true, force_false);
 662         gimple_cond_make_true (force_true);
 663         gimple_cond_make_false (force_false);
 664         update_stmt (force_true);
 665         update_stmt (force_false);
 666
 667         free_original_copy_tables ();
 668
 669         changed = true;
 670         if (dump_file && (dump_flags & TDF_DETAILS))
 671           fprintf (dump_file, ";; Loop split.\n");
 672
 673         if (dump_enabled_p ())
 674           dump_printf_loc (MSG_OPTIMIZED_LOCATIONS, guard_stmt, "loop split\n");
 675
 676         /* Only deal with the first opportunity.  */
 677         break;
 678       }
 679
 680   free (bbs);
 681   return changed;
 682 }
 683
 684 /* Another transformation of loops like:
 685
 686    for (i = INIT (); CHECK (i); i = NEXT ())
 687      {
 688        if (expr (a_1, a_2, ..., a_n))  // expr is pure
 689          a_j = ...;  // change at least one a_j
 690        else
 691          S;          // not change any a_j
 692      }
 693
 694    into:
 695
 696    for (i = INIT (); CHECK (i); i = NEXT ())
 697      {
 698        if (expr (a_1, a_2, ..., a_n))
 699          a_j = ...;
 700        else
 701          {
 702            S;
 703            i = NEXT ();
 704            break;
 705          }
 706      }
 707
 708    for (; CHECK (i); i = NEXT ())
 709      {
 710        S;
 711      }
 712
 713    */
 714
 715 /* Data structure to hold temporary information during loop split upon
 716    semi-invariant conditional statement.  */
 717 class split_info {
 718 public:
 719   /* Array of all basic blocks in a loop, returned by get_loop_body().  */
 720   basic_block *bbs;
 721
 722   /* All memory store/clobber statements in a loop.  */
 723   auto_vec<gimple *> memory_stores;
 724
 725   /* Whether above memory stores vector has been filled.  */
 726   int need_init;
 727
 728   /* Control dependencies of basic blocks in a loop.  */
 729   auto_vec<hash_set<basic_block> *> control_deps;
 730
 731   split_info () : bbs (NULL),  need_init (true) { }
 732
 733   ~split_info ()
 734     {
 735       if (bbs)
 736         free (bbs);
 737
 738       for (unsigned i = 0; i < control_deps.length (); i++)
 739         delete control_deps[i];
 740     }
 741 };
 742
 743 /* Find all statements with memory-write effect in LOOP, including memory
 744    store and non-pure function call, and keep those in a vector.  This work
 745    is only done one time, for the vector should be constant during analysis
 746    stage of semi-invariant condition.  */
 747
 748 static void
 749 find_vdef_in_loop (struct loop *loop)
 750 {
 751   split_info *info = (split_info *) loop->aux;
 752   gphi *vphi = get_virtual_phi (loop->header);
 753
 754   /* Indicate memory store vector has been filled.  */
 755   info->need_init = false;
 756
 757   /* If loop contains memory operation, there must be a virtual PHI node in
 758      loop header basic block.  */
 759   if (vphi == NULL)
 760     return;
 761
 762   /* All virtual SSA names inside the loop are connected to be a cyclic
 763      graph via virtual PHI nodes.  The virtual PHI node in loop header just
 764      links the first and the last virtual SSA names, by using the last as
 765      PHI operand to define the first.  */
 766   const edge latch = loop_latch_edge (loop);
 767   const tree first = gimple_phi_result (vphi);
 768   const tree last = PHI_ARG_DEF_FROM_EDGE (vphi, latch);
 769
 770   /* The virtual SSA cyclic graph might consist of only one SSA name, who
 771      is defined by itself.
 772
 773        .MEM_1 = PHI <.MEM_2(loop entry edge), .MEM_1(latch edge)>
 774
 775      This means the loop contains only memory loads, so we can skip it.  */
 776   if (first == last)
 777     return;
 778
 779   auto_vec<gimple *> other_stores;
 780   auto_vec<tree> worklist;
 781   auto_bitmap visited;
 782
 783   bitmap_set_bit (visited, SSA_NAME_VERSION (first));
 784   bitmap_set_bit (visited, SSA_NAME_VERSION (last));
 785   worklist.safe_push (last);
 786
 787   do
 788     {
 789       tree vuse = worklist.pop ();
 790       gimple *stmt = SSA_NAME_DEF_STMT (vuse);
 791
 792       /* We mark the first and last SSA names as visited at the beginning,
 793          and reversely start the process from the last SSA name towards the
 794          first, which ensures that this do-while will not touch SSA names
 795          defined outside the loop.  */
 796       gcc_assert (gimple_bb (stmt)
 797                   && flow_bb_inside_loop_p (loop, gimple_bb (stmt)));
 798
 799       if (gimple_code (stmt) == GIMPLE_PHI)
 800         {
 801           gphi *phi = as_a <gphi *> (stmt);
 802
 803           for (unsigned i = 0; i < gimple_phi_num_args (phi); ++i)
 804             {
 805               tree arg = gimple_phi_arg_def (stmt, i);
 806
 807               if (bitmap_set_bit (visited, SSA_NAME_VERSION (arg)))
 808                 worklist.safe_push (arg);
 809             }
 810         }
 811       else
 812         {
 813           tree prev = gimple_vuse (stmt);
 814
 815           /* Non-pure call statement is conservatively assumed to impact all
 816              memory locations.  So place call statements ahead of other memory
 817              stores in the vector with an idea of using them as shortcut
 818              terminators to memory alias analysis.  */
 819           if (gimple_code (stmt) == GIMPLE_CALL)
 820             info->memory_stores.safe_push (stmt);
 821           else
 822             other_stores.safe_push (stmt);
 823
 824           if (bitmap_set_bit (visited, SSA_NAME_VERSION (prev)))
 825             worklist.safe_push (prev);
 826         }
 827     } while (!worklist.is_empty ());
 828
 829     info->memory_stores.safe_splice (other_stores);
 830 }
 831
 832 /* Two basic blocks have equivalent control dependency if one dominates to
 833    the other, and it is post-dominated by the latter.  Given a basic block
 834    BB in LOOP, find farest equivalent dominating basic block.  For BB, there
 835    is a constraint that BB does not post-dominate loop header of LOOP, this
 836    means BB is control-dependent on at least one basic block in LOOP.  */
 837
 838 static basic_block
 839 get_control_equiv_head_block (struct loop *loop, basic_block bb)
 840 {
 841   while (!bb->aux)
 842     {
 843       basic_block dom_bb = get_immediate_dominator (CDI_DOMINATORS, bb);
 844
 845       gcc_checking_assert (dom_bb && flow_bb_inside_loop_p (loop, dom_bb));
 846
 847       if (!dominated_by_p (CDI_POST_DOMINATORS, dom_bb, bb))
 848         break;
 849
 850       bb = dom_bb;
 851     }
 852   return bb;
 853 }
 854
 855 /* Given a BB in LOOP, find out all basic blocks in LOOP that BB is control-
 856    dependent on.  */
 857
 858 static hash_set<basic_block> *
 859 find_control_dep_blocks (struct loop *loop, basic_block bb)
 860 {
 861   /* BB has same control dependency as loop header, then it is not control-
 862      dependent on any basic block in LOOP.  */
 863   if (dominated_by_p (CDI_POST_DOMINATORS, loop->header, bb))
 864     return NULL;
 865
 866   basic_block equiv_head = get_control_equiv_head_block (loop, bb);
 867
 868   if (equiv_head->aux)
 869     {
 870       /* There is a basic block containing control dependency equivalent
 871          to BB.  No need to recompute that, and also set this information
 872          to other equivalent basic blocks.  */
 873       for (; bb != equiv_head;
 874            bb = get_immediate_dominator (CDI_DOMINATORS, bb))
 875         bb->aux = equiv_head->aux;
 876       return (hash_set<basic_block> *) equiv_head->aux;
 877     }
 878
 879   /* A basic block X is control-dependent on another Y iff there exists
 880      a path from X to Y, in which every basic block other than X and Y
 881      is post-dominated by Y, but X is not post-dominated by Y.
 882
 883      According to this rule, traverse basic blocks in the loop backwards
 884      starting from BB, if a basic block is post-dominated by BB, extend
 885      current post-dominating path to this block, otherwise it is another
 886      one that BB is control-dependent on.  */
 887
 888   auto_vec<basic_block> pdom_worklist;
 889   hash_set<basic_block> pdom_visited;
 890   hash_set<basic_block> *dep_bbs = new hash_set<basic_block>;
 891
 892   pdom_worklist.safe_push (equiv_head);
 893
 894   do
 895     {
 896       basic_block pdom_bb = pdom_worklist.pop ();
 897       edge_iterator ei;
 898       edge e;
 899
 900       if (pdom_visited.add (pdom_bb))
 901         continue;
 902
 903       FOR_EACH_EDGE (e, ei, pdom_bb->preds)
 904         {
 905           basic_block pred_bb = e->src;
 906
 907           if (!dominated_by_p (CDI_POST_DOMINATORS, pred_bb, bb))
 908             {
 909               dep_bbs->add (pred_bb);
 910               continue;
 911             }
 912
 913           pred_bb = get_control_equiv_head_block (loop, pred_bb);
 914
 915           if (pdom_visited.contains (pred_bb))
 916             continue;
 917
 918           if (!pred_bb->aux)
 919             {
 920               pdom_worklist.safe_push (pred_bb);
 921               continue;
 922             }
 923
 924           /* If control dependency of basic block is available, fast extend
 925              post-dominating path using the information instead of advancing
 926              forward step-by-step.  */
 927           hash_set<basic_block> *pred_dep_bbs
 928                         = (hash_set<basic_block> *) pred_bb->aux;
 929
 930           for (hash_set<basic_block>::iterator iter = pred_dep_bbs->begin ();
 931                iter != pred_dep_bbs->end (); ++iter)
 932             {
 933               basic_block pred_dep_bb = *iter;
 934
 935               /* Basic blocks can either be in control dependency of BB, or
 936                  must be post-dominated by BB, if so, extend the path from
 937                  these basic blocks.  */
 938               if (!dominated_by_p (CDI_POST_DOMINATORS, pred_dep_bb, bb))
 939                 dep_bbs->add (pred_dep_bb);
 940               else if (!pdom_visited.contains (pred_dep_bb))
 941                 pdom_worklist.safe_push (pred_dep_bb);
 942             }
 943         }
 944     } while (!pdom_worklist.is_empty ());
 945
 946   /* Record computed control dependencies in loop so that we can reach them
 947      when reclaiming resources.  */
 948   ((split_info *) loop->aux)->control_deps.safe_push (dep_bbs);
 949
 950   /* Associate control dependence with related equivalent basic blocks.  */
 951   for (equiv_head->aux = dep_bbs; bb != equiv_head;
 952        bb = get_immediate_dominator (CDI_DOMINATORS, bb))
 953     bb->aux = dep_bbs;
 954
 955   return dep_bbs;
 956 }
 957
 958 /* Forward declaration */
 959
 960 static bool
 961 stmt_semi_invariant_p_1 (struct loop *loop, gimple *stmt,
 962                          const_basic_block skip_head,
 963                          hash_map<gimple *, bool> &stmt_stat);
 964
 965 /* Given STMT, memory load or pure call statement, check whether it is impacted
 966    by some memory store in LOOP, excluding trace starting from SKIP_HEAD (the
 967    trace is composed of SKIP_HEAD and those basic block dominated by it, always
 968    corresponds to one branch of a conditional statement).  If SKIP_HEAD is
 969    NULL, all basic blocks of LOOP are checked.  */
 970
 971 static bool
 972 vuse_semi_invariant_p (struct loop *loop, gimple *stmt,
 973                        const_basic_block skip_head)
 974 {
 975   split_info *info = (split_info *) loop->aux;
 976   tree rhs = NULL_TREE;
 977   ao_ref ref;
 978   gimple *store;
 979   unsigned i;
 980
 981   /* Collect memory store/clobber statements if haven't done that.  */
 982   if (info->need_init)
 983     find_vdef_in_loop (loop);
 984
 985   if (is_gimple_assign (stmt))
 986     rhs = gimple_assign_rhs1 (stmt);
 987
 988   ao_ref_init (&ref, rhs);
 989
 990   FOR_EACH_VEC_ELT (info->memory_stores, i, store)
 991     {
 992       /* Skip basic blocks dominated by SKIP_HEAD, if non-NULL.  */
 993       if (skip_head
 994           && dominated_by_p (CDI_DOMINATORS, gimple_bb (store), skip_head))
 995         continue;
 996
 997       if (!ref.ref || stmt_may_clobber_ref_p_1 (store, &ref))
 998         return false;
 999     }
1000
1001   return true;
1002 }
1003
1004 /* Suppose one condition branch, led by SKIP_HEAD, is not executed since
1005    certain iteration of LOOP, check whether an SSA name (NAME) remains
1006    unchanged in next iteration.  We call this characteristic semi-
1007    invariantness.  SKIP_HEAD might be NULL, if so, nothing excluded, all basic
1008    blocks and control flows in the loop will be considered.  Semi-invariant
1009    state of checked statement is cached in hash map STMT_STAT to avoid
1010    redundant computation in possible following re-check.  */
1011
1012 static inline bool
1013 ssa_semi_invariant_p (struct loop *loop, tree name,
1014                       const_basic_block skip_head,
1015                       hash_map<gimple *, bool> &stmt_stat)
1016 {
1017   gimple *def = SSA_NAME_DEF_STMT (name);
1018   const_basic_block def_bb = gimple_bb (def);
1019
1020   /* An SSA name defined outside loop is definitely semi-invariant.  */
1021   if (!def_bb || !flow_bb_inside_loop_p (loop, def_bb))
1022     return true;
1023
1024   if (SSA_NAME_OCCURS_IN_ABNORMAL_PHI (name))
1025     return false;
1026
1027   return stmt_semi_invariant_p_1 (loop, def, skip_head, stmt_stat);
1028 }
1029
1030 /* Check whether a loop iteration PHI node (LOOP_PHI) defines a value that is
1031    semi-invariant in LOOP.  Basic blocks dominated by SKIP_HEAD (if non-NULL),
1032    are excluded from LOOP.  */
1033
1034 static bool
1035 loop_iter_phi_semi_invariant_p (struct loop *loop, gphi *loop_phi,
1036                                 const_basic_block skip_head)
1037 {
1038   const_edge latch = loop_latch_edge (loop);
1039   tree name = gimple_phi_result (loop_phi);
1040   tree from = PHI_ARG_DEF_FROM_EDGE (loop_phi, latch);
1041
1042   gcc_checking_assert (from);
1043
1044   /* Loop iteration PHI node locates in loop header, and it has two source
1045      operands, one is an initial value coming from outside the loop, the other
1046      is a value through latch of the loop, which is derived in last iteration,
1047      we call the latter latch value.  From the PHI node to definition of latch
1048      value, if excluding branch trace starting from SKIP_HEAD, except copy-
1049      assignment or likewise, there is no other kind of value redefinition, SSA
1050      name defined by the PHI node is semi-invariant.
1051
1052                          loop entry
1053                               |     .--- latch ---.
1054                               |     |             |
1055                               v     v             |
1056                   x_1 = PHI <x_0,  x_3>           |
1057                            |                      |
1058                            v                      |
1059               .------- if (cond) -------.         |
1060               |                         |         |
1061               |                     [ SKIP ]      |
1062               |                         |         |
1063               |                     x_2 = ...     |
1064               |                         |         |
1065               '---- T ---->.<---- F ----'         |
1066                            |                      |
1067                            v                      |
1068                   x_3 = PHI <x_1, x_2>            |
1069                            |                      |
1070                            '----------------------'
1071
1072      Suppose in certain iteration, execution flow in above graph goes through
1073      true branch, which means that one source value to define x_3 in false
1074      branch (x_2) is skipped, x_3 only comes from x_1, and x_1 in next
1075      iterations is defined by x_3, we know that x_1 will never changed if COND
1076      always chooses true branch from then on.  */
1077
1078   while (from != name)
1079     {
1080       /* A new value comes from a CONSTANT.  */
1081       if (TREE_CODE (from) != SSA_NAME)
1082         return false;
1083
1084       gimple *stmt = SSA_NAME_DEF_STMT (from);
1085       const_basic_block bb = gimple_bb (stmt);
1086
1087       /* A new value comes from outside the loop.  */
1088       if (!bb || !flow_bb_inside_loop_p (loop, bb))
1089         return false;
1090
1091       from = NULL_TREE;
1092
1093       if (gimple_code (stmt) == GIMPLE_PHI)
1094         {
1095           gphi *phi = as_a <gphi *> (stmt);
1096
1097           for (unsigned i = 0; i < gimple_phi_num_args (phi); ++i)
1098             {
1099               if (skip_head)
1100                 {
1101                   const_edge e = gimple_phi_arg_edge (phi, i);
1102
1103                   /* Don't consider redefinitions in excluded basic blocks.  */
1104                   if (dominated_by_p (CDI_DOMINATORS, e->src, skip_head))
1105                     continue;
1106                 }
1107
1108               tree arg = gimple_phi_arg_def (phi, i);
1109
1110               if (!from)
1111                 from = arg;
1112               else if (!operand_equal_p (from, arg, 0))
1113                 /* There are more than one source operands that provide
1114                    different values to the SSA name, it is variant.  */
1115                 return false;
1116             }
1117         }
1118       else if (gimple_code (stmt) == GIMPLE_ASSIGN)
1119         {
1120           /* For simple value copy, check its rhs instead.  */
1121           if (gimple_assign_ssa_name_copy_p (stmt))
1122             from = gimple_assign_rhs1 (stmt);
1123         }
1124
1125       /* Any other kind of definition is deemed to introduce a new value
1126          to the SSA name.  */
1127       if (!from)
1128         return false;
1129     }
1130   return true;
1131 }
1132
1133 /* Check whether conditional predicates that BB is control-dependent on, are
1134    semi-invariant in LOOP.  Basic blocks dominated by SKIP_HEAD (if non-NULL),
1135    are excluded from LOOP.  Semi-invariant state of checked statement is cached
1136    in hash map STMT_STAT.  */
1137
1138 static bool
1139 control_dep_semi_invariant_p (struct loop *loop, basic_block bb,
1140                               const_basic_block skip_head,
1141                               hash_map<gimple *, bool> &stmt_stat)
1142 {
1143   hash_set<basic_block> *dep_bbs = find_control_dep_blocks (loop, bb);
1144
1145   if (!dep_bbs)
1146     return true;
1147
1148   for (hash_set<basic_block>::iterator iter = dep_bbs->begin ();
1149        iter != dep_bbs->end (); ++iter)
1150     {
1151       gimple *last = last_stmt (*iter);
1152
1153       if (!last)
1154         return false;
1155
1156       /* Only check condition predicates.  */
1157       if (gimple_code (last) != GIMPLE_COND
1158           && gimple_code (last) != GIMPLE_SWITCH)
1159         return false;
1160
1161       if (!stmt_semi_invariant_p_1 (loop, last, skip_head, stmt_stat))
1162         return false;
1163     }
1164
1165   return true;
1166 }
1167
1168 /* Check whether STMT is semi-invariant in LOOP, iff all its operands are
1169    semi-invariant, consequently, all its defined values are semi-invariant.
1170    Basic blocks dominated by SKIP_HEAD (if non-NULL), are excluded from LOOP.
1171    Semi-invariant state of checked statement is cached in hash map
1172    STMT_STAT.  */
1173
1174 static bool
1175 stmt_semi_invariant_p_1 (struct loop *loop, gimple *stmt,
1176                          const_basic_block skip_head,
1177                          hash_map<gimple *, bool> &stmt_stat)
1178 {
1179   bool existed;
1180   bool &invar = stmt_stat.get_or_insert (stmt, &existed);
1181
1182   if (existed)
1183     return invar;
1184
1185   /* A statement might depend on itself, which is treated as variant.  So set
1186      state of statement under check to be variant to ensure that.  */
1187   invar = false;
1188
1189   if (gimple_code (stmt) == GIMPLE_PHI)
1190     {
1191       gphi *phi = as_a <gphi *> (stmt);
1192
1193       if (gimple_bb (stmt) == loop->header)
1194         {
1195           /* If the entry value is subject to abnormal coalescing
1196              avoid the transform since we're going to duplicate the
1197              loop header and thus likely introduce overlapping life-ranges
1198              between the PHI def and the entry on the path when the
1199              first loop is skipped.  */
1200           tree entry_def
1201             = PHI_ARG_DEF_FROM_EDGE (phi, loop_preheader_edge (loop));
1202           if (TREE_CODE (entry_def) == SSA_NAME
1203               && SSA_NAME_OCCURS_IN_ABNORMAL_PHI (entry_def))
1204             return false;
1205           invar = loop_iter_phi_semi_invariant_p (loop, phi, skip_head);
1206           return invar;
1207         }
1208
1209       /* For a loop PHI node that does not locate in loop header, it is semi-
1210          invariant only if two conditions are met.  The first is its source
1211          values are derived from CONSTANT (including loop-invariant value), or
1212          from SSA name defined by semi-invariant loop iteration PHI node.  The
1213          second is its source incoming edges are control-dependent on semi-
1214          invariant conditional predicates.  */
1215       for (unsigned i = 0; i < gimple_phi_num_args (phi); ++i)
1216         {
1217           const_edge e = gimple_phi_arg_edge (phi, i);
1218           tree arg = gimple_phi_arg_def (phi, i);
1219
1220           if (TREE_CODE (arg) == SSA_NAME)
1221             {
1222               if (!ssa_semi_invariant_p (loop, arg, skip_head, stmt_stat))
1223                 return false;
1224
1225               /* If source value is defined in location from where the source
1226                  edge comes in, no need to check control dependency again
1227                  since this has been done in above SSA name check stage.  */
1228               if (e->src == gimple_bb (SSA_NAME_DEF_STMT (arg)))
1229                 continue;
1230             }
1231
1232           if (!control_dep_semi_invariant_p (loop, e->src, skip_head,
1233                                              stmt_stat))
1234             return false;
1235         }
1236     }
1237   else
1238     {
1239       ssa_op_iter iter;
1240       tree use;
1241
1242       /* Volatile memory load or return of normal (non-const/non-pure) call
1243          should not be treated as constant in each iteration of loop.  */
1244       if (gimple_has_side_effects (stmt))
1245         return false;
1246
1247       /* Check if any memory store may kill memory load at this place.  */
1248       if (gimple_vuse (stmt) && !vuse_semi_invariant_p (loop, stmt, skip_head))
1249         return false;
1250
1251       /* Although operand of a statement might be SSA name, CONSTANT or
1252          VARDECL, here we only need to check SSA name operands.  This is
1253          because check on VARDECL operands, which involve memory loads,
1254          must have been done prior to invocation of this function in
1255          vuse_semi_invariant_p.  */
1256       FOR_EACH_SSA_TREE_OPERAND (use, stmt, iter, SSA_OP_USE)
1257         if (!ssa_semi_invariant_p (loop, use, skip_head, stmt_stat))
1258           return false;
1259     }
1260
1261   if (!control_dep_semi_invariant_p (loop, gimple_bb (stmt), skip_head,
1262                                      stmt_stat))
1263     return false;
1264
1265   /* Here we SHOULD NOT use invar = true, since hash map might be changed due
1266      to new insertion, and thus invar may point to invalid memory.  */
1267   stmt_stat.put (stmt, true);
1268   return true;
1269 }
1270
1271 /* A helper function to check whether STMT is semi-invariant in LOOP.  Basic
1272    blocks dominated by SKIP_HEAD (if non-NULL), are excluded from LOOP.  */
1273
1274 static bool
1275 stmt_semi_invariant_p (struct loop *loop, gimple *stmt,
1276                        const_basic_block skip_head)
1277 {
1278   hash_map<gimple *, bool> stmt_stat;
1279   return stmt_semi_invariant_p_1 (loop, stmt, skip_head, stmt_stat);
1280 }
1281
1282 /* Determine when conditional statement never transfers execution to one of its
1283    branch, whether we can remove the branch's leading basic block (BRANCH_BB)
1284    and those basic blocks dominated by BRANCH_BB.  */
1285
1286 static bool
1287 branch_removable_p (basic_block branch_bb)
1288 {
1289   edge_iterator ei;
1290   edge e;
1291
1292   if (single_pred_p (branch_bb))
1293     return true;
1294
1295   FOR_EACH_EDGE (e, ei, branch_bb->preds)
1296     {
1297       if (dominated_by_p (CDI_DOMINATORS, e->src, branch_bb))
1298         continue;
1299
1300       if (dominated_by_p (CDI_DOMINATORS, branch_bb, e->src))
1301         continue;
1302
1303        /* The branch can be reached from opposite branch, or from some
1304           statement not dominated by the conditional statement.  */
1305       return false;
1306     }
1307
1308   return true;
1309 }
1310
1311 /* Find out which branch of a conditional statement (COND) is invariant in the
1312    execution context of LOOP.  That is: once the branch is selected in certain
1313    iteration of the loop, any operand that contributes to computation of the
1314    conditional statement remains unchanged in all following iterations.  */
1315
1316 static edge
1317 get_cond_invariant_branch (struct loop *loop, gcond *cond)
1318 {
1319   basic_block cond_bb = gimple_bb (cond);
1320   basic_block targ_bb[2];
1321   bool invar[2];
1322   unsigned invar_checks = 0;
1323
1324   for (unsigned i = 0; i < 2; i++)
1325     {
1326       targ_bb[i] = EDGE_SUCC (cond_bb, i)->dest;
1327
1328       /* One branch directs to loop exit, no need to perform loop split upon
1329          this conditional statement.  Firstly, it is trivial if the exit branch
1330          is semi-invariant, for the statement is just to break loop.  Secondly,
1331          if the opposite branch is semi-invariant, it means that the statement
1332          is real loop-invariant, which is covered by loop unswitch.  */
1333       if (!flow_bb_inside_loop_p (loop, targ_bb[i]))
1334         return NULL;
1335     }
1336
1337   for (unsigned i = 0; i < 2; i++)
1338     {
1339       invar[!i] = false;
1340
1341       if (!branch_removable_p (targ_bb[i]))
1342         continue;
1343
1344       /* Given a semi-invariant branch, if its opposite branch dominates
1345          loop latch, it and its following trace will only be executed in
1346          final iteration of loop, namely it is not part of repeated body
1347          of the loop.  Similar to the above case that the branch is loop
1348          exit, no need to split loop.  */
1349       if (dominated_by_p (CDI_DOMINATORS, loop->latch, targ_bb[i]))
1350         continue;
1351
1352       invar[!i] = stmt_semi_invariant_p (loop, cond, targ_bb[i]);
1353       invar_checks++;
1354     }
1355
1356   /* With both branches being invariant (handled by loop unswitch) or
1357      variant is not what we want.  */
1358   if (invar[0] ^ !invar[1])
1359     return NULL;
1360
1361   /* Found a real loop-invariant condition, do nothing.  */
1362   if (invar_checks < 2 && stmt_semi_invariant_p (loop, cond, NULL))
1363     return NULL;
1364
1365   return EDGE_SUCC (cond_bb, invar[0] ? 0 : 1);
1366 }
1367
1368 /* Calculate increased code size measured by estimated insn number if applying
1369    loop split upon certain branch (BRANCH_EDGE) of a conditional statement.  */
1370
1371 static int
1372 compute_added_num_insns (struct loop *loop, const_edge branch_edge)
1373 {
1374   basic_block cond_bb = branch_edge->src;
1375   unsigned branch = EDGE_SUCC (cond_bb, 1) == branch_edge;
1376   basic_block opposite_bb = EDGE_SUCC (cond_bb, !branch)->dest;
1377   basic_block *bbs = ((split_info *) loop->aux)->bbs;
1378   int num = 0;
1379
1380   for (unsigned i = 0; i < loop->num_nodes; i++)
1381     {
1382       /* Do no count basic blocks only in opposite branch.  */
1383       if (dominated_by_p (CDI_DOMINATORS, bbs[i], opposite_bb))
1384         continue;
1385
1386       num += estimate_num_insns_seq (bb_seq (bbs[i]), &eni_size_weights);
1387     }
1388
1389   /* It is unnecessary to evaluate expression of the conditional statement
1390      in new loop that contains only invariant branch.  This expression should
1391      be constant value (either true or false).  Exclude code size of insns
1392      that contribute to computation of the expression.  */
1393
1394   auto_vec<gimple *> worklist;
1395   hash_set<gimple *> removed;
1396   gimple *stmt = last_stmt (cond_bb);
1397
1398   worklist.safe_push (stmt);
1399   removed.add (stmt);
1400   num -= estimate_num_insns (stmt, &eni_size_weights);
1401
1402   do
1403     {
1404       ssa_op_iter opnd_iter;
1405       use_operand_p opnd_p;
1406
1407       stmt = worklist.pop ();
1408       FOR_EACH_PHI_OR_STMT_USE (opnd_p, stmt, opnd_iter, SSA_OP_USE)
1409         {
1410           tree opnd = USE_FROM_PTR (opnd_p);
1411
1412           if (TREE_CODE (opnd) != SSA_NAME || SSA_NAME_IS_DEFAULT_DEF (opnd))
1413             continue;
1414
1415           gimple *opnd_stmt = SSA_NAME_DEF_STMT (opnd);
1416           use_operand_p use_p;
1417           imm_use_iterator use_iter;
1418
1419           if (removed.contains (opnd_stmt)
1420               || !flow_bb_inside_loop_p (loop, gimple_bb (opnd_stmt)))
1421             continue;
1422
1423           FOR_EACH_IMM_USE_FAST (use_p, use_iter, opnd)
1424             {
1425               gimple *use_stmt = USE_STMT (use_p);
1426
1427               if (!is_gimple_debug (use_stmt) && !removed.contains (use_stmt))
1428                 {
1429                   opnd_stmt = NULL;
1430                   break;
1431                 }
1432             }
1433
1434           if (opnd_stmt)
1435             {
1436               worklist.safe_push (opnd_stmt);
1437               removed.add (opnd_stmt);
1438               num -= estimate_num_insns (opnd_stmt, &eni_size_weights);
1439             }
1440         }
1441     } while (!worklist.is_empty ());
1442
1443   gcc_assert (num >= 0);
1444   return num;
1445 }
1446
1447 /* Find out loop-invariant branch of a conditional statement (COND) if it has,
1448    and check whether it is eligible and profitable to perform loop split upon
1449    this branch in LOOP.  */
1450
1451 static edge
1452 get_cond_branch_to_split_loop (struct loop *loop, gcond *cond)
1453 {
1454   edge invar_branch = get_cond_invariant_branch (loop, cond);
1455   if (!invar_branch)
1456     return NULL;
1457
1458   /* When accurate profile information is available, and execution
1459      frequency of the branch is too low, just let it go.  */
1460   profile_probability prob = invar_branch->probability;
1461   if (prob.reliable_p ())
1462     {
1463       int thres = param_min_loop_cond_split_prob;
1464
1465       if (prob < profile_probability::always ().apply_scale (thres, 100))
1466         return NULL;
1467     }
1468
1469   /* Add a threshold for increased code size to disable loop split.  */
1470   if (compute_added_num_insns (loop, invar_branch) > param_max_peeled_insns)
1471     return NULL;
1472
1473   return invar_branch;
1474 }
1475
1476 /* Given a loop (LOOP1) with a loop-invariant branch (INVAR_BRANCH) of some
1477    conditional statement, perform loop split transformation illustrated
1478    as the following graph.
1479
1480                .-------T------ if (true) ------F------.
1481                |                    .---------------. |
1482                |                    |               | |
1483                v                    |               v v
1484           pre-header                |            pre-header
1485                | .------------.     |                 | .------------.
1486                | |            |     |                 | |            |
1487                | v            |     |                 | v            |
1488              header           |     |               header           |
1489                |              |     |                 |              |
1490       .--- if (cond) ---.     |     |        .--- if (true) ---.     |
1491       |                 |     |     |        |                 |     |
1492   invariant             |     |     |    invariant             |     |
1493       |                 |     |     |        |                 |     |
1494       '---T--->.<---F---'     |     |        '---T--->.<---F---'     |
1495                |              |    /                  |              |
1496              stmts            |   /                 stmts            |
1497                |              F  T                    |              |
1498               / \             | /                    / \             |
1499      .-------*   *      [ if (cond) ]       .-------*   *            |
1500      |           |            |             |           |            |
1501      |         latch          |             |         latch          |
1502      |           |            |             |           |            |
1503      |           '------------'             |           '------------'
1504      '------------------------. .-----------'
1505              loop1            | |                   loop2
1506                               v v
1507                              exits
1508
1509    In the graph, loop1 represents the part derived from original one, and
1510    loop2 is duplicated using loop_version (), which corresponds to the part
1511    of original one being splitted out.  In original latch edge of loop1, we
1512    insert a new conditional statement duplicated from the semi-invariant cond,
1513    and one of its branch goes back to loop1 header as a latch edge, and the
1514    other branch goes to loop2 pre-header as an entry edge.  And also in loop2,
1515    we abandon the variant branch of the conditional statement by setting a
1516    constant bool condition, based on which branch is semi-invariant.  */
1517
1518 static bool
1519 do_split_loop_on_cond (struct loop *loop1, edge invar_branch)
1520 {
1521   basic_block cond_bb = invar_branch->src;
1522   bool true_invar = !!(invar_branch->flags & EDGE_TRUE_VALUE);
1523   gcond *cond = as_a <gcond *> (last_stmt (cond_bb));
1524
1525   gcc_assert (cond_bb->loop_father == loop1);
1526
1527   if (dump_enabled_p ())
1528     dump_printf_loc (MSG_OPTIMIZED_LOCATIONS, cond,
1529                      "loop split on semi-invariant condition at %s branch\n",
1530                      true_invar ? "true" : "false");
1531
1532   initialize_original_copy_tables ();
1533
1534   struct loop *loop2 = loop_version (loop1, boolean_true_node, NULL,
1535                                      invar_branch->probability.invert (),
1536                                      invar_branch->probability,
1537                                      profile_probability::always (),
1538                                      profile_probability::always (),
1539                                      true);
1540   if (!loop2)
1541     {
1542       free_original_copy_tables ();
1543       return false;
1544     }
1545
1546   basic_block cond_bb_copy = get_bb_copy (cond_bb);
1547   gcond *cond_copy = as_a<gcond *> (last_stmt (cond_bb_copy));
1548
1549   /* Replace the condition in loop2 with a bool constant to let PassManager
1550      remove the variant branch after current pass completes.  */
1551   if (true_invar)
1552     gimple_cond_make_true (cond_copy);
1553   else
1554     gimple_cond_make_false (cond_copy);
1555
1556   update_stmt (cond_copy);
1557
1558   /* Insert a new conditional statement on latch edge of loop1, its condition
1559      is duplicated from the semi-invariant.  This statement acts as a switch
1560      to transfer execution from loop1 to loop2, when loop1 enters into
1561      invariant state.  */
1562   basic_block latch_bb = split_edge (loop_latch_edge (loop1));
1563   basic_block break_bb = split_edge (single_pred_edge (latch_bb));
1564   gimple *break_cond = gimple_build_cond (gimple_cond_code(cond),
1565                                           gimple_cond_lhs (cond),
1566                                           gimple_cond_rhs (cond),
1567                                           NULL_TREE, NULL_TREE);
1568
1569   gimple_stmt_iterator gsi = gsi_last_bb (break_bb);
1570   gsi_insert_after (&gsi, break_cond, GSI_NEW_STMT);
1571
1572   edge to_loop1 = single_succ_edge (break_bb);
1573   edge to_loop2 = make_edge (break_bb, loop_preheader_edge (loop2)->src, 0);
1574
1575   to_loop1->flags &= ~EDGE_FALLTHRU;
1576   to_loop1->flags |= true_invar ? EDGE_FALSE_VALUE : EDGE_TRUE_VALUE;
1577   to_loop2->flags |= true_invar ? EDGE_TRUE_VALUE : EDGE_FALSE_VALUE;
1578
1579   /* Due to introduction of a control flow edge from loop1 latch to loop2
1580      pre-header, we should update PHIs in loop2 to reflect this connection
1581      between loop1 and loop2.  */
1582   connect_loop_phis (loop1, loop2, to_loop2);
1583
1584   edge true_edge, false_edge, skip_edge1, skip_edge2;
1585   extract_true_false_edges_from_block (cond_bb, &true_edge, &false_edge);
1586
1587   skip_edge1 = true_invar ? false_edge : true_edge;
1588   skip_edge2 = true_invar ? true_edge : false_edge;
1589   fix_loop_bb_probability (loop1, loop2, skip_edge1, skip_edge2);
1590
1591   /* Fix first loop's exit probability after scaling.  */
1592   to_loop1->probability = invar_branch->probability.invert ();
1593   to_loop2->probability = invar_branch->probability;
1594
1595   free_original_copy_tables ();
1596
1597   return true;
1598 }
1599
1600 /* Traverse all conditional statements in LOOP, to find out a good candidate
1601    upon which we can do loop split.  */
1602
1603 static bool
1604 split_loop_on_cond (struct loop *loop)
1605 {
1606   split_info *info = new split_info ();
1607   basic_block *bbs = info->bbs = get_loop_body (loop);
1608   bool do_split = false;
1609
1610   /* Allocate an area to keep temporary info, and associate its address
1611      with loop aux field.  */
1612   loop->aux = info;
1613
1614   for (unsigned i = 0; i < loop->num_nodes; i++)
1615     bbs[i]->aux = NULL;
1616
1617   for (unsigned i = 0; i < loop->num_nodes; i++)
1618     {
1619       basic_block bb = bbs[i];
1620
1621       /* We only consider conditional statement, which be executed at most once
1622          in each iteration of the loop.  So skip statements in inner loops.  */
1623       if ((bb->loop_father != loop) || (bb->flags & BB_IRREDUCIBLE_LOOP))
1624         continue;
1625
1626       /* Actually this check is not a must constraint.  With it, we can ensure
1627          conditional statement will always be executed in each iteration.  */
1628       if (!dominated_by_p (CDI_DOMINATORS, loop->latch, bb))
1629         continue;
1630
1631       gimple *last = last_stmt (bb);
1632
1633       if (!last || gimple_code (last) != GIMPLE_COND)
1634         continue;
1635
1636       gcond *cond = as_a <gcond *> (last);
1637       edge branch_edge = get_cond_branch_to_split_loop (loop, cond);
1638
1639       if (branch_edge)
1640         {
1641           do_split_loop_on_cond (loop, branch_edge);
1642           do_split = true;
1643           break;
1644         }
1645     }
1646
1647   delete info;
1648   loop->aux = NULL;
1649
1650   return do_split;
1651 }
1652
1653 /* Main entry point.  Perform loop splitting on all suitable loops.  */
1654
1655 static unsigned int
1656 tree_ssa_split_loops (void)
1657 {
1658   bool changed = false;
1659
1660   gcc_assert (scev_initialized_p ());
1661
1662   calculate_dominance_info (CDI_POST_DOMINATORS);
1663
1664   for (auto loop : loops_list (cfun, LI_INCLUDE_ROOT))
1665     loop->aux = NULL;
1666
1667   /* Go through all loops starting from innermost.  */
1668   for (auto loop : loops_list (cfun, LI_FROM_INNERMOST))
1669     {
1670       if (loop->aux)
1671         {
1672           /* If any of our inner loops was split, don't split us,
1673              and mark our containing loop as having had splits as well.
1674              This allows for delaying SSA update.  */
1675           loop_outer (loop)->aux = loop;
1676           continue;
1677         }
1678
1679       if (optimize_loop_for_size_p (loop))
1680         continue;
1681
1682       if (split_loop (loop) || split_loop_on_cond (loop))
1683         {
1684           /* Mark our containing loop as having had some split inner loops.  */
1685           loop_outer (loop)->aux = loop;
1686           changed = true;
1687         }
1688     }
1689
1690   for (auto loop : loops_list (cfun, LI_INCLUDE_ROOT))
1691     loop->aux = NULL;
1692
1693   clear_aux_for_blocks ();
1694
1695   free_dominance_info (CDI_POST_DOMINATORS);
1696
1697   if (changed)
1698     {
1699       rewrite_into_loop_closed_ssa (NULL, TODO_update_ssa);
1700       return TODO_cleanup_cfg;
1701     }
1702   return 0;
1703 }
1704
1705 /* Loop splitting pass.  */
1706
1707 namespace {
1708
1709 const pass_data pass_data_loop_split =
1710 {
1711   GIMPLE_PASS, /* type */
1712   "lsplit", /* name */
1713   OPTGROUP_LOOP, /* optinfo_flags */
1714   TV_LOOP_SPLIT, /* tv_id */
1715   PROP_cfg, /* properties_required */
1716   0, /* properties_provided */
1717   0, /* properties_destroyed */
1718   0, /* todo_flags_start */
1719   0, /* todo_flags_finish */
1720 };
1721
1722 class pass_loop_split : public gimple_opt_pass
1723 {
1724 public:
1725   pass_loop_split (gcc::context *ctxt)
1726     : gimple_opt_pass (pass_data_loop_split, ctxt)
1727   {}
1728
1729   /* opt_pass methods: */
1730   bool gate (function *) final override { return flag_split_loops != 0; }
1731   unsigned int execute (function *) final override;
1732
1733 }; // class pass_loop_split
1734
1735 unsigned int
1736 pass_loop_split::execute (function *fun)
1737 {
1738   if (number_of_loops (fun) <= 1)
1739     return 0;
1740
1741   return tree_ssa_split_loops ();
1742 }
1743
1744 } // anon namespace
1745
1746 gimple_opt_pass *
1747 make_pass_loop_split (gcc::context *ctxt)
1748 {
1749   return new pass_loop_split (ctxt);
1750 }