gcc/predict.c

   1 /* Branch prediction routines for the GNU compiler.
   2    Copyright (C) 2000-2018 Free Software Foundation, Inc.
   3
   4 This file is part of GCC.
   5
   6 GCC is free software; you can redistribute it and/or modify it under
   7 the terms of the GNU General Public License as published by the Free
   8 Software Foundation; either version 3, or (at your option) any later
   9 version.
  10
  11 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  13 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  14 for more details.
  15
  16 You should have received a copy of the GNU General Public License
  17 along with GCC; see the file COPYING3.  If not see
  18 <http://www.gnu.org/licenses/>.  */
  19
  20 /* References:
  21
  22    [1] "Branch Prediction for Free"
  23        Ball and Larus; PLDI '93.
  24    [2] "Static Branch Frequency and Program Profile Analysis"
  25        Wu and Larus; MICRO-27.
  26    [3] "Corpus-based Static Branch Prediction"
  27        Calder, Grunwald, Lindsay, Martin, Mozer, and Zorn; PLDI '95.  */
  28
  29
  30 #include "config.h"
  31 #include "system.h"
  32 #include "coretypes.h"
  33 #include "backend.h"
  34 #include "rtl.h"
  35 #include "tree.h"
  36 #include "gimple.h"
  37 #include "cfghooks.h"
  38 #include "tree-pass.h"
  39 #include "ssa.h"
  40 #include "memmodel.h"
  41 #include "emit-rtl.h"
  42 #include "cgraph.h"
  43 #include "coverage.h"
  44 #include "diagnostic-core.h"
  45 #include "gimple-predict.h"
  46 #include "fold-const.h"
  47 #include "calls.h"
  48 #include "cfganal.h"
  49 #include "profile.h"
  50 #include "sreal.h"
  51 #include "params.h"
  52 #include "cfgloop.h"
  53 #include "gimple-iterator.h"
  54 #include "tree-cfg.h"
  55 #include "tree-ssa-loop-niter.h"
  56 #include "tree-ssa-loop.h"
  57 #include "tree-scalar-evolution.h"
  58 #include "ipa-utils.h"
  59 #include "gimple-pretty-print.h"
  60 #include "selftest.h"
  61 #include "cfgrtl.h"
  62 #include "stringpool.h"
  63 #include "attribs.h"
  64
  65 /* Enum with reasons why a predictor is ignored.  */
  66
  67 enum predictor_reason
  68 {
  69   REASON_NONE,
  70   REASON_IGNORED,
  71   REASON_SINGLE_EDGE_DUPLICATE,
  72   REASON_EDGE_PAIR_DUPLICATE
  73 };
  74
  75 /* String messages for the aforementioned enum.  */
  76
  77 static const char *reason_messages[] = {"", " (ignored)",
  78     " (single edge duplicate)", " (edge pair duplicate)"};
  79
  80 /* real constants: 0, 1, 1-1/REG_BR_PROB_BASE, REG_BR_PROB_BASE,
  81                    1/REG_BR_PROB_BASE, 0.5, BB_FREQ_MAX.  */
  82 static sreal real_almost_one, real_br_prob_base,
  83              real_inv_br_prob_base, real_one_half, real_bb_freq_max;
  84
  85 static void combine_predictions_for_insn (rtx_insn *, basic_block);
  86 static void dump_prediction (FILE *, enum br_predictor, int, basic_block,
  87                              enum predictor_reason, edge);
  88 static void predict_paths_leading_to (basic_block, enum br_predictor,
  89                                       enum prediction,
  90                                       struct loop *in_loop = NULL);
  91 static void predict_paths_leading_to_edge (edge, enum br_predictor,
  92                                            enum prediction,
  93                                            struct loop *in_loop = NULL);
  94 static bool can_predict_insn_p (const rtx_insn *);
  95 static HOST_WIDE_INT get_predictor_value (br_predictor, HOST_WIDE_INT);
  96
  97 /* Information we hold about each branch predictor.
  98    Filled using information from predict.def.  */
  99
 100 struct predictor_info
 101 {
 102   const char *const name;       /* Name used in the debugging dumps.  */
 103   const int hitrate;            /* Expected hitrate used by
 104                                    predict_insn_def call.  */
 105   const int flags;
 106 };
 107
 108 /* Use given predictor without Dempster-Shaffer theory if it matches
 109    using first_match heuristics.  */
 110 #define PRED_FLAG_FIRST_MATCH 1
 111
 112 /* Recompute hitrate in percent to our representation.  */
 113
 114 #define HITRATE(VAL) ((int) ((VAL) * REG_BR_PROB_BASE + 50) / 100)
 115
 116 #define DEF_PREDICTOR(ENUM, NAME, HITRATE, FLAGS) {NAME, HITRATE, FLAGS},
 117 static const struct predictor_info predictor_info[]= {
 118 #include "predict.def"
 119
 120   /* Upper bound on predictors.  */
 121   {NULL, 0, 0}
 122 };
 123 #undef DEF_PREDICTOR
 124
 125 static gcov_type min_count = -1;
 126
 127 /* Determine the threshold for hot BB counts.  */
 128
 129 gcov_type
 130 get_hot_bb_threshold ()
 131 {
 132   gcov_working_set_t *ws;
 133   if (min_count == -1)
 134     {
 135       ws = find_working_set (PARAM_VALUE (HOT_BB_COUNT_WS_PERMILLE));
 136       gcc_assert (ws);
 137       min_count = ws->min_counter;
 138     }
 139   return min_count;
 140 }
 141
 142 /* Set the threshold for hot BB counts.  */
 143
 144 void
 145 set_hot_bb_threshold (gcov_type min)
 146 {
 147   min_count = min;
 148 }
 149
 150 /* Return TRUE if frequency FREQ is considered to be hot.  */
 151
 152 bool
 153 maybe_hot_count_p (struct function *fun, profile_count count)
 154 {
 155   if (!count.initialized_p ())
 156     return true;
 157   if (count.ipa () == profile_count::zero ())
 158     return false;
 159   if (!count.ipa_p ())
 160     {
 161       struct cgraph_node *node = cgraph_node::get (fun->decl);
 162       if (!profile_info || profile_status_for_fn (fun) != PROFILE_READ)
 163         {
 164           if (node->frequency == NODE_FREQUENCY_UNLIKELY_EXECUTED)
 165             return false;
 166           if (node->frequency == NODE_FREQUENCY_HOT)
 167             return true;
 168         }
 169       if (profile_status_for_fn (fun) == PROFILE_ABSENT)
 170         return true;
 171       if (node->frequency == NODE_FREQUENCY_EXECUTED_ONCE
 172           && count < (ENTRY_BLOCK_PTR_FOR_FN (fun)->count.apply_scale (2, 3)))
 173         return false;
 174       if (PARAM_VALUE (HOT_BB_FREQUENCY_FRACTION) == 0)
 175         return false;
 176       if (count.apply_scale (PARAM_VALUE (HOT_BB_FREQUENCY_FRACTION), 1)
 177           < ENTRY_BLOCK_PTR_FOR_FN (fun)->count)
 178         return false;
 179       return true;
 180     }
 181   /* Code executed at most once is not hot.  */
 182   if (count <= MAX (profile_info ? profile_info->runs : 1, 1))
 183     return false;
 184   return (count.to_gcov_type () >= get_hot_bb_threshold ());
 185 }
 186
 187 /* Return true in case BB can be CPU intensive and should be optimized
 188    for maximal performance.  */
 189
 190 bool
 191 maybe_hot_bb_p (struct function *fun, const_basic_block bb)
 192 {
 193   gcc_checking_assert (fun);
 194   return maybe_hot_count_p (fun, bb->count);
 195 }
 196
 197 /* Return true in case BB can be CPU intensive and should be optimized
 198    for maximal performance.  */
 199
 200 bool
 201 maybe_hot_edge_p (edge e)
 202 {
 203   return maybe_hot_count_p (cfun, e->count ());
 204 }
 205
 206 /* Return true if profile COUNT and FREQUENCY, or function FUN static
 207    node frequency reflects never being executed.  */
 208
 209 static bool
 210 probably_never_executed (struct function *fun,
 211                          profile_count count)
 212 {
 213   gcc_checking_assert (fun);
 214   if (count.ipa () == profile_count::zero ())
 215     return true;
 216   /* Do not trust adjusted counts.  This will make us to drop int cold section
 217      code with low execution count as a result of inlining. These low counts
 218      are not safe even with read profile and may lead us to dropping
 219      code which actually gets executed into cold section of binary that is not
 220      desirable.  */
 221   if (count.precise_p () && profile_status_for_fn (fun) == PROFILE_READ)
 222     {
 223       int unlikely_count_fraction = PARAM_VALUE (UNLIKELY_BB_COUNT_FRACTION);
 224       if (count.apply_scale (unlikely_count_fraction, 1) >= profile_info->runs)
 225         return false;
 226       return true;
 227     }
 228   if ((!profile_info || profile_status_for_fn (fun) != PROFILE_READ)
 229       && (cgraph_node::get (fun->decl)->frequency
 230           == NODE_FREQUENCY_UNLIKELY_EXECUTED))
 231     return true;
 232   return false;
 233 }
 234
 235
 236 /* Return true in case BB is probably never executed.  */
 237
 238 bool
 239 probably_never_executed_bb_p (struct function *fun, const_basic_block bb)
 240 {
 241   return probably_never_executed (fun, bb->count);
 242 }
 243
 244
 245 /* Return true if E is unlikely executed for obvious reasons.  */
 246
 247 static bool
 248 unlikely_executed_edge_p (edge e)
 249 {
 250   return (e->count () == profile_count::zero ()
 251           || e->probability == profile_probability::never ())
 252          || (e->flags & (EDGE_EH | EDGE_FAKE));
 253 }
 254
 255 /* Return true in case edge E is probably never executed.  */
 256
 257 bool
 258 probably_never_executed_edge_p (struct function *fun, edge e)
 259 {
 260   if (unlikely_executed_edge_p (e))
 261     return true;
 262   return probably_never_executed (fun, e->count ());
 263 }
 264
 265 /* Return true when current function should always be optimized for size.  */
 266
 267 bool
 268 optimize_function_for_size_p (struct function *fun)
 269 {
 270   if (!fun || !fun->decl)
 271     return optimize_size;
 272   cgraph_node *n = cgraph_node::get (fun->decl);
 273   return n && n->optimize_for_size_p ();
 274 }
 275
 276 /* Return true when current function should always be optimized for speed.  */
 277
 278 bool
 279 optimize_function_for_speed_p (struct function *fun)
 280 {
 281   return !optimize_function_for_size_p (fun);
 282 }
 283
 284 /* Return the optimization type that should be used for the function FUN.  */
 285
 286 optimization_type
 287 function_optimization_type (struct function *fun)
 288 {
 289   return (optimize_function_for_speed_p (fun)
 290           ? OPTIMIZE_FOR_SPEED
 291           : OPTIMIZE_FOR_SIZE);
 292 }
 293
 294 /* Return TRUE when BB should be optimized for size.  */
 295
 296 bool
 297 optimize_bb_for_size_p (const_basic_block bb)
 298 {
 299   return (optimize_function_for_size_p (cfun)
 300           || (bb && !maybe_hot_bb_p (cfun, bb)));
 301 }
 302
 303 /* Return TRUE when BB should be optimized for speed.  */
 304
 305 bool
 306 optimize_bb_for_speed_p (const_basic_block bb)
 307 {
 308   return !optimize_bb_for_size_p (bb);
 309 }
 310
 311 /* Return the optimization type that should be used for block BB.  */
 312
 313 optimization_type
 314 bb_optimization_type (const_basic_block bb)
 315 {
 316   return (optimize_bb_for_speed_p (bb)
 317           ? OPTIMIZE_FOR_SPEED
 318           : OPTIMIZE_FOR_SIZE);
 319 }
 320
 321 /* Return TRUE when BB should be optimized for size.  */
 322
 323 bool
 324 optimize_edge_for_size_p (edge e)
 325 {
 326   return optimize_function_for_size_p (cfun) || !maybe_hot_edge_p (e);
 327 }
 328
 329 /* Return TRUE when BB should be optimized for speed.  */
 330
 331 bool
 332 optimize_edge_for_speed_p (edge e)
 333 {
 334   return !optimize_edge_for_size_p (e);
 335 }
 336
 337 /* Return TRUE when BB should be optimized for size.  */
 338
 339 bool
 340 optimize_insn_for_size_p (void)
 341 {
 342   return optimize_function_for_size_p (cfun) || !crtl->maybe_hot_insn_p;
 343 }
 344
 345 /* Return TRUE when BB should be optimized for speed.  */
 346
 347 bool
 348 optimize_insn_for_speed_p (void)
 349 {
 350   return !optimize_insn_for_size_p ();
 351 }
 352
 353 /* Return TRUE when LOOP should be optimized for size.  */
 354
 355 bool
 356 optimize_loop_for_size_p (struct loop *loop)
 357 {
 358   return optimize_bb_for_size_p (loop->header);
 359 }
 360
 361 /* Return TRUE when LOOP should be optimized for speed.  */
 362
 363 bool
 364 optimize_loop_for_speed_p (struct loop *loop)
 365 {
 366   return optimize_bb_for_speed_p (loop->header);
 367 }
 368
 369 /* Return TRUE when LOOP nest should be optimized for speed.  */
 370
 371 bool
 372 optimize_loop_nest_for_speed_p (struct loop *loop)
 373 {
 374   struct loop *l = loop;
 375   if (optimize_loop_for_speed_p (loop))
 376     return true;
 377   l = loop->inner;
 378   while (l && l != loop)
 379     {
 380       if (optimize_loop_for_speed_p (l))
 381         return true;
 382       if (l->inner)
 383         l = l->inner;
 384       else if (l->next)
 385         l = l->next;
 386       else
 387         {
 388           while (l != loop && !l->next)
 389             l = loop_outer (l);
 390           if (l != loop)
 391             l = l->next;
 392         }
 393     }
 394   return false;
 395 }
 396
 397 /* Return TRUE when LOOP nest should be optimized for size.  */
 398
 399 bool
 400 optimize_loop_nest_for_size_p (struct loop *loop)
 401 {
 402   return !optimize_loop_nest_for_speed_p (loop);
 403 }
 404
 405 /* Return true when edge E is likely to be well predictable by branch
 406    predictor.  */
 407
 408 bool
 409 predictable_edge_p (edge e)
 410 {
 411   if (!e->probability.initialized_p ())
 412     return false;
 413   if ((e->probability.to_reg_br_prob_base ()
 414        <= PARAM_VALUE (PARAM_PREDICTABLE_BRANCH_OUTCOME) * REG_BR_PROB_BASE / 100)
 415       || (REG_BR_PROB_BASE - e->probability.to_reg_br_prob_base ()
 416           <= PARAM_VALUE (PARAM_PREDICTABLE_BRANCH_OUTCOME) * REG_BR_PROB_BASE / 100))
 417     return true;
 418   return false;
 419 }
 420
 421
 422 /* Set RTL expansion for BB profile.  */
 423
 424 void
 425 rtl_profile_for_bb (basic_block bb)
 426 {
 427   crtl->maybe_hot_insn_p = maybe_hot_bb_p (cfun, bb);
 428 }
 429
 430 /* Set RTL expansion for edge profile.  */
 431
 432 void
 433 rtl_profile_for_edge (edge e)
 434 {
 435   crtl->maybe_hot_insn_p = maybe_hot_edge_p (e);
 436 }
 437
 438 /* Set RTL expansion to default mode (i.e. when profile info is not known).  */
 439 void
 440 default_rtl_profile (void)
 441 {
 442   crtl->maybe_hot_insn_p = true;
 443 }
 444
 445 /* Return true if the one of outgoing edges is already predicted by
 446    PREDICTOR.  */
 447
 448 bool
 449 rtl_predicted_by_p (const_basic_block bb, enum br_predictor predictor)
 450 {
 451   rtx note;
 452   if (!INSN_P (BB_END (bb)))
 453     return false;
 454   for (note = REG_NOTES (BB_END (bb)); note; note = XEXP (note, 1))
 455     if (REG_NOTE_KIND (note) == REG_BR_PRED
 456         && INTVAL (XEXP (XEXP (note, 0), 0)) == (int)predictor)
 457       return true;
 458   return false;
 459 }
 460
 461 /*  Structure representing predictions in tree level. */
 462
 463 struct edge_prediction {
 464     struct edge_prediction *ep_next;
 465     edge ep_edge;
 466     enum br_predictor ep_predictor;
 467     int ep_probability;
 468 };
 469
 470 /* This map contains for a basic block the list of predictions for the
 471    outgoing edges.  */
 472
 473 static hash_map<const_basic_block, edge_prediction *> *bb_predictions;
 474
 475 /* Return true if the one of outgoing edges is already predicted by
 476    PREDICTOR.  */
 477
 478 bool
 479 gimple_predicted_by_p (const_basic_block bb, enum br_predictor predictor)
 480 {
 481   struct edge_prediction *i;
 482   edge_prediction **preds = bb_predictions->get (bb);
 483
 484   if (!preds)
 485     return false;
 486
 487   for (i = *preds; i; i = i->ep_next)
 488     if (i->ep_predictor == predictor)
 489       return true;
 490   return false;
 491 }
 492
 493 /* Return true if the one of outgoing edges is already predicted by
 494    PREDICTOR for edge E predicted as TAKEN.  */
 495
 496 bool
 497 edge_predicted_by_p (edge e, enum br_predictor predictor, bool taken)
 498 {
 499   struct edge_prediction *i;
 500   basic_block bb = e->src;
 501   edge_prediction **preds = bb_predictions->get (bb);
 502   if (!preds)
 503     return false;
 504
 505   int probability = predictor_info[(int) predictor].hitrate;
 506
 507   if (taken != TAKEN)
 508     probability = REG_BR_PROB_BASE - probability;
 509
 510   for (i = *preds; i; i = i->ep_next)
 511     if (i->ep_predictor == predictor
 512         && i->ep_edge == e
 513         && i->ep_probability == probability)
 514       return true;
 515   return false;
 516 }
 517
 518 /* Same predicate as above, working on edges.  */
 519 bool
 520 edge_probability_reliable_p (const_edge e)
 521 {
 522   return e->probability.probably_reliable_p ();
 523 }
 524
 525 /* Same predicate as edge_probability_reliable_p, working on notes.  */
 526 bool
 527 br_prob_note_reliable_p (const_rtx note)
 528 {
 529   gcc_assert (REG_NOTE_KIND (note) == REG_BR_PROB);
 530   return profile_probability::from_reg_br_prob_note
 531                  (XINT (note, 0)).probably_reliable_p ();
 532 }
 533
 534 static void
 535 predict_insn (rtx_insn *insn, enum br_predictor predictor, int probability)
 536 {
 537   gcc_assert (any_condjump_p (insn));
 538   if (!flag_guess_branch_prob)
 539     return;
 540
 541   add_reg_note (insn, REG_BR_PRED,
 542                 gen_rtx_CONCAT (VOIDmode,
 543                                 GEN_INT ((int) predictor),
 544                                 GEN_INT ((int) probability)));
 545 }
 546
 547 /* Predict insn by given predictor.  */
 548
 549 void
 550 predict_insn_def (rtx_insn *insn, enum br_predictor predictor,
 551                   enum prediction taken)
 552 {
 553    int probability = predictor_info[(int) predictor].hitrate;
 554    gcc_assert (probability != PROB_UNINITIALIZED);
 555
 556    if (taken != TAKEN)
 557      probability = REG_BR_PROB_BASE - probability;
 558
 559    predict_insn (insn, predictor, probability);
 560 }
 561
 562 /* Predict edge E with given probability if possible.  */
 563
 564 void
 565 rtl_predict_edge (edge e, enum br_predictor predictor, int probability)
 566 {
 567   rtx_insn *last_insn;
 568   last_insn = BB_END (e->src);
 569
 570   /* We can store the branch prediction information only about
 571      conditional jumps.  */
 572   if (!any_condjump_p (last_insn))
 573     return;
 574
 575   /* We always store probability of branching.  */
 576   if (e->flags & EDGE_FALLTHRU)
 577     probability = REG_BR_PROB_BASE - probability;
 578
 579   predict_insn (last_insn, predictor, probability);
 580 }
 581
 582 /* Predict edge E with the given PROBABILITY.  */
 583 void
 584 gimple_predict_edge (edge e, enum br_predictor predictor, int probability)
 585 {
 586   if (e->src != ENTRY_BLOCK_PTR_FOR_FN (cfun)
 587       && EDGE_COUNT (e->src->succs) > 1
 588       && flag_guess_branch_prob
 589       && optimize)
 590     {
 591       struct edge_prediction *i = XNEW (struct edge_prediction);
 592       edge_prediction *&preds = bb_predictions->get_or_insert (e->src);
 593
 594       i->ep_next = preds;
 595       preds = i;
 596       i->ep_probability = probability;
 597       i->ep_predictor = predictor;
 598       i->ep_edge = e;
 599     }
 600 }
 601
 602 /* Filter edge predictions PREDS by a function FILTER.  DATA are passed
 603    to the filter function.  */
 604
 605 void
 606 filter_predictions (edge_prediction **preds,
 607                     bool (*filter) (edge_prediction *, void *), void *data)
 608 {
 609   if (!bb_predictions)
 610     return;
 611
 612   if (preds)
 613     {
 614       struct edge_prediction **prediction = preds;
 615       struct edge_prediction *next;
 616
 617       while (*prediction)
 618         {
 619           if ((*filter) (*prediction, data))
 620             prediction = &((*prediction)->ep_next);
 621           else
 622             {
 623               next = (*prediction)->ep_next;
 624               free (*prediction);
 625               *prediction = next;
 626             }
 627         }
 628     }
 629 }
 630
 631 /* Filter function predicate that returns true for a edge predicate P
 632    if its edge is equal to DATA.  */
 633
 634 bool
 635 equal_edge_p (edge_prediction *p, void *data)
 636 {
 637   return p->ep_edge == (edge)data;
 638 }
 639
 640 /* Remove all predictions on given basic block that are attached
 641    to edge E.  */
 642 void
 643 remove_predictions_associated_with_edge (edge e)
 644 {
 645   if (!bb_predictions)
 646     return;
 647
 648   edge_prediction **preds = bb_predictions->get (e->src);
 649   filter_predictions (preds, equal_edge_p, e);
 650 }
 651
 652 /* Clears the list of predictions stored for BB.  */
 653
 654 static void
 655 clear_bb_predictions (basic_block bb)
 656 {
 657   edge_prediction **preds = bb_predictions->get (bb);
 658   struct edge_prediction *pred, *next;
 659
 660   if (!preds)
 661     return;
 662
 663   for (pred = *preds; pred; pred = next)
 664     {
 665       next = pred->ep_next;
 666       free (pred);
 667     }
 668   *preds = NULL;
 669 }
 670
 671 /* Return true when we can store prediction on insn INSN.
 672    At the moment we represent predictions only on conditional
 673    jumps, not at computed jump or other complicated cases.  */
 674 static bool
 675 can_predict_insn_p (const rtx_insn *insn)
 676 {
 677   return (JUMP_P (insn)
 678           && any_condjump_p (insn)
 679           && EDGE_COUNT (BLOCK_FOR_INSN (insn)->succs) >= 2);
 680 }
 681
 682 /* Predict edge E by given predictor if possible.  */
 683
 684 void
 685 predict_edge_def (edge e, enum br_predictor predictor,
 686                   enum prediction taken)
 687 {
 688    int probability = predictor_info[(int) predictor].hitrate;
 689
 690    if (taken != TAKEN)
 691      probability = REG_BR_PROB_BASE - probability;
 692
 693    predict_edge (e, predictor, probability);
 694 }
 695
 696 /* Invert all branch predictions or probability notes in the INSN.  This needs
 697    to be done each time we invert the condition used by the jump.  */
 698
 699 void
 700 invert_br_probabilities (rtx insn)
 701 {
 702   rtx note;
 703
 704   for (note = REG_NOTES (insn); note; note = XEXP (note, 1))
 705     if (REG_NOTE_KIND (note) == REG_BR_PROB)
 706       XINT (note, 0) = profile_probability::from_reg_br_prob_note
 707                          (XINT (note, 0)).invert ().to_reg_br_prob_note ();
 708     else if (REG_NOTE_KIND (note) == REG_BR_PRED)
 709       XEXP (XEXP (note, 0), 1)
 710         = GEN_INT (REG_BR_PROB_BASE - INTVAL (XEXP (XEXP (note, 0), 1)));
 711 }
 712
 713 /* Dump information about the branch prediction to the output file.  */
 714
 715 static void
 716 dump_prediction (FILE *file, enum br_predictor predictor, int probability,
 717                  basic_block bb, enum predictor_reason reason = REASON_NONE,
 718                  edge ep_edge = NULL)
 719 {
 720   edge e = ep_edge;
 721   edge_iterator ei;
 722
 723   if (!file)
 724     return;
 725
 726   if (e == NULL)
 727     FOR_EACH_EDGE (e, ei, bb->succs)
 728       if (! (e->flags & EDGE_FALLTHRU))
 729         break;
 730
 731   char edge_info_str[128];
 732   if (ep_edge)
 733     sprintf (edge_info_str, " of edge %d->%d", ep_edge->src->index,
 734              ep_edge->dest->index);
 735   else
 736     edge_info_str[0] = '\0';
 737
 738   fprintf (file, "  %s heuristics%s%s: %.2f%%",
 739            predictor_info[predictor].name,
 740            edge_info_str, reason_messages[reason],
 741            probability * 100.0 / REG_BR_PROB_BASE);
 742
 743   if (bb->count.initialized_p ())
 744     {
 745       fprintf (file, "  exec ");
 746       bb->count.dump (file);
 747       if (e)
 748         {
 749           fprintf (file, " hit ");
 750           e->count ().dump (file);
 751           fprintf (file, " (%.1f%%)", e->count ().to_gcov_type() * 100.0
 752                    / bb->count.to_gcov_type ());
 753         }
 754     }
 755
 756   fprintf (file, "\n");
 757
 758   /* Print output that be easily read by analyze_brprob.py script. We are
 759      interested only in counts that are read from GCDA files.  */
 760   if (dump_file && (dump_flags & TDF_DETAILS)
 761       && bb->count.precise_p ()
 762       && reason == REASON_NONE)
 763     {
 764       gcc_assert (e->count ().precise_p ());
 765       fprintf (file, ";;heuristics;%s;%" PRId64 ";%" PRId64 ";%.1f;\n",
 766                predictor_info[predictor].name,
 767                bb->count.to_gcov_type (), e->count ().to_gcov_type (),
 768                probability * 100.0 / REG_BR_PROB_BASE);
 769     }
 770 }
 771
 772 /* Return true if STMT is known to be unlikely executed.  */
 773
 774 static bool
 775 unlikely_executed_stmt_p (gimple *stmt)
 776 {
 777   if (!is_gimple_call (stmt))
 778     return false;
 779   /* NORETURN attribute alone is not strong enough: exit() may be quite
 780      likely executed once during program run.  */
 781   if (gimple_call_fntype (stmt)
 782       && lookup_attribute ("cold",
 783                            TYPE_ATTRIBUTES (gimple_call_fntype (stmt)))
 784       && !lookup_attribute ("cold", DECL_ATTRIBUTES (current_function_decl)))
 785     return true;
 786   tree decl = gimple_call_fndecl (stmt);
 787   if (!decl)
 788     return false;
 789   if (lookup_attribute ("cold", DECL_ATTRIBUTES (decl))
 790       && !lookup_attribute ("cold", DECL_ATTRIBUTES (current_function_decl)))
 791     return true;
 792
 793   cgraph_node *n = cgraph_node::get (decl);
 794   if (!n)
 795     return false;
 796
 797   availability avail;
 798   n = n->ultimate_alias_target (&avail);
 799   if (avail < AVAIL_AVAILABLE)
 800     return false;
 801   if (!n->analyzed
 802       || n->decl == current_function_decl)
 803     return false;
 804   return n->frequency == NODE_FREQUENCY_UNLIKELY_EXECUTED;
 805 }
 806
 807 /* Return true if BB is unlikely executed.  */
 808
 809 static bool
 810 unlikely_executed_bb_p (basic_block bb)
 811 {
 812   if (bb->count == profile_count::zero ())
 813     return true;
 814   if (bb == ENTRY_BLOCK_PTR_FOR_FN (cfun) || bb == EXIT_BLOCK_PTR_FOR_FN (cfun))
 815     return false;
 816   for (gimple_stmt_iterator gsi = gsi_start_bb (bb);
 817        !gsi_end_p (gsi); gsi_next (&gsi))
 818     {
 819       if (unlikely_executed_stmt_p (gsi_stmt (gsi)))
 820         return true;
 821       if (stmt_can_terminate_bb_p (gsi_stmt (gsi)))
 822         return false;
 823     }
 824   return false;
 825 }
 826
 827 /* We can not predict the probabilities of outgoing edges of bb.  Set them
 828    evenly and hope for the best.  If UNLIKELY_EDGES is not null, distribute
 829    even probability for all edges not mentioned in the set.  These edges
 830    are given PROB_VERY_UNLIKELY probability.  */
 831
 832 static void
 833 set_even_probabilities (basic_block bb,
 834                         hash_set<edge> *unlikely_edges = NULL)
 835 {
 836   unsigned nedges = 0, unlikely_count = 0;
 837   edge e = NULL;
 838   edge_iterator ei;
 839   profile_probability all = profile_probability::always ();
 840
 841   FOR_EACH_EDGE (e, ei, bb->succs)
 842     if (e->probability.initialized_p ())
 843       all -= e->probability;
 844     else if (!unlikely_executed_edge_p (e))
 845       {
 846         nedges ++;
 847         if (unlikely_edges != NULL && unlikely_edges->contains (e))
 848           {
 849             all -= profile_probability::very_unlikely ();
 850             unlikely_count++;
 851           }
 852       }
 853
 854   /* Make the distribution even if all edges are unlikely.  */
 855   if (unlikely_count == nedges)
 856     {
 857       unlikely_edges = NULL;
 858       unlikely_count = 0;
 859     }
 860
 861   unsigned c = nedges - unlikely_count;
 862
 863   FOR_EACH_EDGE (e, ei, bb->succs)
 864     if (e->probability.initialized_p ())
 865       ;
 866     else if (!unlikely_executed_edge_p (e))
 867       {
 868         if (unlikely_edges != NULL && unlikely_edges->contains (e))
 869           e->probability = profile_probability::very_unlikely ();
 870         else
 871           e->probability = all.apply_scale (1, c).guessed ();
 872       }
 873     else
 874       e->probability = profile_probability::never ();
 875 }
 876
 877 /* Add REG_BR_PROB note to JUMP with PROB.  */
 878
 879 void
 880 add_reg_br_prob_note (rtx_insn *jump, profile_probability prob)
 881 {
 882   gcc_checking_assert (JUMP_P (jump) && !find_reg_note (jump, REG_BR_PROB, 0));
 883   add_int_reg_note (jump, REG_BR_PROB, prob.to_reg_br_prob_note ());
 884 }
 885
 886 /* Combine all REG_BR_PRED notes into single probability and attach REG_BR_PROB
 887    note if not already present.  Remove now useless REG_BR_PRED notes.  */
 888
 889 static void
 890 combine_predictions_for_insn (rtx_insn *insn, basic_block bb)
 891 {
 892   rtx prob_note;
 893   rtx *pnote;
 894   rtx note;
 895   int best_probability = PROB_EVEN;
 896   enum br_predictor best_predictor = END_PREDICTORS;
 897   int combined_probability = REG_BR_PROB_BASE / 2;
 898   int d;
 899   bool first_match = false;
 900   bool found = false;
 901
 902   if (!can_predict_insn_p (insn))
 903     {
 904       set_even_probabilities (bb);
 905       return;
 906     }
 907
 908   prob_note = find_reg_note (insn, REG_BR_PROB, 0);
 909   pnote = &REG_NOTES (insn);
 910   if (dump_file)
 911     fprintf (dump_file, "Predictions for insn %i bb %i\n", INSN_UID (insn),
 912              bb->index);
 913
 914   /* We implement "first match" heuristics and use probability guessed
 915      by predictor with smallest index.  */
 916   for (note = REG_NOTES (insn); note; note = XEXP (note, 1))
 917     if (REG_NOTE_KIND (note) == REG_BR_PRED)
 918       {
 919         enum br_predictor predictor = ((enum br_predictor)
 920                                        INTVAL (XEXP (XEXP (note, 0), 0)));
 921         int probability = INTVAL (XEXP (XEXP (note, 0), 1));
 922
 923         found = true;
 924         if (best_predictor > predictor
 925             && predictor_info[predictor].flags & PRED_FLAG_FIRST_MATCH)
 926           best_probability = probability, best_predictor = predictor;
 927
 928         d = (combined_probability * probability
 929              + (REG_BR_PROB_BASE - combined_probability)
 930              * (REG_BR_PROB_BASE - probability));
 931
 932         /* Use FP math to avoid overflows of 32bit integers.  */
 933         if (d == 0)
 934           /* If one probability is 0% and one 100%, avoid division by zero.  */
 935           combined_probability = REG_BR_PROB_BASE / 2;
 936         else
 937           combined_probability = (((double) combined_probability) * probability
 938                                   * REG_BR_PROB_BASE / d + 0.5);
 939       }
 940
 941   /* Decide which heuristic to use.  In case we didn't match anything,
 942      use no_prediction heuristic, in case we did match, use either
 943      first match or Dempster-Shaffer theory depending on the flags.  */
 944
 945   if (best_predictor != END_PREDICTORS)
 946     first_match = true;
 947
 948   if (!found)
 949     dump_prediction (dump_file, PRED_NO_PREDICTION,
 950                      combined_probability, bb);
 951   else
 952     {
 953       if (!first_match)
 954         dump_prediction (dump_file, PRED_DS_THEORY, combined_probability,
 955                          bb, !first_match ? REASON_NONE : REASON_IGNORED);
 956       else
 957         dump_prediction (dump_file, PRED_FIRST_MATCH, best_probability,
 958                          bb, first_match ? REASON_NONE : REASON_IGNORED);
 959     }
 960
 961   if (first_match)
 962     combined_probability = best_probability;
 963   dump_prediction (dump_file, PRED_COMBINED, combined_probability, bb);
 964
 965   while (*pnote)
 966     {
 967       if (REG_NOTE_KIND (*pnote) == REG_BR_PRED)
 968         {
 969           enum br_predictor predictor = ((enum br_predictor)
 970                                          INTVAL (XEXP (XEXP (*pnote, 0), 0)));
 971           int probability = INTVAL (XEXP (XEXP (*pnote, 0), 1));
 972
 973           dump_prediction (dump_file, predictor, probability, bb,
 974                            (!first_match || best_predictor == predictor)
 975                            ? REASON_NONE : REASON_IGNORED);
 976           *pnote = XEXP (*pnote, 1);
 977         }
 978       else
 979         pnote = &XEXP (*pnote, 1);
 980     }
 981
 982   if (!prob_note)
 983     {
 984       profile_probability p
 985          = profile_probability::from_reg_br_prob_base (combined_probability);
 986       add_reg_br_prob_note (insn, p);
 987
 988       /* Save the prediction into CFG in case we are seeing non-degenerated
 989          conditional jump.  */
 990       if (!single_succ_p (bb))
 991         {
 992           BRANCH_EDGE (bb)->probability = p;
 993           FALLTHRU_EDGE (bb)->probability
 994             = BRANCH_EDGE (bb)->probability.invert ();
 995         }
 996     }
 997   else if (!single_succ_p (bb))
 998     {
 999       profile_probability prob = profile_probability::from_reg_br_prob_note
1000                                         (XINT (prob_note, 0));
1001
1002       BRANCH_EDGE (bb)->probability = prob;
1003       FALLTHRU_EDGE (bb)->probability = prob.invert ();
1004     }
1005   else
1006     single_succ_edge (bb)->probability = profile_probability::always ();
1007 }
1008
1009 /* Edge prediction hash traits.  */
1010
1011 struct predictor_hash: pointer_hash <edge_prediction>
1012 {
1013
1014   static inline hashval_t hash (const edge_prediction *);
1015   static inline bool equal (const edge_prediction *, const edge_prediction *);
1016 };
1017
1018 /* Calculate hash value of an edge prediction P based on predictor and
1019    normalized probability.  */
1020
1021 inline hashval_t
1022 predictor_hash::hash (const edge_prediction *p)
1023 {
1024   inchash::hash hstate;
1025   hstate.add_int (p->ep_predictor);
1026
1027   int prob = p->ep_probability;
1028   if (prob > REG_BR_PROB_BASE / 2)
1029     prob = REG_BR_PROB_BASE - prob;
1030
1031   hstate.add_int (prob);
1032
1033   return hstate.end ();
1034 }
1035
1036 /* Return true whether edge predictions P1 and P2 use the same predictor and
1037    have equal (or opposed probability).  */
1038
1039 inline bool
1040 predictor_hash::equal (const edge_prediction *p1, const edge_prediction *p2)
1041 {
1042   return (p1->ep_predictor == p2->ep_predictor
1043           && (p1->ep_probability == p2->ep_probability
1044               || p1->ep_probability == REG_BR_PROB_BASE - p2->ep_probability));
1045 }
1046
1047 struct predictor_hash_traits: predictor_hash,
1048   typed_noop_remove <edge_prediction *> {};
1049
1050 /* Return true if edge prediction P is not in DATA hash set.  */
1051
1052 static bool
1053 not_removed_prediction_p (edge_prediction *p, void *data)
1054 {
1055   hash_set<edge_prediction *> *remove = (hash_set<edge_prediction *> *) data;
1056   return !remove->contains (p);
1057 }
1058
1059 /* Prune predictions for a basic block BB.  Currently we do following
1060    clean-up steps:
1061
1062    1) remove duplicate prediction that is guessed with the same probability
1063       (different than 1/2) to both edge
1064    2) remove duplicates for a prediction that belongs with the same probability
1065       to a single edge
1066
1067   */
1068
1069 static void
1070 prune_predictions_for_bb (basic_block bb)
1071 {
1072   edge_prediction **preds = bb_predictions->get (bb);
1073
1074   if (preds)
1075     {
1076       hash_table <predictor_hash_traits> s (13);
1077       hash_set <edge_prediction *> remove;
1078
1079       /* Step 1: identify predictors that should be removed.  */
1080       for (edge_prediction *pred = *preds; pred; pred = pred->ep_next)
1081         {
1082           edge_prediction *existing = s.find (pred);
1083           if (existing)
1084             {
1085               if (pred->ep_edge == existing->ep_edge
1086                   && pred->ep_probability == existing->ep_probability)
1087                 {
1088                   /* Remove a duplicate predictor.  */
1089                   dump_prediction (dump_file, pred->ep_predictor,
1090                                    pred->ep_probability, bb,
1091                                    REASON_SINGLE_EDGE_DUPLICATE, pred->ep_edge);
1092
1093                   remove.add (pred);
1094                 }
1095               else if (pred->ep_edge != existing->ep_edge
1096                        && pred->ep_probability == existing->ep_probability
1097                        && pred->ep_probability != REG_BR_PROB_BASE / 2)
1098                 {
1099                   /* Remove both predictors as they predict the same
1100                      for both edges.  */
1101                   dump_prediction (dump_file, existing->ep_predictor,
1102                                    pred->ep_probability, bb,
1103                                    REASON_EDGE_PAIR_DUPLICATE,
1104                                    existing->ep_edge);
1105                   dump_prediction (dump_file, pred->ep_predictor,
1106                                    pred->ep_probability, bb,
1107                                    REASON_EDGE_PAIR_DUPLICATE,
1108                                    pred->ep_edge);
1109
1110                   remove.add (existing);
1111                   remove.add (pred);
1112                 }
1113             }
1114
1115           edge_prediction **slot2 = s.find_slot (pred, INSERT);
1116           *slot2 = pred;
1117         }
1118
1119       /* Step 2: Remove predictors.  */
1120       filter_predictions (preds, not_removed_prediction_p, &remove);
1121     }
1122 }
1123
1124 /* Combine predictions into single probability and store them into CFG.
1125    Remove now useless prediction entries.
1126    If DRY_RUN is set, only produce dumps and do not modify profile.  */
1127
1128 static void
1129 combine_predictions_for_bb (basic_block bb, bool dry_run)
1130 {
1131   int best_probability = PROB_EVEN;
1132   enum br_predictor best_predictor = END_PREDICTORS;
1133   int combined_probability = REG_BR_PROB_BASE / 2;
1134   int d;
1135   bool first_match = false;
1136   bool found = false;
1137   struct edge_prediction *pred;
1138   int nedges = 0;
1139   edge e, first = NULL, second = NULL;
1140   edge_iterator ei;
1141   int nzero = 0;
1142   int nunknown = 0;
1143
1144   FOR_EACH_EDGE (e, ei, bb->succs)
1145     {
1146       if (!unlikely_executed_edge_p (e))
1147         {
1148           nedges ++;
1149           if (first && !second)
1150             second = e;
1151           if (!first)
1152             first = e;
1153         }
1154       else if (!e->probability.initialized_p ())
1155         e->probability = profile_probability::never ();
1156      if (!e->probability.initialized_p ())
1157         nunknown++;
1158      else if (e->probability == profile_probability::never ())
1159         nzero++;
1160     }
1161
1162   /* When there is no successor or only one choice, prediction is easy.
1163
1164      When we have a basic block with more than 2 successors, the situation
1165      is more complicated as DS theory cannot be used literally.
1166      More precisely, let's assume we predicted edge e1 with probability p1,
1167      thus: m1({b1}) = p1.  As we're going to combine more than 2 edges, we
1168      need to find probability of e.g. m1({b2}), which we don't know.
1169      The only approximation is to equally distribute 1-p1 to all edges
1170      different from b1.
1171
1172      According to numbers we've got from SPEC2006 benchark, there's only
1173      one interesting reliable predictor (noreturn call), which can be
1174      handled with a bit easier approach.  */
1175   if (nedges != 2)
1176     {
1177       hash_set<edge> unlikely_edges (4);
1178
1179       /* Identify all edges that have a probability close to very unlikely.
1180          Doing the approach for very unlikely doesn't worth for doing as
1181          there's no such probability in SPEC2006 benchmark.  */
1182       edge_prediction **preds = bb_predictions->get (bb);
1183       if (preds)
1184         for (pred = *preds; pred; pred = pred->ep_next)
1185           if (pred->ep_probability <= PROB_VERY_UNLIKELY)
1186             unlikely_edges.add (pred->ep_edge);
1187
1188       if (!dry_run)
1189         set_even_probabilities (bb, &unlikely_edges);
1190       clear_bb_predictions (bb);
1191       if (dump_file)
1192         {
1193           fprintf (dump_file, "Predictions for bb %i\n", bb->index);
1194           if (unlikely_edges.elements () == 0)
1195             fprintf (dump_file,
1196                      "%i edges in bb %i predicted to even probabilities\n",
1197                      nedges, bb->index);
1198           else
1199             {
1200               fprintf (dump_file,
1201                        "%i edges in bb %i predicted with some unlikely edges\n",
1202                        nedges, bb->index);
1203               FOR_EACH_EDGE (e, ei, bb->succs)
1204                 if (!unlikely_executed_edge_p (e))
1205                   dump_prediction (dump_file, PRED_COMBINED,
1206                    e->probability.to_reg_br_prob_base (), bb, REASON_NONE, e);
1207             }
1208         }
1209       return;
1210     }
1211
1212   if (dump_file)
1213     fprintf (dump_file, "Predictions for bb %i\n", bb->index);
1214
1215   prune_predictions_for_bb (bb);
1216
1217   edge_prediction **preds = bb_predictions->get (bb);
1218
1219   if (preds)
1220     {
1221       /* We implement "first match" heuristics and use probability guessed
1222          by predictor with smallest index.  */
1223       for (pred = *preds; pred; pred = pred->ep_next)
1224         {
1225           enum br_predictor predictor = pred->ep_predictor;
1226           int probability = pred->ep_probability;
1227
1228           if (pred->ep_edge != first)
1229             probability = REG_BR_PROB_BASE - probability;
1230
1231           found = true;
1232           /* First match heuristics would be widly confused if we predicted
1233              both directions.  */
1234           if (best_predictor > predictor
1235             && predictor_info[predictor].flags & PRED_FLAG_FIRST_MATCH)
1236             {
1237               struct edge_prediction *pred2;
1238               int prob = probability;
1239
1240               for (pred2 = (struct edge_prediction *) *preds;
1241                    pred2; pred2 = pred2->ep_next)
1242                if (pred2 != pred && pred2->ep_predictor == pred->ep_predictor)
1243                  {
1244                    int probability2 = pred2->ep_probability;
1245
1246                    if (pred2->ep_edge != first)
1247                      probability2 = REG_BR_PROB_BASE - probability2;
1248
1249                    if ((probability < REG_BR_PROB_BASE / 2) !=
1250                        (probability2 < REG_BR_PROB_BASE / 2))
1251                      break;
1252
1253                    /* If the same predictor later gave better result, go for it! */
1254                    if ((probability >= REG_BR_PROB_BASE / 2 && (probability2 > probability))
1255                        || (probability <= REG_BR_PROB_BASE / 2 && (probability2 < probability)))
1256                      prob = probability2;
1257                  }
1258               if (!pred2)
1259                 best_probability = prob, best_predictor = predictor;
1260             }
1261
1262           d = (combined_probability * probability
1263                + (REG_BR_PROB_BASE - combined_probability)
1264                * (REG_BR_PROB_BASE - probability));
1265
1266           /* Use FP math to avoid overflows of 32bit integers.  */
1267           if (d == 0)
1268             /* If one probability is 0% and one 100%, avoid division by zero.  */
1269             combined_probability = REG_BR_PROB_BASE / 2;
1270           else
1271             combined_probability = (((double) combined_probability)
1272                                     * probability
1273                                     * REG_BR_PROB_BASE / d + 0.5);
1274         }
1275     }
1276
1277   /* Decide which heuristic to use.  In case we didn't match anything,
1278      use no_prediction heuristic, in case we did match, use either
1279      first match or Dempster-Shaffer theory depending on the flags.  */
1280
1281   if (best_predictor != END_PREDICTORS)
1282     first_match = true;
1283
1284   if (!found)
1285     dump_prediction (dump_file, PRED_NO_PREDICTION, combined_probability, bb);
1286   else
1287     {
1288       if (!first_match)
1289         dump_prediction (dump_file, PRED_DS_THEORY, combined_probability, bb,
1290                          !first_match ? REASON_NONE : REASON_IGNORED);
1291       else
1292         dump_prediction (dump_file, PRED_FIRST_MATCH, best_probability, bb,
1293                          first_match ? REASON_NONE : REASON_IGNORED);
1294     }
1295
1296   if (first_match)
1297     combined_probability = best_probability;
1298   dump_prediction (dump_file, PRED_COMBINED, combined_probability, bb);
1299
1300   if (preds)
1301     {
1302       for (pred = (struct edge_prediction *) *preds; pred; pred = pred->ep_next)
1303         {
1304           enum br_predictor predictor = pred->ep_predictor;
1305           int probability = pred->ep_probability;
1306
1307           dump_prediction (dump_file, predictor, probability, bb,
1308                            (!first_match || best_predictor == predictor)
1309                            ? REASON_NONE : REASON_IGNORED, pred->ep_edge);
1310         }
1311     }
1312   clear_bb_predictions (bb);
1313
1314
1315   /* If we have only one successor which is unknown, we can compute missing
1316      probablity.  */
1317   if (nunknown == 1)
1318     {
1319       profile_probability prob = profile_probability::always ();
1320       edge missing = NULL;
1321
1322       FOR_EACH_EDGE (e, ei, bb->succs)
1323         if (e->probability.initialized_p ())
1324           prob -= e->probability;
1325         else if (missing == NULL)
1326           missing = e;
1327         else
1328           gcc_unreachable ();
1329        missing->probability = prob;
1330     }
1331   /* If nothing is unknown, we have nothing to update.  */
1332   else if (!nunknown && nzero != (int)EDGE_COUNT (bb->succs))
1333     ;
1334   else if (!dry_run)
1335     {
1336       first->probability
1337          = profile_probability::from_reg_br_prob_base (combined_probability);
1338       second->probability = first->probability.invert ();
1339     }
1340 }
1341
1342 /* Check if T1 and T2 satisfy the IV_COMPARE condition.
1343    Return the SSA_NAME if the condition satisfies, NULL otherwise.
1344
1345    T1 and T2 should be one of the following cases:
1346      1. T1 is SSA_NAME, T2 is NULL
1347      2. T1 is SSA_NAME, T2 is INTEGER_CST between [-4, 4]
1348      3. T2 is SSA_NAME, T1 is INTEGER_CST between [-4, 4]  */
1349
1350 static tree
1351 strips_small_constant (tree t1, tree t2)
1352 {
1353   tree ret = NULL;
1354   int value = 0;
1355
1356   if (!t1)
1357     return NULL;
1358   else if (TREE_CODE (t1) == SSA_NAME)
1359     ret = t1;
1360   else if (tree_fits_shwi_p (t1))
1361     value = tree_to_shwi (t1);
1362   else
1363     return NULL;
1364
1365   if (!t2)
1366     return ret;
1367   else if (tree_fits_shwi_p (t2))
1368     value = tree_to_shwi (t2);
1369   else if (TREE_CODE (t2) == SSA_NAME)
1370     {
1371       if (ret)
1372         return NULL;
1373       else
1374         ret = t2;
1375     }
1376
1377   if (value <= 4 && value >= -4)
1378     return ret;
1379   else
1380     return NULL;
1381 }
1382
1383 /* Return the SSA_NAME in T or T's operands.
1384    Return NULL if SSA_NAME cannot be found.  */
1385
1386 static tree
1387 get_base_value (tree t)
1388 {
1389   if (TREE_CODE (t) == SSA_NAME)
1390     return t;
1391
1392   if (!BINARY_CLASS_P (t))
1393     return NULL;
1394
1395   switch (TREE_OPERAND_LENGTH (t))
1396     {
1397     case 1:
1398       return strips_small_constant (TREE_OPERAND (t, 0), NULL);
1399     case 2:
1400       return strips_small_constant (TREE_OPERAND (t, 0),
1401                                     TREE_OPERAND (t, 1));
1402     default:
1403       return NULL;
1404     }
1405 }
1406
1407 /* Check the compare STMT in LOOP. If it compares an induction
1408    variable to a loop invariant, return true, and save
1409    LOOP_INVARIANT, COMPARE_CODE and LOOP_STEP.
1410    Otherwise return false and set LOOP_INVAIANT to NULL.  */
1411
1412 static bool
1413 is_comparison_with_loop_invariant_p (gcond *stmt, struct loop *loop,
1414                                      tree *loop_invariant,
1415                                      enum tree_code *compare_code,
1416                                      tree *loop_step,
1417                                      tree *loop_iv_base)
1418 {
1419   tree op0, op1, bound, base;
1420   affine_iv iv0, iv1;
1421   enum tree_code code;
1422   tree step;
1423
1424   code = gimple_cond_code (stmt);
1425   *loop_invariant = NULL;
1426
1427   switch (code)
1428     {
1429     case GT_EXPR:
1430     case GE_EXPR:
1431     case NE_EXPR:
1432     case LT_EXPR:
1433     case LE_EXPR:
1434     case EQ_EXPR:
1435       break;
1436
1437     default:
1438       return false;
1439     }
1440
1441   op0 = gimple_cond_lhs (stmt);
1442   op1 = gimple_cond_rhs (stmt);
1443
1444   if ((TREE_CODE (op0) != SSA_NAME && TREE_CODE (op0) != INTEGER_CST)
1445        || (TREE_CODE (op1) != SSA_NAME && TREE_CODE (op1) != INTEGER_CST))
1446     return false;
1447   if (!simple_iv (loop, loop_containing_stmt (stmt), op0, &iv0, true))
1448     return false;
1449   if (!simple_iv (loop, loop_containing_stmt (stmt), op1, &iv1, true))
1450     return false;
1451   if (TREE_CODE (iv0.step) != INTEGER_CST
1452       || TREE_CODE (iv1.step) != INTEGER_CST)
1453     return false;
1454   if ((integer_zerop (iv0.step) && integer_zerop (iv1.step))
1455       || (!integer_zerop (iv0.step) && !integer_zerop (iv1.step)))
1456     return false;
1457
1458   if (integer_zerop (iv0.step))
1459     {
1460       if (code != NE_EXPR && code != EQ_EXPR)
1461         code = invert_tree_comparison (code, false);
1462       bound = iv0.base;
1463       base = iv1.base;
1464       if (tree_fits_shwi_p (iv1.step))
1465         step = iv1.step;
1466       else
1467         return false;
1468     }
1469   else
1470     {
1471       bound = iv1.base;
1472       base = iv0.base;
1473       if (tree_fits_shwi_p (iv0.step))
1474         step = iv0.step;
1475       else
1476         return false;
1477     }
1478
1479   if (TREE_CODE (bound) != INTEGER_CST)
1480     bound = get_base_value (bound);
1481   if (!bound)
1482     return false;
1483   if (TREE_CODE (base) != INTEGER_CST)
1484     base = get_base_value (base);
1485   if (!base)
1486     return false;
1487
1488   *loop_invariant = bound;
1489   *compare_code = code;
1490   *loop_step = step;
1491   *loop_iv_base = base;
1492   return true;
1493 }
1494
1495 /* Compare two SSA_NAMEs: returns TRUE if T1 and T2 are value coherent.  */
1496
1497 static bool
1498 expr_coherent_p (tree t1, tree t2)
1499 {
1500   gimple *stmt;
1501   tree ssa_name_1 = NULL;
1502   tree ssa_name_2 = NULL;
1503
1504   gcc_assert (TREE_CODE (t1) == SSA_NAME || TREE_CODE (t1) == INTEGER_CST);
1505   gcc_assert (TREE_CODE (t2) == SSA_NAME || TREE_CODE (t2) == INTEGER_CST);
1506
1507   if (t1 == t2)
1508     return true;
1509
1510   if (TREE_CODE (t1) == INTEGER_CST && TREE_CODE (t2) == INTEGER_CST)
1511     return true;
1512   if (TREE_CODE (t1) == INTEGER_CST || TREE_CODE (t2) == INTEGER_CST)
1513     return false;
1514
1515   /* Check to see if t1 is expressed/defined with t2.  */
1516   stmt = SSA_NAME_DEF_STMT (t1);
1517   gcc_assert (stmt != NULL);
1518   if (is_gimple_assign (stmt))
1519     {
1520       ssa_name_1 = SINGLE_SSA_TREE_OPERAND (stmt, SSA_OP_USE);
1521       if (ssa_name_1 && ssa_name_1 == t2)
1522         return true;
1523     }
1524
1525   /* Check to see if t2 is expressed/defined with t1.  */
1526   stmt = SSA_NAME_DEF_STMT (t2);
1527   gcc_assert (stmt != NULL);
1528   if (is_gimple_assign (stmt))
1529     {
1530       ssa_name_2 = SINGLE_SSA_TREE_OPERAND (stmt, SSA_OP_USE);
1531       if (ssa_name_2 && ssa_name_2 == t1)
1532         return true;
1533     }
1534
1535   /* Compare if t1 and t2's def_stmts are identical.  */
1536   if (ssa_name_2 != NULL && ssa_name_1 == ssa_name_2)
1537     return true;
1538   else
1539     return false;
1540 }
1541
1542 /* Return true if E is predicted by one of loop heuristics.  */
1543
1544 static bool
1545 predicted_by_loop_heuristics_p (basic_block bb)
1546 {
1547   struct edge_prediction *i;
1548   edge_prediction **preds = bb_predictions->get (bb);
1549
1550   if (!preds)
1551     return false;
1552
1553   for (i = *preds; i; i = i->ep_next)
1554     if (i->ep_predictor == PRED_LOOP_ITERATIONS_GUESSED
1555         || i->ep_predictor == PRED_LOOP_ITERATIONS_MAX
1556         || i->ep_predictor == PRED_LOOP_ITERATIONS
1557         || i->ep_predictor == PRED_LOOP_EXIT
1558         || i->ep_predictor == PRED_LOOP_EXIT_WITH_RECURSION
1559         || i->ep_predictor == PRED_LOOP_EXTRA_EXIT)
1560       return true;
1561   return false;
1562 }
1563
1564 /* Predict branch probability of BB when BB contains a branch that compares
1565    an induction variable in LOOP with LOOP_IV_BASE_VAR to LOOP_BOUND_VAR. The
1566    loop exit is compared using LOOP_BOUND_CODE, with step of LOOP_BOUND_STEP.
1567
1568    E.g.
1569      for (int i = 0; i < bound; i++) {
1570        if (i < bound - 2)
1571          computation_1();
1572        else
1573          computation_2();
1574      }
1575
1576   In this loop, we will predict the branch inside the loop to be taken.  */
1577
1578 static void
1579 predict_iv_comparison (struct loop *loop, basic_block bb,
1580                        tree loop_bound_var,
1581                        tree loop_iv_base_var,
1582                        enum tree_code loop_bound_code,
1583                        int loop_bound_step)
1584 {
1585   gimple *stmt;
1586   tree compare_var, compare_base;
1587   enum tree_code compare_code;
1588   tree compare_step_var;
1589   edge then_edge;
1590   edge_iterator ei;
1591
1592   if (predicted_by_loop_heuristics_p (bb))
1593     return;
1594
1595   stmt = last_stmt (bb);
1596   if (!stmt || gimple_code (stmt) != GIMPLE_COND)
1597     return;
1598   if (!is_comparison_with_loop_invariant_p (as_a <gcond *> (stmt),
1599                                             loop, &compare_var,
1600                                             &compare_code,
1601                                             &compare_step_var,
1602                                             &compare_base))
1603     return;
1604
1605   /* Find the taken edge.  */
1606   FOR_EACH_EDGE (then_edge, ei, bb->succs)
1607     if (then_edge->flags & EDGE_TRUE_VALUE)
1608       break;
1609
1610   /* When comparing an IV to a loop invariant, NE is more likely to be
1611      taken while EQ is more likely to be not-taken.  */
1612   if (compare_code == NE_EXPR)
1613     {
1614       predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, TAKEN);
1615       return;
1616     }
1617   else if (compare_code == EQ_EXPR)
1618     {
1619       predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, NOT_TAKEN);
1620       return;
1621     }
1622
1623   if (!expr_coherent_p (loop_iv_base_var, compare_base))
1624     return;
1625
1626   /* If loop bound, base and compare bound are all constants, we can
1627      calculate the probability directly.  */
1628   if (tree_fits_shwi_p (loop_bound_var)
1629       && tree_fits_shwi_p (compare_var)
1630       && tree_fits_shwi_p (compare_base))
1631     {
1632       int probability;
1633       wi::overflow_type overflow;
1634       bool overall_overflow = false;
1635       widest_int compare_count, tem;
1636
1637       /* (loop_bound - base) / compare_step */
1638       tem = wi::sub (wi::to_widest (loop_bound_var),
1639                      wi::to_widest (compare_base), SIGNED, &overflow);
1640       overall_overflow |= overflow;
1641       widest_int loop_count = wi::div_trunc (tem,
1642                                              wi::to_widest (compare_step_var),
1643                                              SIGNED, &overflow);
1644       overall_overflow |= overflow;
1645
1646       if (!wi::neg_p (wi::to_widest (compare_step_var))
1647           ^ (compare_code == LT_EXPR || compare_code == LE_EXPR))
1648         {
1649           /* (loop_bound - compare_bound) / compare_step */
1650           tem = wi::sub (wi::to_widest (loop_bound_var),
1651                          wi::to_widest (compare_var), SIGNED, &overflow);
1652           overall_overflow |= overflow;
1653           compare_count = wi::div_trunc (tem, wi::to_widest (compare_step_var),
1654                                          SIGNED, &overflow);
1655           overall_overflow |= overflow;
1656         }
1657       else
1658         {
1659           /* (compare_bound - base) / compare_step */
1660           tem = wi::sub (wi::to_widest (compare_var),
1661                          wi::to_widest (compare_base), SIGNED, &overflow);
1662           overall_overflow |= overflow;
1663           compare_count = wi::div_trunc (tem, wi::to_widest (compare_step_var),
1664                                          SIGNED, &overflow);
1665           overall_overflow |= overflow;
1666         }
1667       if (compare_code == LE_EXPR || compare_code == GE_EXPR)
1668         ++compare_count;
1669       if (loop_bound_code == LE_EXPR || loop_bound_code == GE_EXPR)
1670         ++loop_count;
1671       if (wi::neg_p (compare_count))
1672         compare_count = 0;
1673       if (wi::neg_p (loop_count))
1674         loop_count = 0;
1675       if (loop_count == 0)
1676         probability = 0;
1677       else if (wi::cmps (compare_count, loop_count) == 1)
1678         probability = REG_BR_PROB_BASE;
1679       else
1680         {
1681           tem = compare_count * REG_BR_PROB_BASE;
1682           tem = wi::udiv_trunc (tem, loop_count);
1683           probability = tem.to_uhwi ();
1684         }
1685
1686       /* FIXME: The branch prediction seems broken. It has only 20% hitrate.  */
1687       if (!overall_overflow)
1688         predict_edge (then_edge, PRED_LOOP_IV_COMPARE, probability);
1689
1690       return;
1691     }
1692
1693   if (expr_coherent_p (loop_bound_var, compare_var))
1694     {
1695       if ((loop_bound_code == LT_EXPR || loop_bound_code == LE_EXPR)
1696           && (compare_code == LT_EXPR || compare_code == LE_EXPR))
1697         predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, TAKEN);
1698       else if ((loop_bound_code == GT_EXPR || loop_bound_code == GE_EXPR)
1699                && (compare_code == GT_EXPR || compare_code == GE_EXPR))
1700         predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, TAKEN);
1701       else if (loop_bound_code == NE_EXPR)
1702         {
1703           /* If the loop backedge condition is "(i != bound)", we do
1704              the comparison based on the step of IV:
1705              * step < 0 : backedge condition is like (i > bound)
1706              * step > 0 : backedge condition is like (i < bound)  */
1707           gcc_assert (loop_bound_step != 0);
1708           if (loop_bound_step > 0
1709               && (compare_code == LT_EXPR
1710                   || compare_code == LE_EXPR))
1711             predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, TAKEN);
1712           else if (loop_bound_step < 0
1713                    && (compare_code == GT_EXPR
1714                        || compare_code == GE_EXPR))
1715             predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, TAKEN);
1716           else
1717             predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, NOT_TAKEN);
1718         }
1719       else
1720         /* The branch is predicted not-taken if loop_bound_code is
1721            opposite with compare_code.  */
1722         predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, NOT_TAKEN);
1723     }
1724   else if (expr_coherent_p (loop_iv_base_var, compare_var))
1725     {
1726       /* For cases like:
1727            for (i = s; i < h; i++)
1728              if (i > s + 2) ....
1729          The branch should be predicted taken.  */
1730       if (loop_bound_step > 0
1731           && (compare_code == GT_EXPR || compare_code == GE_EXPR))
1732         predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, TAKEN);
1733       else if (loop_bound_step < 0
1734                && (compare_code == LT_EXPR || compare_code == LE_EXPR))
1735         predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, TAKEN);
1736       else
1737         predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, NOT_TAKEN);
1738     }
1739 }
1740
1741 /* Predict for extra loop exits that will lead to EXIT_EDGE. The extra loop
1742    exits are resulted from short-circuit conditions that will generate an
1743    if_tmp. E.g.:
1744
1745    if (foo() || global > 10)
1746      break;
1747
1748    This will be translated into:
1749
1750    BB3:
1751      loop header...
1752    BB4:
1753      if foo() goto BB6 else goto BB5
1754    BB5:
1755      if global > 10 goto BB6 else goto BB7
1756    BB6:
1757      goto BB7
1758    BB7:
1759      iftmp = (PHI 0(BB5), 1(BB6))
1760      if iftmp == 1 goto BB8 else goto BB3
1761    BB8:
1762      outside of the loop...
1763
1764    The edge BB7->BB8 is loop exit because BB8 is outside of the loop.
1765    From the dataflow, we can infer that BB4->BB6 and BB5->BB6 are also loop
1766    exits. This function takes BB7->BB8 as input, and finds out the extra loop
1767    exits to predict them using PRED_LOOP_EXTRA_EXIT.  */
1768
1769 static void
1770 predict_extra_loop_exits (edge exit_edge)
1771 {
1772   unsigned i;
1773   bool check_value_one;
1774   gimple *lhs_def_stmt;
1775   gphi *phi_stmt;
1776   tree cmp_rhs, cmp_lhs;
1777   gimple *last;
1778   gcond *cmp_stmt;
1779
1780   last = last_stmt (exit_edge->src);
1781   if (!last)
1782     return;
1783   cmp_stmt = dyn_cast <gcond *> (last);
1784   if (!cmp_stmt)
1785     return;
1786
1787   cmp_rhs = gimple_cond_rhs (cmp_stmt);
1788   cmp_lhs = gimple_cond_lhs (cmp_stmt);
1789   if (!TREE_CONSTANT (cmp_rhs)
1790       || !(integer_zerop (cmp_rhs) || integer_onep (cmp_rhs)))
1791     return;
1792   if (TREE_CODE (cmp_lhs) != SSA_NAME)
1793     return;
1794
1795   /* If check_value_one is true, only the phi_args with value '1' will lead
1796      to loop exit. Otherwise, only the phi_args with value '0' will lead to
1797      loop exit.  */
1798   check_value_one = (((integer_onep (cmp_rhs))
1799                     ^ (gimple_cond_code (cmp_stmt) == EQ_EXPR))
1800                     ^ ((exit_edge->flags & EDGE_TRUE_VALUE) != 0));
1801
1802   lhs_def_stmt = SSA_NAME_DEF_STMT (cmp_lhs);
1803   if (!lhs_def_stmt)
1804     return;
1805
1806   phi_stmt = dyn_cast <gphi *> (lhs_def_stmt);
1807   if (!phi_stmt)
1808     return;
1809
1810   for (i = 0; i < gimple_phi_num_args (phi_stmt); i++)
1811     {
1812       edge e1;
1813       edge_iterator ei;
1814       tree val = gimple_phi_arg_def (phi_stmt, i);
1815       edge e = gimple_phi_arg_edge (phi_stmt, i);
1816
1817       if (!TREE_CONSTANT (val) || !(integer_zerop (val) || integer_onep (val)))
1818         continue;
1819       if ((check_value_one ^ integer_onep (val)) == 1)
1820         continue;
1821       if (EDGE_COUNT (e->src->succs) != 1)
1822         {
1823           predict_paths_leading_to_edge (e, PRED_LOOP_EXTRA_EXIT, NOT_TAKEN);
1824           continue;
1825         }
1826
1827       FOR_EACH_EDGE (e1, ei, e->src->preds)
1828         predict_paths_leading_to_edge (e1, PRED_LOOP_EXTRA_EXIT, NOT_TAKEN);
1829     }
1830 }
1831
1832
1833 /* Predict edge probabilities by exploiting loop structure.  */
1834
1835 static void
1836 predict_loops (void)
1837 {
1838   struct loop *loop;
1839   basic_block bb;
1840   hash_set <struct loop *> with_recursion(10);
1841
1842   FOR_EACH_BB_FN (bb, cfun)
1843     {
1844       gimple_stmt_iterator gsi;
1845       tree decl;
1846
1847       for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
1848         if (is_gimple_call (gsi_stmt (gsi))
1849             && (decl = gimple_call_fndecl (gsi_stmt (gsi))) != NULL
1850             && recursive_call_p (current_function_decl, decl))
1851           {
1852             loop = bb->loop_father;
1853             while (loop && !with_recursion.add (loop))
1854               loop = loop_outer (loop);
1855           }
1856     }
1857
1858   /* Try to predict out blocks in a loop that are not part of a
1859      natural loop.  */
1860   FOR_EACH_LOOP (loop, LI_FROM_INNERMOST)
1861     {
1862       basic_block bb, *bbs;
1863       unsigned j, n_exits = 0;
1864       vec<edge> exits;
1865       struct tree_niter_desc niter_desc;
1866       edge ex;
1867       struct nb_iter_bound *nb_iter;
1868       enum tree_code loop_bound_code = ERROR_MARK;
1869       tree loop_bound_step = NULL;
1870       tree loop_bound_var = NULL;
1871       tree loop_iv_base = NULL;
1872       gcond *stmt = NULL;
1873       bool recursion = with_recursion.contains (loop);
1874
1875       exits = get_loop_exit_edges (loop);
1876       FOR_EACH_VEC_ELT (exits, j, ex)
1877         if (!unlikely_executed_edge_p (ex) && !(ex->flags & EDGE_ABNORMAL_CALL))
1878           n_exits ++;
1879       if (!n_exits)
1880         {
1881           exits.release ();
1882           continue;
1883         }
1884
1885       if (dump_file && (dump_flags & TDF_DETAILS))
1886         fprintf (dump_file, "Predicting loop %i%s with %i exits.\n",
1887                  loop->num, recursion ? " (with recursion)":"", n_exits);
1888       if (dump_file && (dump_flags & TDF_DETAILS)
1889           && max_loop_iterations_int (loop) >= 0)
1890         {
1891           fprintf (dump_file,
1892                    "Loop %d iterates at most %i times.\n", loop->num,
1893                    (int)max_loop_iterations_int (loop));
1894         }
1895       if (dump_file && (dump_flags & TDF_DETAILS)
1896           && likely_max_loop_iterations_int (loop) >= 0)
1897         {
1898           fprintf (dump_file, "Loop %d likely iterates at most %i times.\n",
1899                    loop->num, (int)likely_max_loop_iterations_int (loop));
1900         }
1901
1902       FOR_EACH_VEC_ELT (exits, j, ex)
1903         {
1904           tree niter = NULL;
1905           HOST_WIDE_INT nitercst;
1906           int max = PARAM_VALUE (PARAM_MAX_PREDICTED_ITERATIONS);
1907           int probability;
1908           enum br_predictor predictor;
1909           widest_int nit;
1910
1911           if (unlikely_executed_edge_p (ex)
1912               || (ex->flags & EDGE_ABNORMAL_CALL))
1913             continue;
1914           /* Loop heuristics do not expect exit conditional to be inside
1915              inner loop.  We predict from innermost to outermost loop.  */
1916           if (predicted_by_loop_heuristics_p (ex->src))
1917             {
1918               if (dump_file && (dump_flags & TDF_DETAILS))
1919                 fprintf (dump_file, "Skipping exit %i->%i because "
1920                          "it is already predicted.\n",
1921                          ex->src->index, ex->dest->index);
1922               continue;
1923             }
1924           predict_extra_loop_exits (ex);
1925
1926           if (number_of_iterations_exit (loop, ex, &niter_desc, false, false))
1927             niter = niter_desc.niter;
1928           if (!niter || TREE_CODE (niter_desc.niter) != INTEGER_CST)
1929             niter = loop_niter_by_eval (loop, ex);
1930           if (dump_file && (dump_flags & TDF_DETAILS)
1931               && TREE_CODE (niter) == INTEGER_CST)
1932             {
1933               fprintf (dump_file, "Exit %i->%i %d iterates ",
1934                        ex->src->index, ex->dest->index,
1935                        loop->num);
1936               print_generic_expr (dump_file, niter, TDF_SLIM);
1937               fprintf (dump_file, " times.\n");
1938             }
1939
1940           if (TREE_CODE (niter) == INTEGER_CST)
1941             {
1942               if (tree_fits_uhwi_p (niter)
1943                   && max
1944                   && compare_tree_int (niter, max - 1) == -1)
1945                 nitercst = tree_to_uhwi (niter) + 1;
1946               else
1947                 nitercst = max;
1948               predictor = PRED_LOOP_ITERATIONS;
1949             }
1950           /* If we have just one exit and we can derive some information about
1951              the number of iterations of the loop from the statements inside
1952              the loop, use it to predict this exit.  */
1953           else if (n_exits == 1
1954                    && estimated_stmt_executions (loop, &nit))
1955             {
1956               if (wi::gtu_p (nit, max))
1957                 nitercst = max;
1958               else
1959                 nitercst = nit.to_shwi ();
1960               predictor = PRED_LOOP_ITERATIONS_GUESSED;
1961             }
1962           /* If we have likely upper bound, trust it for very small iteration
1963              counts.  Such loops would otherwise get mispredicted by standard
1964              LOOP_EXIT heuristics.  */
1965           else if (n_exits == 1
1966                    && likely_max_stmt_executions (loop, &nit)
1967                    && wi::ltu_p (nit,
1968                                  RDIV (REG_BR_PROB_BASE,
1969                                        REG_BR_PROB_BASE
1970                                          - predictor_info
1971                                                  [recursion
1972                                                   ? PRED_LOOP_EXIT_WITH_RECURSION
1973                                                   : PRED_LOOP_EXIT].hitrate)))
1974             {
1975               nitercst = nit.to_shwi ();
1976               predictor = PRED_LOOP_ITERATIONS_MAX;
1977             }
1978           else
1979             {
1980               if (dump_file && (dump_flags & TDF_DETAILS))
1981                 fprintf (dump_file, "Nothing known about exit %i->%i.\n",
1982                          ex->src->index, ex->dest->index);
1983               continue;
1984             }
1985
1986           if (dump_file && (dump_flags & TDF_DETAILS))
1987             fprintf (dump_file, "Recording prediction to %i iterations by %s.\n",
1988                      (int)nitercst, predictor_info[predictor].name);
1989           /* If the prediction for number of iterations is zero, do not
1990              predict the exit edges.  */
1991           if (nitercst == 0)
1992             continue;
1993
1994           probability = RDIV (REG_BR_PROB_BASE, nitercst);
1995           predict_edge (ex, predictor, probability);
1996         }
1997       exits.release ();
1998
1999       /* Find information about loop bound variables.  */
2000       for (nb_iter = loop->bounds; nb_iter;
2001            nb_iter = nb_iter->next)
2002         if (nb_iter->stmt
2003             && gimple_code (nb_iter->stmt) == GIMPLE_COND)
2004           {
2005             stmt = as_a <gcond *> (nb_iter->stmt);
2006             break;
2007           }
2008       if (!stmt && last_stmt (loop->header)
2009           && gimple_code (last_stmt (loop->header)) == GIMPLE_COND)
2010         stmt = as_a <gcond *> (last_stmt (loop->header));
2011       if (stmt)
2012         is_comparison_with_loop_invariant_p (stmt, loop,
2013                                              &loop_bound_var,
2014                                              &loop_bound_code,
2015                                              &loop_bound_step,
2016                                              &loop_iv_base);
2017
2018       bbs = get_loop_body (loop);
2019
2020       for (j = 0; j < loop->num_nodes; j++)
2021         {
2022           edge e;
2023           edge_iterator ei;
2024
2025           bb = bbs[j];
2026
2027           /* Bypass loop heuristics on continue statement.  These
2028              statements construct loops via "non-loop" constructs
2029              in the source language and are better to be handled
2030              separately.  */
2031           if (predicted_by_p (bb, PRED_CONTINUE))
2032             {
2033               if (dump_file && (dump_flags & TDF_DETAILS))
2034                 fprintf (dump_file, "BB %i predicted by continue.\n",
2035                          bb->index);
2036               continue;
2037             }
2038
2039           /* If we already used more reliable loop exit predictors, do not
2040              bother with PRED_LOOP_EXIT.  */
2041           if (!predicted_by_loop_heuristics_p (bb))
2042             {
2043               /* For loop with many exits we don't want to predict all exits
2044                  with the pretty large probability, because if all exits are
2045                  considered in row, the loop would be predicted to iterate
2046                  almost never.  The code to divide probability by number of
2047                  exits is very rough.  It should compute the number of exits
2048                  taken in each patch through function (not the overall number
2049                  of exits that might be a lot higher for loops with wide switch
2050                  statements in them) and compute n-th square root.
2051
2052                  We limit the minimal probability by 2% to avoid
2053                  EDGE_PROBABILITY_RELIABLE from trusting the branch prediction
2054                  as this was causing regression in perl benchmark containing such
2055                  a wide loop.  */
2056
2057               int probability = ((REG_BR_PROB_BASE
2058                                   - predictor_info
2059                                      [recursion
2060                                       ? PRED_LOOP_EXIT_WITH_RECURSION
2061                                       : PRED_LOOP_EXIT].hitrate)
2062                                  / n_exits);
2063               if (probability < HITRATE (2))
2064                 probability = HITRATE (2);
2065               FOR_EACH_EDGE (e, ei, bb->succs)
2066                 if (e->dest->index < NUM_FIXED_BLOCKS
2067                     || !flow_bb_inside_loop_p (loop, e->dest))
2068                   {
2069                     if (dump_file && (dump_flags & TDF_DETAILS))
2070                       fprintf (dump_file,
2071                                "Predicting exit %i->%i with prob %i.\n",
2072                                e->src->index, e->dest->index, probability);
2073                     predict_edge (e,
2074                                   recursion ? PRED_LOOP_EXIT_WITH_RECURSION
2075                                   : PRED_LOOP_EXIT, probability);
2076                   }
2077             }
2078           if (loop_bound_var)
2079             predict_iv_comparison (loop, bb, loop_bound_var, loop_iv_base,
2080                                    loop_bound_code,
2081                                    tree_to_shwi (loop_bound_step));
2082         }
2083
2084       /* In the following code
2085          for (loop1)
2086            if (cond)
2087              for (loop2)
2088                body;
2089          guess that cond is unlikely.  */
2090       if (loop_outer (loop)->num)
2091         {
2092           basic_block bb = NULL;
2093           edge preheader_edge = loop_preheader_edge (loop);
2094
2095           if (single_pred_p (preheader_edge->src)
2096               && single_succ_p (preheader_edge->src))
2097             preheader_edge = single_pred_edge (preheader_edge->src);
2098
2099           gimple *stmt = last_stmt (preheader_edge->src);
2100           /* Pattern match fortran loop preheader:
2101              _16 = BUILTIN_EXPECT (_15, 1, PRED_FORTRAN_LOOP_PREHEADER);
2102              _17 = (logical(kind=4)) _16;
2103              if (_17 != 0)
2104                goto <bb 11>;
2105              else
2106                goto <bb 13>;
2107
2108              Loop guard branch prediction says nothing about duplicated loop
2109              headers produced by fortran frontend and in this case we want
2110              to predict paths leading to this preheader.  */
2111
2112           if (stmt
2113               && gimple_code (stmt) == GIMPLE_COND
2114               && gimple_cond_code (stmt) == NE_EXPR
2115               && TREE_CODE (gimple_cond_lhs (stmt)) == SSA_NAME
2116               && integer_zerop (gimple_cond_rhs (stmt)))
2117              {
2118                gimple *call_stmt = SSA_NAME_DEF_STMT (gimple_cond_lhs (stmt));
2119                if (gimple_code (call_stmt) == GIMPLE_ASSIGN
2120                    && gimple_expr_code (call_stmt) == NOP_EXPR
2121                    && TREE_CODE (gimple_assign_rhs1 (call_stmt)) == SSA_NAME)
2122                  call_stmt = SSA_NAME_DEF_STMT (gimple_assign_rhs1 (call_stmt));
2123                if (gimple_call_internal_p (call_stmt, IFN_BUILTIN_EXPECT)
2124                    && TREE_CODE (gimple_call_arg (call_stmt, 2)) == INTEGER_CST
2125                    && tree_fits_uhwi_p (gimple_call_arg (call_stmt, 2))
2126                    && tree_to_uhwi (gimple_call_arg (call_stmt, 2))
2127                         == PRED_FORTRAN_LOOP_PREHEADER)
2128                  bb = preheader_edge->src;
2129              }
2130           if (!bb)
2131             {
2132               if (!dominated_by_p (CDI_DOMINATORS,
2133                                    loop_outer (loop)->latch, loop->header))
2134                 predict_paths_leading_to_edge (loop_preheader_edge (loop),
2135                                                recursion
2136                                                ? PRED_LOOP_GUARD_WITH_RECURSION
2137                                                : PRED_LOOP_GUARD,
2138                                                NOT_TAKEN,
2139                                                loop_outer (loop));
2140             }
2141           else
2142             {
2143               if (!dominated_by_p (CDI_DOMINATORS,
2144                                    loop_outer (loop)->latch, bb))
2145                 predict_paths_leading_to (bb,
2146                                           recursion
2147                                           ? PRED_LOOP_GUARD_WITH_RECURSION
2148                                           : PRED_LOOP_GUARD,
2149                                           NOT_TAKEN,
2150                                           loop_outer (loop));
2151             }
2152         }
2153
2154       /* Free basic blocks from get_loop_body.  */
2155       free (bbs);
2156     }
2157 }
2158
2159 /* Attempt to predict probabilities of BB outgoing edges using local
2160    properties.  */
2161 static void
2162 bb_estimate_probability_locally (basic_block bb)
2163 {
2164   rtx_insn *last_insn = BB_END (bb);
2165   rtx cond;
2166
2167   if (! can_predict_insn_p (last_insn))
2168     return;
2169   cond = get_condition (last_insn, NULL, false, false);
2170   if (! cond)
2171     return;
2172
2173   /* Try "pointer heuristic."
2174      A comparison ptr == 0 is predicted as false.
2175      Similarly, a comparison ptr1 == ptr2 is predicted as false.  */
2176   if (COMPARISON_P (cond)
2177       && ((REG_P (XEXP (cond, 0)) && REG_POINTER (XEXP (cond, 0)))
2178           || (REG_P (XEXP (cond, 1)) && REG_POINTER (XEXP (cond, 1)))))
2179     {
2180       if (GET_CODE (cond) == EQ)
2181         predict_insn_def (last_insn, PRED_POINTER, NOT_TAKEN);
2182       else if (GET_CODE (cond) == NE)
2183         predict_insn_def (last_insn, PRED_POINTER, TAKEN);
2184     }
2185   else
2186
2187   /* Try "opcode heuristic."
2188      EQ tests are usually false and NE tests are usually true. Also,
2189      most quantities are positive, so we can make the appropriate guesses
2190      about signed comparisons against zero.  */
2191     switch (GET_CODE (cond))
2192       {
2193       case CONST_INT:
2194         /* Unconditional branch.  */
2195         predict_insn_def (last_insn, PRED_UNCONDITIONAL,
2196                           cond == const0_rtx ? NOT_TAKEN : TAKEN);
2197         break;
2198
2199       case EQ:
2200       case UNEQ:
2201         /* Floating point comparisons appears to behave in a very
2202            unpredictable way because of special role of = tests in
2203            FP code.  */
2204         if (FLOAT_MODE_P (GET_MODE (XEXP (cond, 0))))
2205           ;
2206         /* Comparisons with 0 are often used for booleans and there is
2207            nothing useful to predict about them.  */
2208         else if (XEXP (cond, 1) == const0_rtx
2209                  || XEXP (cond, 0) == const0_rtx)
2210           ;
2211         else
2212           predict_insn_def (last_insn, PRED_OPCODE_NONEQUAL, NOT_TAKEN);
2213         break;
2214
2215       case NE:
2216       case LTGT:
2217         /* Floating point comparisons appears to behave in a very
2218            unpredictable way because of special role of = tests in
2219            FP code.  */
2220         if (FLOAT_MODE_P (GET_MODE (XEXP (cond, 0))))
2221           ;
2222         /* Comparisons with 0 are often used for booleans and there is
2223            nothing useful to predict about them.  */
2224         else if (XEXP (cond, 1) == const0_rtx
2225                  || XEXP (cond, 0) == const0_rtx)
2226           ;
2227         else
2228           predict_insn_def (last_insn, PRED_OPCODE_NONEQUAL, TAKEN);
2229         break;
2230
2231       case ORDERED:
2232         predict_insn_def (last_insn, PRED_FPOPCODE, TAKEN);
2233         break;
2234
2235       case UNORDERED:
2236         predict_insn_def (last_insn, PRED_FPOPCODE, NOT_TAKEN);
2237         break;
2238
2239       case LE:
2240       case LT:
2241         if (XEXP (cond, 1) == const0_rtx || XEXP (cond, 1) == const1_rtx
2242             || XEXP (cond, 1) == constm1_rtx)
2243           predict_insn_def (last_insn, PRED_OPCODE_POSITIVE, NOT_TAKEN);
2244         break;
2245
2246       case GE:
2247       case GT:
2248         if (XEXP (cond, 1) == const0_rtx || XEXP (cond, 1) == const1_rtx
2249             || XEXP (cond, 1) == constm1_rtx)
2250           predict_insn_def (last_insn, PRED_OPCODE_POSITIVE, TAKEN);
2251         break;
2252
2253       default:
2254         break;
2255       }
2256 }
2257
2258 /* Set edge->probability for each successor edge of BB.  */
2259 void
2260 guess_outgoing_edge_probabilities (basic_block bb)
2261 {
2262   bb_estimate_probability_locally (bb);
2263   combine_predictions_for_insn (BB_END (bb), bb);
2264 }
2265 \f
2266 static tree expr_expected_value (tree, bitmap, enum br_predictor *predictor,
2267                                  HOST_WIDE_INT *probability);
2268
2269 /* Helper function for expr_expected_value.  */
2270
2271 static tree
2272 expr_expected_value_1 (tree type, tree op0, enum tree_code code,
2273                        tree op1, bitmap visited, enum br_predictor *predictor,
2274                        HOST_WIDE_INT *probability)
2275 {
2276   gimple *def;
2277
2278   /* Reset returned probability value.  */
2279   *probability = -1;
2280   *predictor = PRED_UNCONDITIONAL;
2281
2282   if (get_gimple_rhs_class (code) == GIMPLE_SINGLE_RHS)
2283     {
2284       if (TREE_CONSTANT (op0))
2285         return op0;
2286
2287       if (code == IMAGPART_EXPR)
2288         {
2289           if (TREE_CODE (TREE_OPERAND (op0, 0)) == SSA_NAME)
2290             {
2291               def = SSA_NAME_DEF_STMT (TREE_OPERAND (op0, 0));
2292               if (is_gimple_call (def)
2293                   && gimple_call_internal_p (def)
2294                   && (gimple_call_internal_fn (def)
2295                       == IFN_ATOMIC_COMPARE_EXCHANGE))
2296                 {
2297                   /* Assume that any given atomic operation has low contention,
2298                      and thus the compare-and-swap operation succeeds.  */
2299                   *predictor = PRED_COMPARE_AND_SWAP;
2300                   return build_one_cst (TREE_TYPE (op0));
2301                 }
2302             }
2303         }
2304
2305       if (code != SSA_NAME)
2306         return NULL_TREE;
2307
2308       def = SSA_NAME_DEF_STMT (op0);
2309
2310       /* If we were already here, break the infinite cycle.  */
2311       if (!bitmap_set_bit (visited, SSA_NAME_VERSION (op0)))
2312         return NULL;
2313
2314       if (gimple_code (def) == GIMPLE_PHI)
2315         {
2316           /* All the arguments of the PHI node must have the same constant
2317              length.  */
2318           int i, n = gimple_phi_num_args (def);
2319           tree val = NULL, new_val;
2320
2321           for (i = 0; i < n; i++)
2322             {
2323               tree arg = PHI_ARG_DEF (def, i);
2324               enum br_predictor predictor2;
2325
2326               /* If this PHI has itself as an argument, we cannot
2327                  determine the string length of this argument.  However,
2328                  if we can find an expected constant value for the other
2329                  PHI args then we can still be sure that this is
2330                  likely a constant.  So be optimistic and just
2331                  continue with the next argument.  */
2332               if (arg == PHI_RESULT (def))
2333                 continue;
2334
2335               HOST_WIDE_INT probability2;
2336               new_val = expr_expected_value (arg, visited, &predictor2,
2337                                              &probability2);
2338
2339               /* It is difficult to combine value predictors.  Simply assume
2340                  that later predictor is weaker and take its prediction.  */
2341               if (*predictor < predictor2)
2342                 {
2343                   *predictor = predictor2;
2344                   *probability = probability2;
2345                 }
2346               if (!new_val)
2347                 return NULL;
2348               if (!val)
2349                 val = new_val;
2350               else if (!operand_equal_p (val, new_val, false))
2351                 return NULL;
2352             }
2353           return val;
2354         }
2355       if (is_gimple_assign (def))
2356         {
2357           if (gimple_assign_lhs (def) != op0)
2358             return NULL;
2359
2360           return expr_expected_value_1 (TREE_TYPE (gimple_assign_lhs (def)),
2361                                         gimple_assign_rhs1 (def),
2362                                         gimple_assign_rhs_code (def),
2363                                         gimple_assign_rhs2 (def),
2364                                         visited, predictor, probability);
2365         }
2366
2367       if (is_gimple_call (def))
2368         {
2369           tree decl = gimple_call_fndecl (def);
2370           if (!decl)
2371             {
2372               if (gimple_call_internal_p (def)
2373                   && gimple_call_internal_fn (def) == IFN_BUILTIN_EXPECT)
2374                 {
2375                   gcc_assert (gimple_call_num_args (def) == 3);
2376                   tree val = gimple_call_arg (def, 0);
2377                   if (TREE_CONSTANT (val))
2378                     return val;
2379                   tree val2 = gimple_call_arg (def, 2);
2380                   gcc_assert (TREE_CODE (val2) == INTEGER_CST
2381                               && tree_fits_uhwi_p (val2)
2382                               && tree_to_uhwi (val2) < END_PREDICTORS);
2383                   *predictor = (enum br_predictor) tree_to_uhwi (val2);
2384                   if (*predictor == PRED_BUILTIN_EXPECT)
2385                     *probability
2386                       = HITRATE (PARAM_VALUE (BUILTIN_EXPECT_PROBABILITY));
2387                   return gimple_call_arg (def, 1);
2388                 }
2389               return NULL;
2390             }
2391
2392           if (DECL_IS_MALLOC (decl) || DECL_IS_OPERATOR_NEW (decl))
2393             {
2394               if (predictor)
2395                 *predictor = PRED_MALLOC_NONNULL;
2396               return boolean_true_node;
2397             }
2398
2399           if (DECL_BUILT_IN_CLASS (decl) == BUILT_IN_NORMAL)
2400             switch (DECL_FUNCTION_CODE (decl))
2401               {
2402               case BUILT_IN_EXPECT:
2403                 {
2404                   tree val;
2405                   if (gimple_call_num_args (def) != 2)
2406                     return NULL;
2407                   val = gimple_call_arg (def, 0);
2408                   if (TREE_CONSTANT (val))
2409                     return val;
2410                   *predictor = PRED_BUILTIN_EXPECT;
2411                   *probability
2412                     = HITRATE (PARAM_VALUE (BUILTIN_EXPECT_PROBABILITY));
2413                   return gimple_call_arg (def, 1);
2414                 }
2415               case BUILT_IN_EXPECT_WITH_PROBABILITY:
2416                 {
2417                   tree val;
2418                   if (gimple_call_num_args (def) != 3)
2419                     return NULL;
2420                   val = gimple_call_arg (def, 0);
2421                   if (TREE_CONSTANT (val))
2422                     return val;
2423                   /* Compute final probability as:
2424                      probability * REG_BR_PROB_BASE.  */
2425                   tree prob = gimple_call_arg (def, 2);
2426                   tree t = TREE_TYPE (prob);
2427                   tree base = build_int_cst (integer_type_node,
2428                                              REG_BR_PROB_BASE);
2429                   base = build_real_from_int_cst (t, base);
2430                   tree r = fold_build2_initializer_loc (UNKNOWN_LOCATION,
2431                                                         MULT_EXPR, t, prob, base);
2432                   HOST_WIDE_INT probi
2433                     = real_to_integer (TREE_REAL_CST_PTR (r));
2434                   if (probi >= 0 && probi <= REG_BR_PROB_BASE)
2435                     {
2436                       *predictor = PRED_BUILTIN_EXPECT_WITH_PROBABILITY;
2437                       *probability = probi;
2438                     }
2439                   return gimple_call_arg (def, 1);
2440                 }
2441
2442               case BUILT_IN_SYNC_BOOL_COMPARE_AND_SWAP_N:
2443               case BUILT_IN_SYNC_BOOL_COMPARE_AND_SWAP_1:
2444               case BUILT_IN_SYNC_BOOL_COMPARE_AND_SWAP_2:
2445               case BUILT_IN_SYNC_BOOL_COMPARE_AND_SWAP_4:
2446               case BUILT_IN_SYNC_BOOL_COMPARE_AND_SWAP_8:
2447               case BUILT_IN_SYNC_BOOL_COMPARE_AND_SWAP_16:
2448               case BUILT_IN_ATOMIC_COMPARE_EXCHANGE:
2449               case BUILT_IN_ATOMIC_COMPARE_EXCHANGE_N:
2450               case BUILT_IN_ATOMIC_COMPARE_EXCHANGE_1:
2451               case BUILT_IN_ATOMIC_COMPARE_EXCHANGE_2:
2452               case BUILT_IN_ATOMIC_COMPARE_EXCHANGE_4:
2453               case BUILT_IN_ATOMIC_COMPARE_EXCHANGE_8:
2454               case BUILT_IN_ATOMIC_COMPARE_EXCHANGE_16:
2455                 /* Assume that any given atomic operation has low contention,
2456                    and thus the compare-and-swap operation succeeds.  */
2457                 *predictor = PRED_COMPARE_AND_SWAP;
2458                 return boolean_true_node;
2459               case BUILT_IN_REALLOC:
2460                 if (predictor)
2461                   *predictor = PRED_MALLOC_NONNULL;
2462                 return boolean_true_node;
2463               default:
2464                 break;
2465             }
2466         }
2467
2468       return NULL;
2469     }
2470
2471   if (get_gimple_rhs_class (code) == GIMPLE_BINARY_RHS)
2472     {
2473       tree res;
2474       enum br_predictor predictor2;
2475       HOST_WIDE_INT probability2;
2476       op0 = expr_expected_value (op0, visited, predictor, probability);
2477       if (!op0)
2478         return NULL;
2479       op1 = expr_expected_value (op1, visited, &predictor2, &probability2);
2480       if (!op1)
2481         return NULL;
2482       res = fold_build2 (code, type, op0, op1);
2483       if (TREE_CODE (res) == INTEGER_CST
2484           && TREE_CODE (op0) == INTEGER_CST
2485           && TREE_CODE (op1) == INTEGER_CST)
2486         {
2487           /* Combine binary predictions.  */
2488           if (*probability != -1 || probability2 != -1)
2489             {
2490               HOST_WIDE_INT p1 = get_predictor_value (*predictor, *probability);
2491               HOST_WIDE_INT p2 = get_predictor_value (predictor2, probability2);
2492               *probability = RDIV (p1 * p2, REG_BR_PROB_BASE);
2493             }
2494
2495           if (*predictor < predictor2)
2496             *predictor = predictor2;
2497
2498           return res;
2499         }
2500       return NULL;
2501     }
2502   if (get_gimple_rhs_class (code) == GIMPLE_UNARY_RHS)
2503     {
2504       tree res;
2505       op0 = expr_expected_value (op0, visited, predictor, probability);
2506       if (!op0)
2507         return NULL;
2508       res = fold_build1 (code, type, op0);
2509       if (TREE_CONSTANT (res))
2510         return res;
2511       return NULL;
2512     }
2513   return NULL;
2514 }
2515
2516 /* Return constant EXPR will likely have at execution time, NULL if unknown.
2517    The function is used by builtin_expect branch predictor so the evidence
2518    must come from this construct and additional possible constant folding.
2519
2520    We may want to implement more involved value guess (such as value range
2521    propagation based prediction), but such tricks shall go to new
2522    implementation.  */
2523
2524 static tree
2525 expr_expected_value (tree expr, bitmap visited,
2526                      enum br_predictor *predictor,
2527                      HOST_WIDE_INT *probability)
2528 {
2529   enum tree_code code;
2530   tree op0, op1;
2531
2532   if (TREE_CONSTANT (expr))
2533     {
2534       *predictor = PRED_UNCONDITIONAL;
2535       *probability = -1;
2536       return expr;
2537     }
2538
2539   extract_ops_from_tree (expr, &code, &op0, &op1);
2540   return expr_expected_value_1 (TREE_TYPE (expr),
2541                                 op0, code, op1, visited, predictor,
2542                                 probability);
2543 }
2544 \f
2545
2546 /* Return probability of a PREDICTOR.  If the predictor has variable
2547    probability return passed PROBABILITY.  */
2548
2549 static HOST_WIDE_INT
2550 get_predictor_value (br_predictor predictor, HOST_WIDE_INT probability)
2551 {
2552   switch (predictor)
2553     {
2554     case PRED_BUILTIN_EXPECT:
2555     case PRED_BUILTIN_EXPECT_WITH_PROBABILITY:
2556       gcc_assert (probability != -1);
2557       return probability;
2558     default:
2559       gcc_assert (probability == -1);
2560       return predictor_info[(int) predictor].hitrate;
2561     }
2562 }
2563
2564 /* Predict using opcode of the last statement in basic block.  */
2565 static void
2566 tree_predict_by_opcode (basic_block bb)
2567 {
2568   gimple *stmt = last_stmt (bb);
2569   edge then_edge;
2570   tree op0, op1;
2571   tree type;
2572   tree val;
2573   enum tree_code cmp;
2574   edge_iterator ei;
2575   enum br_predictor predictor;
2576   HOST_WIDE_INT probability;
2577
2578   if (!stmt || gimple_code (stmt) != GIMPLE_COND)
2579     return;
2580   FOR_EACH_EDGE (then_edge, ei, bb->succs)
2581     if (then_edge->flags & EDGE_TRUE_VALUE)
2582       break;
2583   op0 = gimple_cond_lhs (stmt);
2584   op1 = gimple_cond_rhs (stmt);
2585   cmp = gimple_cond_code (stmt);
2586   type = TREE_TYPE (op0);
2587   val = expr_expected_value_1 (boolean_type_node, op0, cmp, op1, auto_bitmap (),
2588                                &predictor, &probability);
2589   if (val && TREE_CODE (val) == INTEGER_CST)
2590     {
2591       HOST_WIDE_INT prob = get_predictor_value (predictor, probability);
2592       if (integer_zerop (val))
2593         prob = REG_BR_PROB_BASE - prob;
2594       predict_edge (then_edge, predictor, prob);
2595     }
2596   /* Try "pointer heuristic."
2597      A comparison ptr == 0 is predicted as false.
2598      Similarly, a comparison ptr1 == ptr2 is predicted as false.  */
2599   if (POINTER_TYPE_P (type))
2600     {
2601       if (cmp == EQ_EXPR)
2602         predict_edge_def (then_edge, PRED_TREE_POINTER, NOT_TAKEN);
2603       else if (cmp == NE_EXPR)
2604         predict_edge_def (then_edge, PRED_TREE_POINTER, TAKEN);
2605     }
2606   else
2607
2608   /* Try "opcode heuristic."
2609      EQ tests are usually false and NE tests are usually true. Also,
2610      most quantities are positive, so we can make the appropriate guesses
2611      about signed comparisons against zero.  */
2612     switch (cmp)
2613       {
2614       case EQ_EXPR:
2615       case UNEQ_EXPR:
2616         /* Floating point comparisons appears to behave in a very
2617            unpredictable way because of special role of = tests in
2618            FP code.  */
2619         if (FLOAT_TYPE_P (type))
2620           ;
2621         /* Comparisons with 0 are often used for booleans and there is
2622            nothing useful to predict about them.  */
2623         else if (integer_zerop (op0) || integer_zerop (op1))
2624           ;
2625         else
2626           predict_edge_def (then_edge, PRED_TREE_OPCODE_NONEQUAL, NOT_TAKEN);
2627         break;
2628
2629       case NE_EXPR:
2630       case LTGT_EXPR:
2631         /* Floating point comparisons appears to behave in a very
2632            unpredictable way because of special role of = tests in
2633            FP code.  */
2634         if (FLOAT_TYPE_P (type))
2635           ;
2636         /* Comparisons with 0 are often used for booleans and there is
2637            nothing useful to predict about them.  */
2638         else if (integer_zerop (op0)
2639                  || integer_zerop (op1))
2640           ;
2641         else
2642           predict_edge_def (then_edge, PRED_TREE_OPCODE_NONEQUAL, TAKEN);
2643         break;
2644
2645       case ORDERED_EXPR:
2646         predict_edge_def (then_edge, PRED_TREE_FPOPCODE, TAKEN);
2647         break;
2648
2649       case UNORDERED_EXPR:
2650         predict_edge_def (then_edge, PRED_TREE_FPOPCODE, NOT_TAKEN);
2651         break;
2652
2653       case LE_EXPR:
2654       case LT_EXPR:
2655         if (integer_zerop (op1)
2656             || integer_onep (op1)
2657             || integer_all_onesp (op1)
2658             || real_zerop (op1)
2659             || real_onep (op1)
2660             || real_minus_onep (op1))
2661           predict_edge_def (then_edge, PRED_TREE_OPCODE_POSITIVE, NOT_TAKEN);
2662         break;
2663
2664       case GE_EXPR:
2665       case GT_EXPR:
2666         if (integer_zerop (op1)
2667             || integer_onep (op1)
2668             || integer_all_onesp (op1)
2669             || real_zerop (op1)
2670             || real_onep (op1)
2671             || real_minus_onep (op1))
2672           predict_edge_def (then_edge, PRED_TREE_OPCODE_POSITIVE, TAKEN);
2673         break;
2674
2675       default:
2676         break;
2677       }
2678 }
2679
2680 /* Returns TRUE if the STMT is exit(0) like statement. */
2681
2682 static bool
2683 is_exit_with_zero_arg (const gimple *stmt)
2684 {
2685   /* This is not exit, _exit or _Exit. */
2686   if (!gimple_call_builtin_p (stmt, BUILT_IN_EXIT)
2687       && !gimple_call_builtin_p (stmt, BUILT_IN__EXIT)
2688       && !gimple_call_builtin_p (stmt, BUILT_IN__EXIT2))
2689     return false;
2690
2691   /* Argument is an interger zero. */
2692   return integer_zerop (gimple_call_arg (stmt, 0));
2693 }
2694
2695 /* Try to guess whether the value of return means error code.  */
2696
2697 static enum br_predictor
2698 return_prediction (tree val, enum prediction *prediction)
2699 {
2700   /* VOID.  */
2701   if (!val)
2702     return PRED_NO_PREDICTION;
2703   /* Different heuristics for pointers and scalars.  */
2704   if (POINTER_TYPE_P (TREE_TYPE (val)))
2705     {
2706       /* NULL is usually not returned.  */
2707       if (integer_zerop (val))
2708         {
2709           *prediction = NOT_TAKEN;
2710           return PRED_NULL_RETURN;
2711         }
2712     }
2713   else if (INTEGRAL_TYPE_P (TREE_TYPE (val)))
2714     {
2715       /* Negative return values are often used to indicate
2716          errors.  */
2717       if (TREE_CODE (val) == INTEGER_CST
2718           && tree_int_cst_sgn (val) < 0)
2719         {
2720           *prediction = NOT_TAKEN;
2721           return PRED_NEGATIVE_RETURN;
2722         }
2723       /* Constant return values seems to be commonly taken.
2724          Zero/one often represent booleans so exclude them from the
2725          heuristics.  */
2726       if (TREE_CONSTANT (val)
2727           && (!integer_zerop (val) && !integer_onep (val)))
2728         {
2729           *prediction = NOT_TAKEN;
2730           return PRED_CONST_RETURN;
2731         }
2732     }
2733   return PRED_NO_PREDICTION;
2734 }
2735
2736 /* Return zero if phi result could have values other than -1, 0 or 1,
2737    otherwise return a bitmask, with bits 0, 1 and 2 set if -1, 0 and 1
2738    values are used or likely.  */
2739
2740 static int
2741 zero_one_minusone (gphi *phi, int limit)
2742 {
2743   int phi_num_args = gimple_phi_num_args (phi);
2744   int ret = 0;
2745   for (int i = 0; i < phi_num_args; i++)
2746     {
2747       tree t = PHI_ARG_DEF (phi, i);
2748       if (TREE_CODE (t) != INTEGER_CST)
2749         continue;
2750       wide_int w = wi::to_wide (t);
2751       if (w == -1)
2752         ret |= 1;
2753       else if (w == 0)
2754         ret |= 2;
2755       else if (w == 1)
2756         ret |= 4;
2757       else
2758         return 0;
2759     }
2760   for (int i = 0; i < phi_num_args; i++)
2761     {
2762       tree t = PHI_ARG_DEF (phi, i);
2763       if (TREE_CODE (t) == INTEGER_CST)
2764         continue;
2765       if (TREE_CODE (t) != SSA_NAME)
2766         return 0;
2767       gimple *g = SSA_NAME_DEF_STMT (t);
2768       if (gimple_code (g) == GIMPLE_PHI && limit > 0)
2769         if (int r = zero_one_minusone (as_a <gphi *> (g), limit - 1))
2770           {
2771             ret |= r;
2772             continue;
2773           }
2774       if (!is_gimple_assign (g))
2775         return 0;
2776       if (gimple_assign_cast_p (g))
2777         {
2778           tree rhs1 = gimple_assign_rhs1 (g);
2779           if (TREE_CODE (rhs1) != SSA_NAME
2780               || !INTEGRAL_TYPE_P (TREE_TYPE (rhs1))
2781               || TYPE_PRECISION (TREE_TYPE (rhs1)) != 1
2782               || !TYPE_UNSIGNED (TREE_TYPE (rhs1)))
2783             return 0;
2784           ret |= (2 | 4);
2785           continue;
2786         }
2787       if (TREE_CODE_CLASS (gimple_assign_rhs_code (g)) != tcc_comparison)
2788         return 0;
2789       ret |= (2 | 4);
2790     }
2791   return ret;
2792 }
2793
2794 /* Find the basic block with return expression and look up for possible
2795    return value trying to apply RETURN_PREDICTION heuristics.  */
2796 static void
2797 apply_return_prediction (void)
2798 {
2799   greturn *return_stmt = NULL;
2800   tree return_val;
2801   edge e;
2802   gphi *phi;
2803   int phi_num_args, i;
2804   enum br_predictor pred;
2805   enum prediction direction;
2806   edge_iterator ei;
2807
2808   FOR_EACH_EDGE (e, ei, EXIT_BLOCK_PTR_FOR_FN (cfun)->preds)
2809     {
2810       gimple *last = last_stmt (e->src);
2811       if (last
2812           && gimple_code (last) == GIMPLE_RETURN)
2813         {
2814           return_stmt = as_a <greturn *> (last);
2815           break;
2816         }
2817     }
2818   if (!e)
2819     return;
2820   return_val = gimple_return_retval (return_stmt);
2821   if (!return_val)
2822     return;
2823   if (TREE_CODE (return_val) != SSA_NAME
2824       || !SSA_NAME_DEF_STMT (return_val)
2825       || gimple_code (SSA_NAME_DEF_STMT (return_val)) != GIMPLE_PHI)
2826     return;
2827   phi = as_a <gphi *> (SSA_NAME_DEF_STMT (return_val));
2828   phi_num_args = gimple_phi_num_args (phi);
2829   pred = return_prediction (PHI_ARG_DEF (phi, 0), &direction);
2830
2831   /* Avoid the case where the function returns -1, 0 and 1 values and
2832      nothing else.  Those could be qsort etc. comparison functions
2833      where the negative return isn't less probable than positive.
2834      For this require that the function returns at least -1 or 1
2835      or -1 and a boolean value or comparison result, so that functions
2836      returning just -1 and 0 are treated as if -1 represents error value.  */
2837   if (INTEGRAL_TYPE_P (TREE_TYPE (return_val))
2838       && !TYPE_UNSIGNED (TREE_TYPE (return_val))
2839       && TYPE_PRECISION (TREE_TYPE (return_val)) > 1)
2840     if (int r = zero_one_minusone (phi, 3))
2841       if ((r & (1 | 4)) == (1 | 4))
2842         return;
2843
2844   /* Avoid the degenerate case where all return values form the function
2845      belongs to same category (ie they are all positive constants)
2846      so we can hardly say something about them.  */
2847   for (i = 1; i < phi_num_args; i++)
2848     if (pred != return_prediction (PHI_ARG_DEF (phi, i), &direction))
2849       break;
2850   if (i != phi_num_args)
2851     for (i = 0; i < phi_num_args; i++)
2852       {
2853         pred = return_prediction (PHI_ARG_DEF (phi, i), &direction);
2854         if (pred != PRED_NO_PREDICTION)
2855           predict_paths_leading_to_edge (gimple_phi_arg_edge (phi, i), pred,
2856                                          direction);
2857       }
2858 }
2859
2860 /* Look for basic block that contains unlikely to happen events
2861    (such as noreturn calls) and mark all paths leading to execution
2862    of this basic blocks as unlikely.  */
2863
2864 static void
2865 tree_bb_level_predictions (void)
2866 {
2867   basic_block bb;
2868   bool has_return_edges = false;
2869   edge e;
2870   edge_iterator ei;
2871
2872   FOR_EACH_EDGE (e, ei, EXIT_BLOCK_PTR_FOR_FN (cfun)->preds)
2873     if (!unlikely_executed_edge_p (e) && !(e->flags & EDGE_ABNORMAL_CALL))
2874       {
2875         has_return_edges = true;
2876         break;
2877       }
2878
2879   apply_return_prediction ();
2880
2881   FOR_EACH_BB_FN (bb, cfun)
2882     {
2883       gimple_stmt_iterator gsi;
2884
2885       for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
2886         {
2887           gimple *stmt = gsi_stmt (gsi);
2888           tree decl;
2889
2890           if (is_gimple_call (stmt))
2891             {
2892               if (gimple_call_noreturn_p (stmt)
2893                   && has_return_edges
2894                   && !is_exit_with_zero_arg (stmt))
2895                 predict_paths_leading_to (bb, PRED_NORETURN,
2896                                           NOT_TAKEN);
2897               decl = gimple_call_fndecl (stmt);
2898               if (decl
2899                   && lookup_attribute ("cold",
2900                                        DECL_ATTRIBUTES (decl)))
2901                 predict_paths_leading_to (bb, PRED_COLD_FUNCTION,
2902                                           NOT_TAKEN);
2903               if (decl && recursive_call_p (current_function_decl, decl))
2904                 predict_paths_leading_to (bb, PRED_RECURSIVE_CALL,
2905                                           NOT_TAKEN);
2906             }
2907           else if (gimple_code (stmt) == GIMPLE_PREDICT)
2908             {
2909               predict_paths_leading_to (bb, gimple_predict_predictor (stmt),
2910                                         gimple_predict_outcome (stmt));
2911               /* Keep GIMPLE_PREDICT around so early inlining will propagate
2912                  hints to callers.  */
2913             }
2914         }
2915     }
2916 }
2917
2918 /* Callback for hash_map::traverse, asserts that the pointer map is
2919    empty.  */
2920
2921 bool
2922 assert_is_empty (const_basic_block const &, edge_prediction *const &value,
2923                  void *)
2924 {
2925   gcc_assert (!value);
2926   return false;
2927 }
2928
2929 /* Predict branch probabilities and estimate profile for basic block BB.
2930    When LOCAL_ONLY is set do not use any global properties of CFG.  */
2931
2932 static void
2933 tree_estimate_probability_bb (basic_block bb, bool local_only)
2934 {
2935   edge e;
2936   edge_iterator ei;
2937
2938   FOR_EACH_EDGE (e, ei, bb->succs)
2939     {
2940       /* Look for block we are guarding (ie we dominate it,
2941          but it doesn't postdominate us).  */
2942       if (e->dest != EXIT_BLOCK_PTR_FOR_FN (cfun) && e->dest != bb
2943           && !local_only
2944           && dominated_by_p (CDI_DOMINATORS, e->dest, e->src)
2945           && !dominated_by_p (CDI_POST_DOMINATORS, e->src, e->dest))
2946         {
2947           gimple_stmt_iterator bi;
2948
2949           /* The call heuristic claims that a guarded function call
2950              is improbable.  This is because such calls are often used
2951              to signal exceptional situations such as printing error
2952              messages.  */
2953           for (bi = gsi_start_bb (e->dest); !gsi_end_p (bi);
2954                gsi_next (&bi))
2955             {
2956               gimple *stmt = gsi_stmt (bi);
2957               if (is_gimple_call (stmt)
2958                   && !gimple_inexpensive_call_p (as_a <gcall *>  (stmt))
2959                   /* Constant and pure calls are hardly used to signalize
2960                      something exceptional.  */
2961                   && gimple_has_side_effects (stmt))
2962                 {
2963                   if (gimple_call_fndecl (stmt))
2964                     predict_edge_def (e, PRED_CALL, NOT_TAKEN);
2965                   else if (virtual_method_call_p (gimple_call_fn (stmt)))
2966                     predict_edge_def (e, PRED_POLYMORPHIC_CALL, NOT_TAKEN);
2967                   else
2968                     predict_edge_def (e, PRED_INDIR_CALL, TAKEN);
2969                   break;
2970                 }
2971             }
2972         }
2973     }
2974   tree_predict_by_opcode (bb);
2975 }
2976
2977 /* Predict branch probabilities and estimate profile of the tree CFG.
2978    This function can be called from the loop optimizers to recompute
2979    the profile information.
2980    If DRY_RUN is set, do not modify CFG and only produce dump files.  */
2981
2982 void
2983 tree_estimate_probability (bool dry_run)
2984 {
2985   basic_block bb;
2986
2987   add_noreturn_fake_exit_edges ();
2988   connect_infinite_loops_to_exit ();
2989   /* We use loop_niter_by_eval, which requires that the loops have
2990      preheaders.  */
2991   create_preheaders (CP_SIMPLE_PREHEADERS);
2992   calculate_dominance_info (CDI_POST_DOMINATORS);
2993
2994   bb_predictions = new hash_map<const_basic_block, edge_prediction *>;
2995   tree_bb_level_predictions ();
2996   record_loop_exits ();
2997
2998   if (number_of_loops (cfun) > 1)
2999     predict_loops ();
3000
3001   FOR_EACH_BB_FN (bb, cfun)
3002     tree_estimate_probability_bb (bb, false);
3003
3004   FOR_EACH_BB_FN (bb, cfun)
3005     combine_predictions_for_bb (bb, dry_run);
3006
3007   if (flag_checking)
3008     bb_predictions->traverse<void *, assert_is_empty> (NULL);
3009
3010   delete bb_predictions;
3011   bb_predictions = NULL;
3012
3013   if (!dry_run)
3014     estimate_bb_frequencies (false);
3015   free_dominance_info (CDI_POST_DOMINATORS);
3016   remove_fake_exit_edges ();
3017 }
3018
3019 /* Set edge->probability for each successor edge of BB.  */
3020 void
3021 tree_guess_outgoing_edge_probabilities (basic_block bb)
3022 {
3023   bb_predictions = new hash_map<const_basic_block, edge_prediction *>;
3024   tree_estimate_probability_bb (bb, true);
3025   combine_predictions_for_bb (bb, false);
3026   if (flag_checking)
3027     bb_predictions->traverse<void *, assert_is_empty> (NULL);
3028   delete bb_predictions;
3029   bb_predictions = NULL;
3030 }
3031 \f
3032 /* Predict edges to successors of CUR whose sources are not postdominated by
3033    BB by PRED and recurse to all postdominators.  */
3034
3035 static void
3036 predict_paths_for_bb (basic_block cur, basic_block bb,
3037                       enum br_predictor pred,
3038                       enum prediction taken,
3039                       bitmap visited, struct loop *in_loop = NULL)
3040 {
3041   edge e;
3042   edge_iterator ei;
3043   basic_block son;
3044
3045   /* If we exited the loop or CUR is unconditional in the loop, there is
3046      nothing to do.  */
3047   if (in_loop
3048       && (!flow_bb_inside_loop_p (in_loop, cur)
3049           || dominated_by_p (CDI_DOMINATORS, in_loop->latch, cur)))
3050     return;
3051
3052   /* We are looking for all edges forming edge cut induced by
3053      set of all blocks postdominated by BB.  */
3054   FOR_EACH_EDGE (e, ei, cur->preds)
3055     if (e->src->index >= NUM_FIXED_BLOCKS
3056         && !dominated_by_p (CDI_POST_DOMINATORS, e->src, bb))
3057     {
3058       edge e2;
3059       edge_iterator ei2;
3060       bool found = false;
3061
3062       /* Ignore fake edges and eh, we predict them as not taken anyway.  */
3063       if (unlikely_executed_edge_p (e))
3064         continue;
3065       gcc_assert (bb == cur || dominated_by_p (CDI_POST_DOMINATORS, cur, bb));
3066
3067       /* See if there is an edge from e->src that is not abnormal
3068          and does not lead to BB and does not exit the loop.  */
3069       FOR_EACH_EDGE (e2, ei2, e->src->succs)
3070         if (e2 != e
3071             && !unlikely_executed_edge_p (e2)
3072             && !dominated_by_p (CDI_POST_DOMINATORS, e2->dest, bb)
3073             && (!in_loop || !loop_exit_edge_p (in_loop, e2)))
3074           {
3075             found = true;
3076             break;
3077           }
3078
3079       /* If there is non-abnormal path leaving e->src, predict edge
3080          using predictor.  Otherwise we need to look for paths
3081          leading to e->src.
3082
3083          The second may lead to infinite loop in the case we are predicitng
3084          regions that are only reachable by abnormal edges.  We simply
3085          prevent visiting given BB twice.  */
3086       if (found)
3087         {
3088           if (!edge_predicted_by_p (e, pred, taken))
3089             predict_edge_def (e, pred, taken);
3090         }
3091       else if (bitmap_set_bit (visited, e->src->index))
3092         predict_paths_for_bb (e->src, e->src, pred, taken, visited, in_loop);
3093     }
3094   for (son = first_dom_son (CDI_POST_DOMINATORS, cur);
3095        son;
3096        son = next_dom_son (CDI_POST_DOMINATORS, son))
3097     predict_paths_for_bb (son, bb, pred, taken, visited, in_loop);
3098 }
3099
3100 /* Sets branch probabilities according to PREDiction and
3101    FLAGS.  */
3102
3103 static void
3104 predict_paths_leading_to (basic_block bb, enum br_predictor pred,
3105                           enum prediction taken, struct loop *in_loop)
3106 {
3107   predict_paths_for_bb (bb, bb, pred, taken, auto_bitmap (), in_loop);
3108 }
3109
3110 /* Like predict_paths_leading_to but take edge instead of basic block.  */
3111
3112 static void
3113 predict_paths_leading_to_edge (edge e, enum br_predictor pred,
3114                                enum prediction taken, struct loop *in_loop)
3115 {
3116   bool has_nonloop_edge = false;
3117   edge_iterator ei;
3118   edge e2;
3119
3120   basic_block bb = e->src;
3121   FOR_EACH_EDGE (e2, ei, bb->succs)
3122     if (e2->dest != e->src && e2->dest != e->dest
3123         && !unlikely_executed_edge_p (e)
3124         && !dominated_by_p (CDI_POST_DOMINATORS, e->src, e2->dest))
3125       {
3126         has_nonloop_edge = true;
3127         break;
3128       }
3129   if (!has_nonloop_edge)
3130     {
3131       predict_paths_for_bb (bb, bb, pred, taken, auto_bitmap (), in_loop);
3132     }
3133   else
3134     predict_edge_def (e, pred, taken);
3135 }
3136 \f
3137 /* This is used to carry information about basic blocks.  It is
3138    attached to the AUX field of the standard CFG block.  */
3139
3140 struct block_info
3141 {
3142   /* Estimated frequency of execution of basic_block.  */
3143   sreal frequency;
3144
3145   /* To keep queue of basic blocks to process.  */
3146   basic_block next;
3147
3148   /* Number of predecessors we need to visit first.  */
3149   int npredecessors;
3150 };
3151
3152 /* Similar information for edges.  */
3153 struct edge_prob_info
3154 {
3155   /* In case edge is a loopback edge, the probability edge will be reached
3156      in case header is.  Estimated number of iterations of the loop can be
3157      then computed as 1 / (1 - back_edge_prob).  */
3158   sreal back_edge_prob;
3159   /* True if the edge is a loopback edge in the natural loop.  */
3160   unsigned int back_edge:1;
3161 };
3162
/* Accessors for the data hung off the AUX field of block BB and
   edge E.  Any earlier definition of EDGE_INFO is discarded first.  */
#define BLOCK_INFO(BB)  ((block_info *) (BB)->aux)
#undef EDGE_INFO
#define EDGE_INFO(E)    ((edge_prob_info *) (E)->aux)
3166
3167 /* Helper function for estimate_bb_frequencies.
3168    Propagate the frequencies in blocks marked in
3169    TOVISIT, starting in HEAD.  */
3170
3171 static void
3172 propagate_freq (basic_block head, bitmap tovisit)
3173 {
3174   basic_block bb;
3175   basic_block last;
3176   unsigned i;
3177   edge e;
3178   basic_block nextbb;
3179   bitmap_iterator bi;
3180
3181   /* For each basic block we need to visit count number of his predecessors
3182      we need to visit first.  */
3183   EXECUTE_IF_SET_IN_BITMAP (tovisit, 0, i, bi)
3184     {
3185       edge_iterator ei;
3186       int count = 0;
3187
3188       bb = BASIC_BLOCK_FOR_FN (cfun, i);
3189
3190       FOR_EACH_EDGE (e, ei, bb->preds)
3191         {
3192           bool visit = bitmap_bit_p (tovisit, e->src->index);
3193
3194           if (visit && !(e->flags & EDGE_DFS_BACK))
3195             count++;
3196           else if (visit && dump_file && !EDGE_INFO (e)->back_edge)
3197             fprintf (dump_file,
3198                      "Irreducible region hit, ignoring edge to %i->%i\n",
3199                      e->src->index, bb->index);
3200         }
3201       BLOCK_INFO (bb)->npredecessors = count;
3202       /* When function never returns, we will never process exit block.  */
3203       if (!count && bb == EXIT_BLOCK_PTR_FOR_FN (cfun))
3204         bb->count = profile_count::zero ();
3205     }
3206
3207   BLOCK_INFO (head)->frequency = 1;
3208   last = head;
3209   for (bb = head; bb; bb = nextbb)
3210     {
3211       edge_iterator ei;
3212       sreal cyclic_probability = 0;
3213       sreal frequency = 0;
3214
3215       nextbb = BLOCK_INFO (bb)->next;
3216       BLOCK_INFO (bb)->next = NULL;
3217
3218       /* Compute frequency of basic block.  */
3219       if (bb != head)
3220         {
3221           if (flag_checking)
3222             FOR_EACH_EDGE (e, ei, bb->preds)
3223               gcc_assert (!bitmap_bit_p (tovisit, e->src->index)
3224                           || (e->flags & EDGE_DFS_BACK));
3225
3226           FOR_EACH_EDGE (e, ei, bb->preds)
3227             if (EDGE_INFO (e)->back_edge)
3228               {
3229                 cyclic_probability += EDGE_INFO (e)->back_edge_prob;
3230               }
3231             else if (!(e->flags & EDGE_DFS_BACK))
3232               {
3233                 /*  frequency += (e->probability
3234                                   * BLOCK_INFO (e->src)->frequency /
3235                                   REG_BR_PROB_BASE);  */
3236
3237                 /* FIXME: Graphite is producing edges with no profile. Once
3238                    this is fixed, drop this.  */
3239                 sreal tmp = e->probability.initialized_p () ?
3240                             e->probability.to_reg_br_prob_base () : 0;
3241                 tmp *= BLOCK_INFO (e->src)->frequency;
3242                 tmp *= real_inv_br_prob_base;
3243                 frequency += tmp;
3244               }
3245
3246           if (cyclic_probability == 0)
3247             {
3248               BLOCK_INFO (bb)->frequency = frequency;
3249             }
3250           else
3251             {
3252               if (cyclic_probability > real_almost_one)
3253                 cyclic_probability = real_almost_one;
3254
3255               /* BLOCK_INFO (bb)->frequency = frequency
3256                                               / (1 - cyclic_probability) */
3257
3258               cyclic_probability = sreal (1) - cyclic_probability;
3259               BLOCK_INFO (bb)->frequency = frequency / cyclic_probability;
3260             }
3261         }
3262
3263       bitmap_clear_bit (tovisit, bb->index);
3264
3265       e = find_edge (bb, head);
3266       if (e)
3267         {
3268           /* EDGE_INFO (e)->back_edge_prob
3269              = ((e->probability * BLOCK_INFO (bb)->frequency)
3270              / REG_BR_PROB_BASE); */
3271
3272           /* FIXME: Graphite is producing edges with no profile. Once
3273              this is fixed, drop this.  */
3274           sreal tmp = e->probability.initialized_p () ?
3275                       e->probability.to_reg_br_prob_base () : 0;
3276           tmp *= BLOCK_INFO (bb)->frequency;
3277           EDGE_INFO (e)->back_edge_prob = tmp * real_inv_br_prob_base;
3278         }
3279
3280       /* Propagate to successor blocks.  */
3281       FOR_EACH_EDGE (e, ei, bb->succs)
3282         if (!(e->flags & EDGE_DFS_BACK)
3283             && BLOCK_INFO (e->dest)->npredecessors)
3284           {
3285             BLOCK_INFO (e->dest)->npredecessors--;
3286             if (!BLOCK_INFO (e->dest)->npredecessors)
3287               {
3288                 if (!nextbb)
3289                   nextbb = e->dest;
3290                 else
3291                   BLOCK_INFO (last)->next = e->dest;
3292
3293                 last = e->dest;
3294               }
3295           }
3296     }
3297 }
3298
3299 /* Estimate frequencies in loops at same nest level.  */
3300
3301 static void
3302 estimate_loops_at_level (struct loop *first_loop)
3303 {
3304   struct loop *loop;
3305
3306   for (loop = first_loop; loop; loop = loop->next)
3307     {
3308       edge e;
3309       basic_block *bbs;
3310       unsigned i;
3311       auto_bitmap tovisit;
3312
3313       estimate_loops_at_level (loop->inner);
3314
3315       /* Find current loop back edge and mark it.  */
3316       e = loop_latch_edge (loop);
3317       EDGE_INFO (e)->back_edge = 1;
3318
3319       bbs = get_loop_body (loop);
3320       for (i = 0; i < loop->num_nodes; i++)
3321         bitmap_set_bit (tovisit, bbs[i]->index);
3322       free (bbs);
3323       propagate_freq (loop->header, tovisit);
3324     }
3325 }
3326
3327 /* Propagates frequencies through structure of loops.  */
3328
3329 static void
3330 estimate_loops (void)
3331 {
3332   auto_bitmap tovisit;
3333   basic_block bb;
3334
3335   /* Start by estimating the frequencies in the loops.  */
3336   if (number_of_loops (cfun) > 1)
3337     estimate_loops_at_level (current_loops->tree_root->inner);
3338
3339   /* Now propagate the frequencies through all the blocks.  */
3340   FOR_ALL_BB_FN (bb, cfun)
3341     {
3342       bitmap_set_bit (tovisit, bb->index);
3343     }
3344   propagate_freq (ENTRY_BLOCK_PTR_FOR_FN (cfun), tovisit);
3345 }
3346
3347 /* Drop the profile for NODE to guessed, and update its frequency based on
3348    whether it is expected to be hot given the CALL_COUNT.  */
3349
3350 static void
3351 drop_profile (struct cgraph_node *node, profile_count call_count)
3352 {
3353   struct function *fn = DECL_STRUCT_FUNCTION (node->decl);
3354   /* In the case where this was called by another function with a
3355      dropped profile, call_count will be 0. Since there are no
3356      non-zero call counts to this function, we don't know for sure
3357      whether it is hot, and therefore it will be marked normal below.  */
3358   bool hot = maybe_hot_count_p (NULL, call_count);
3359
3360   if (dump_file)
3361     fprintf (dump_file,
3362              "Dropping 0 profile for %s. %s based on calls.\n",
3363              node->dump_name (),
3364              hot ? "Function is hot" : "Function is normal");
3365   /* We only expect to miss profiles for functions that are reached
3366      via non-zero call edges in cases where the function may have
3367      been linked from another module or library (COMDATs and extern
3368      templates). See the comments below for handle_missing_profiles.
3369      Also, only warn in cases where the missing counts exceed the
3370      number of training runs. In certain cases with an execv followed
3371      by a no-return call the profile for the no-return call is not
3372      dumped and there can be a mismatch.  */
3373   if (!DECL_COMDAT (node->decl) && !DECL_EXTERNAL (node->decl)
3374       && call_count > profile_info->runs)
3375     {
3376       if (flag_profile_correction)
3377         {
3378           if (dump_file)
3379             fprintf (dump_file,
3380                      "Missing counts for called function %s\n",
3381                      node->dump_name ());
3382         }
3383       else
3384         warning (0, "Missing counts for called function %s",
3385                  node->dump_name ());
3386     }
3387
3388   basic_block bb;
3389   if (opt_for_fn (node->decl, flag_guess_branch_prob))
3390     {
3391       bool clear_zeros
3392          = !ENTRY_BLOCK_PTR_FOR_FN (fn)->count.nonzero_p ();
3393       FOR_ALL_BB_FN (bb, fn)
3394         if (clear_zeros || !(bb->count == profile_count::zero ()))
3395           bb->count = bb->count.guessed_local ();
3396       fn->cfg->count_max = fn->cfg->count_max.guessed_local ();
3397     }
3398   else
3399     {
3400       FOR_ALL_BB_FN (bb, fn)
3401         bb->count = profile_count::uninitialized ();
3402       fn->cfg->count_max = profile_count::uninitialized ();
3403     }
3404
3405   struct cgraph_edge *e;
3406   for (e = node->callees; e; e = e->next_callee)
3407     e->count = gimple_bb (e->call_stmt)->count;
3408   for (e = node->indirect_calls; e; e = e->next_callee)
3409     e->count = gimple_bb (e->call_stmt)->count;
3410   node->count = ENTRY_BLOCK_PTR_FOR_FN (fn)->count;
3411
3412   profile_status_for_fn (fn)
3413       = (flag_guess_branch_prob ? PROFILE_GUESSED : PROFILE_ABSENT);
3414   node->frequency
3415       = hot ? NODE_FREQUENCY_HOT : NODE_FREQUENCY_NORMAL;
3416 }
3417
3418 /* In the case of COMDAT routines, multiple object files will contain the same
3419    function and the linker will select one for the binary. In that case
3420    all the other copies from the profile instrument binary will be missing
3421    profile counts. Look for cases where this happened, due to non-zero
3422    call counts going to 0-count functions, and drop the profile to guessed
3423    so that we can use the estimated probabilities and avoid optimizing only
3424    for size.
3425
3426    The other case where the profile may be missing is when the routine
3427    is not going to be emitted to the object file, e.g. for "extern template"
3428    class methods. Those will be marked DECL_EXTERNAL. Emit a warning in
3429    all other cases of non-zero calls to 0-count functions.  */
3430
3431 void
3432 handle_missing_profiles (void)
3433 {
3434   struct cgraph_node *node;
3435   int unlikely_count_fraction = PARAM_VALUE (UNLIKELY_BB_COUNT_FRACTION);
3436   auto_vec<struct cgraph_node *, 64> worklist;
3437
3438   /* See if 0 count function has non-0 count callers.  In this case we
3439      lost some profile.  Drop its function profile to PROFILE_GUESSED.  */
3440   FOR_EACH_DEFINED_FUNCTION (node)
3441     {
3442       struct cgraph_edge *e;
3443       profile_count call_count = profile_count::zero ();
3444       gcov_type max_tp_first_run = 0;
3445       struct function *fn = DECL_STRUCT_FUNCTION (node->decl);
3446
3447       if (node->count.ipa ().nonzero_p ())
3448         continue;
3449       for (e = node->callers; e; e = e->next_caller)
3450         if (e->count.ipa ().initialized_p () && e->count.ipa () > 0)
3451           {
3452             call_count = call_count + e->count.ipa ();
3453
3454             if (e->caller->tp_first_run > max_tp_first_run)
3455               max_tp_first_run = e->caller->tp_first_run;
3456           }
3457
3458       /* If time profile is missing, let assign the maximum that comes from
3459          caller functions.  */
3460       if (!node->tp_first_run && max_tp_first_run)
3461         node->tp_first_run = max_tp_first_run + 1;
3462
3463       if (call_count > 0
3464           && fn && fn->cfg
3465           && (call_count.apply_scale (unlikely_count_fraction, 1)
3466               >= profile_info->runs))
3467         {
3468           drop_profile (node, call_count);
3469           worklist.safe_push (node);
3470         }
3471     }
3472
3473   /* Propagate the profile dropping to other 0-count COMDATs that are
3474      potentially called by COMDATs we already dropped the profile on.  */
3475   while (worklist.length () > 0)
3476     {
3477       struct cgraph_edge *e;
3478
3479       node = worklist.pop ();
3480       for (e = node->callees; e; e = e->next_caller)
3481         {
3482           struct cgraph_node *callee = e->callee;
3483           struct function *fn = DECL_STRUCT_FUNCTION (callee->decl);
3484
3485           if (!(e->count.ipa () == profile_count::zero ())
3486               && callee->count.ipa ().nonzero_p ())
3487             continue;
3488           if ((DECL_COMDAT (callee->decl) || DECL_EXTERNAL (callee->decl))
3489               && fn && fn->cfg
3490               && profile_status_for_fn (fn) == PROFILE_READ)
3491             {
3492               drop_profile (node, profile_count::zero ());
3493               worklist.safe_push (callee);
3494             }
3495         }
3496     }
3497 }
3498
3499 /* Convert counts measured by profile driven feedback to frequencies.
3500    Return nonzero iff there was any nonzero execution count.  */
3501
3502 bool
3503 update_max_bb_count (void)
3504 {
3505   profile_count true_count_max = profile_count::uninitialized ();
3506   basic_block bb;
3507
3508   FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (cfun), NULL, next_bb)
3509     true_count_max = true_count_max.max (bb->count);
3510
3511   cfun->cfg->count_max = true_count_max;
3512
3513   return true_count_max.ipa ().nonzero_p ();
3514 }
3515
3516 /* Return true if function is likely to be expensive, so there is no point to
3517    optimize performance of prologue, epilogue or do inlining at the expense
3518    of code size growth.  THRESHOLD is the limit of number of instructions
3519    function can execute at average to be still considered not expensive.  */
3520
3521 bool
3522 expensive_function_p (int threshold)
3523 {
3524   basic_block bb;
3525
3526   /* If profile was scaled in a way entry block has count 0, then the function
3527      is deifnitly taking a lot of time.  */
3528   if (!ENTRY_BLOCK_PTR_FOR_FN (cfun)->count.nonzero_p ())
3529     return true;
3530
3531   profile_count limit = ENTRY_BLOCK_PTR_FOR_FN
3532                            (cfun)->count.apply_scale (threshold, 1);
3533   profile_count sum = profile_count::zero ();
3534   FOR_EACH_BB_FN (bb, cfun)
3535     {
3536       rtx_insn *insn;
3537
3538       if (!bb->count.initialized_p ())
3539         {
3540           if (dump_file)
3541             fprintf (dump_file, "Function is considered expensive because"
3542                      " count of bb %i is not initialized\n", bb->index);
3543           return true;
3544         }
3545
3546       FOR_BB_INSNS (bb, insn)
3547         if (active_insn_p (insn))
3548           {
3549             sum += bb->count;
3550             if (sum > limit)
3551               return true;
3552         }
3553     }
3554
3555   return false;
3556 }
3557
3558 /* All basic blocks that are reachable only from unlikely basic blocks are
3559    unlikely.  */
3560
3561 void
3562 propagate_unlikely_bbs_forward (void)
3563 {
3564   auto_vec<basic_block, 64> worklist;
3565   basic_block bb;
3566   edge_iterator ei;
3567   edge e;
3568
3569   if (!(ENTRY_BLOCK_PTR_FOR_FN (cfun)->count == profile_count::zero ()))
3570     {
3571       ENTRY_BLOCK_PTR_FOR_FN (cfun)->aux = (void *)(size_t) 1;
3572       worklist.safe_push (ENTRY_BLOCK_PTR_FOR_FN (cfun));
3573
3574       while (worklist.length () > 0)
3575         {
3576           bb = worklist.pop ();
3577           FOR_EACH_EDGE (e, ei, bb->succs)
3578             if (!(e->count () == profile_count::zero ())
3579                 && !(e->dest->count == profile_count::zero ())
3580                 && !e->dest->aux)
3581               {
3582                 e->dest->aux = (void *)(size_t) 1;
3583                 worklist.safe_push (e->dest);
3584               }
3585         }
3586     }
3587
3588   FOR_ALL_BB_FN (bb, cfun)
3589     {
3590       if (!bb->aux)
3591         {
3592           if (!(bb->count == profile_count::zero ())
3593               && (dump_file && (dump_flags & TDF_DETAILS)))
3594             fprintf (dump_file,
3595                      "Basic block %i is marked unlikely by forward prop\n",
3596                      bb->index);
3597           bb->count = profile_count::zero ();
3598         }
3599       else
3600         bb->aux = NULL;
3601     }
3602 }
3603
3604 /* Determine basic blocks/edges that are known to be unlikely executed and set
3605    their counters to zero.
3606    This is done with first identifying obviously unlikely BBs/edges and then
3607    propagating in both directions.  */
3608
3609 static void
3610 determine_unlikely_bbs ()
3611 {
3612   basic_block bb;
3613   auto_vec<basic_block, 64> worklist;
3614   edge_iterator ei;
3615   edge e;
3616
3617   FOR_EACH_BB_FN (bb, cfun)
3618     {
3619       if (!(bb->count == profile_count::zero ())
3620           && unlikely_executed_bb_p (bb))
3621         {
3622           if (dump_file && (dump_flags & TDF_DETAILS))
3623             fprintf (dump_file, "Basic block %i is locally unlikely\n",
3624                      bb->index);
3625           bb->count = profile_count::zero ();
3626         }
3627
3628       FOR_EACH_EDGE (e, ei, bb->succs)
3629         if (!(e->probability == profile_probability::never ())
3630             && unlikely_executed_edge_p (e))
3631           {
3632             if (dump_file && (dump_flags & TDF_DETAILS))
3633               fprintf (dump_file, "Edge %i->%i is locally unlikely\n",
3634                        bb->index, e->dest->index);
3635             e->probability = profile_probability::never ();
3636           }
3637
3638       gcc_checking_assert (!bb->aux);
3639     }
3640   propagate_unlikely_bbs_forward ();
3641
3642   auto_vec<int, 64> nsuccs;
3643   nsuccs.safe_grow_cleared (last_basic_block_for_fn (cfun));
3644   FOR_ALL_BB_FN (bb, cfun)
3645     if (!(bb->count == profile_count::zero ())
3646         && bb != EXIT_BLOCK_PTR_FOR_FN (cfun))
3647       {
3648         nsuccs[bb->index] = 0;
3649         FOR_EACH_EDGE (e, ei, bb->succs)
3650           if (!(e->probability == profile_probability::never ())
3651               && !(e->dest->count == profile_count::zero ()))
3652             nsuccs[bb->index]++;
3653         if (!nsuccs[bb->index])
3654           worklist.safe_push (bb);
3655       }
3656   while (worklist.length () > 0)
3657     {
3658       bb = worklist.pop ();
3659       if (bb->count == profile_count::zero ())
3660         continue;
3661       if (bb != ENTRY_BLOCK_PTR_FOR_FN (cfun))
3662         {
3663           bool found = false;
3664           for (gimple_stmt_iterator gsi = gsi_start_bb (bb);
3665                !gsi_end_p (gsi); gsi_next (&gsi))
3666             if (stmt_can_terminate_bb_p (gsi_stmt (gsi))
3667                 /* stmt_can_terminate_bb_p special cases noreturns because it
3668                    assumes that fake edges are created.  We want to know that
3669                    noreturn alone does not imply BB to be unlikely.  */
3670                 || (is_gimple_call (gsi_stmt (gsi))
3671                     && (gimple_call_flags (gsi_stmt (gsi)) & ECF_NORETURN)))
3672               {
3673                 found = true;
3674                 break;
3675               }
3676           if (found)
3677             continue;
3678         }
3679       if (dump_file && (dump_flags & TDF_DETAILS))
3680         fprintf (dump_file,
3681                  "Basic block %i is marked unlikely by backward prop\n",
3682                  bb->index);
3683       bb->count = profile_count::zero ();
3684       FOR_EACH_EDGE (e, ei, bb->preds)
3685         if (!(e->probability == profile_probability::never ()))
3686           {
3687             if (!(e->src->count == profile_count::zero ()))
3688               {
3689                 gcc_checking_assert (nsuccs[e->src->index] > 0);
3690                 nsuccs[e->src->index]--;
3691                 if (!nsuccs[e->src->index])
3692                   worklist.safe_push (e->src);
3693               }
3694           }
3695     }
3696   /* Finally all edges from non-0 regions to 0 are unlikely.  */
3697   FOR_ALL_BB_FN (bb, cfun)
3698     if (!(bb->count == profile_count::zero ()))
3699       FOR_EACH_EDGE (e, ei, bb->succs)
3700         if (!(e->probability == profile_probability::never ())
3701             && e->dest->count == profile_count::zero ())
3702            {
3703              if (dump_file && (dump_flags & TDF_DETAILS))
3704                fprintf (dump_file, "Edge %i->%i is unlikely because "
3705                         "it enters unlikely block\n",
3706                         bb->index, e->dest->index);
3707              e->probability = profile_probability::never ();
3708            }
3709   if (ENTRY_BLOCK_PTR_FOR_FN (cfun)->count == profile_count::zero ())
3710     cgraph_node::get (current_function_decl)->count = profile_count::zero ();
3711 }
3712
3713 /* Estimate and propagate basic block frequencies using the given branch
3714    probabilities.  If FORCE is true, the frequencies are used to estimate
3715    the counts even when there are already non-zero profile counts.  */
3716
3717 void
3718 estimate_bb_frequencies (bool force)
3719 {
3720   basic_block bb;
3721   sreal freq_max;
3722
3723   determine_unlikely_bbs ();
3724
3725   if (force || profile_status_for_fn (cfun) != PROFILE_READ
3726       || !update_max_bb_count ())
3727     {
3728       static int real_values_initialized = 0;
3729
3730       if (!real_values_initialized)
3731         {
3732           real_values_initialized = 1;
3733           real_br_prob_base = REG_BR_PROB_BASE;
3734           /* Scaling frequencies up to maximal profile count may result in
3735              frequent overflows especially when inlining loops.
3736              Small scalling results in unnecesary precision loss.  Stay in
3737              the half of the (exponential) range.  */
3738           real_bb_freq_max = (uint64_t)1 << (profile_count::n_bits / 2);
3739           real_one_half = sreal (1, -1);
3740           real_inv_br_prob_base = sreal (1) / real_br_prob_base;
3741           real_almost_one = sreal (1) - real_inv_br_prob_base;
3742         }
3743
3744       mark_dfs_back_edges ();
3745
3746       single_succ_edge (ENTRY_BLOCK_PTR_FOR_FN (cfun))->probability =
3747          profile_probability::always ();
3748
3749       /* Set up block info for each basic block.  */
3750       alloc_aux_for_blocks (sizeof (block_info));
3751       alloc_aux_for_edges (sizeof (edge_prob_info));
3752       FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (cfun), NULL, next_bb)
3753         {
3754           edge e;
3755           edge_iterator ei;
3756
3757           FOR_EACH_EDGE (e, ei, bb->succs)
3758             {
3759               /* FIXME: Graphite is producing edges with no profile. Once
3760                  this is fixed, drop this.  */
3761               if (e->probability.initialized_p ())
3762                 EDGE_INFO (e)->back_edge_prob
3763                    = e->probability.to_reg_br_prob_base ();
3764               else
3765                 EDGE_INFO (e)->back_edge_prob = REG_BR_PROB_BASE / 2;
3766               EDGE_INFO (e)->back_edge_prob *= real_inv_br_prob_base;
3767             }
3768         }
3769
3770       /* First compute frequencies locally for each loop from innermost
3771          to outermost to examine frequencies for back edges.  */
3772       estimate_loops ();
3773
3774       freq_max = 0;
3775       FOR_EACH_BB_FN (bb, cfun)
3776         if (freq_max < BLOCK_INFO (bb)->frequency)
3777           freq_max = BLOCK_INFO (bb)->frequency;
3778
3779       freq_max = real_bb_freq_max / freq_max;
3780       if (freq_max < 16)
3781         freq_max = 16;
3782       profile_count ipa_count = ENTRY_BLOCK_PTR_FOR_FN (cfun)->count.ipa ();
3783       cfun->cfg->count_max = profile_count::uninitialized ();
3784       FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (cfun), NULL, next_bb)
3785         {
3786           sreal tmp = BLOCK_INFO (bb)->frequency * freq_max + real_one_half;
3787           profile_count count = profile_count::from_gcov_type (tmp.to_int ());
3788
3789           /* If we have profile feedback in which this function was never
3790              executed, then preserve this info.  */
3791           if (!(bb->count == profile_count::zero ()))
3792             bb->count = count.guessed_local ().combine_with_ipa_count (ipa_count);
3793           cfun->cfg->count_max = cfun->cfg->count_max.max (bb->count);
3794         }
3795
3796       free_aux_for_blocks ();
3797       free_aux_for_edges ();
3798     }
3799   compute_function_frequency ();
3800 }
3801
3802 /* Decide whether function is hot, cold or unlikely executed.  */
3803 void
3804 compute_function_frequency (void)
3805 {
3806   basic_block bb;
3807   struct cgraph_node *node = cgraph_node::get (current_function_decl);
3808
3809   if (DECL_STATIC_CONSTRUCTOR (current_function_decl)
3810       || MAIN_NAME_P (DECL_NAME (current_function_decl)))
3811     node->only_called_at_startup = true;
3812   if (DECL_STATIC_DESTRUCTOR (current_function_decl))
3813     node->only_called_at_exit = true;
3814
3815   if (profile_status_for_fn (cfun) != PROFILE_READ)
3816     {
3817       int flags = flags_from_decl_or_type (current_function_decl);
3818       if ((ENTRY_BLOCK_PTR_FOR_FN (cfun)->count.ipa_p ()
3819            && ENTRY_BLOCK_PTR_FOR_FN (cfun)->count.ipa() == profile_count::zero ())
3820           || lookup_attribute ("cold", DECL_ATTRIBUTES (current_function_decl))
3821              != NULL)
3822         {
3823           node->frequency = NODE_FREQUENCY_UNLIKELY_EXECUTED;
3824           warn_function_cold (current_function_decl);
3825         }
3826       else if (lookup_attribute ("hot", DECL_ATTRIBUTES (current_function_decl))
3827                != NULL)
3828         node->frequency = NODE_FREQUENCY_HOT;
3829       else if (flags & ECF_NORETURN)
3830         node->frequency = NODE_FREQUENCY_EXECUTED_ONCE;
3831       else if (MAIN_NAME_P (DECL_NAME (current_function_decl)))
3832         node->frequency = NODE_FREQUENCY_EXECUTED_ONCE;
3833       else if (DECL_STATIC_CONSTRUCTOR (current_function_decl)
3834                || DECL_STATIC_DESTRUCTOR (current_function_decl))
3835         node->frequency = NODE_FREQUENCY_EXECUTED_ONCE;
3836       return;
3837     }
3838
3839   node->frequency = NODE_FREQUENCY_UNLIKELY_EXECUTED;
3840   warn_function_cold (current_function_decl);
3841   if (ENTRY_BLOCK_PTR_FOR_FN (cfun)->count.ipa() == profile_count::zero ())
3842     return;
3843   FOR_EACH_BB_FN (bb, cfun)
3844     {
3845       if (maybe_hot_bb_p (cfun, bb))
3846         {
3847           node->frequency = NODE_FREQUENCY_HOT;
3848           return;
3849         }
3850       if (!probably_never_executed_bb_p (cfun, bb))
3851         node->frequency = NODE_FREQUENCY_NORMAL;
3852     }
3853 }
3854
3855 /* Build PREDICT_EXPR.  */
3856 tree
3857 build_predict_expr (enum br_predictor predictor, enum prediction taken)
3858 {
3859   tree t = build1 (PREDICT_EXPR, void_type_node,
3860                    build_int_cst (integer_type_node, predictor));
3861   SET_PREDICT_EXPR_OUTCOME (t, taken);
3862   return t;
3863 }
3864
3865 const char *
3866 predictor_name (enum br_predictor predictor)
3867 {
3868   return predictor_info[predictor].name;
3869 }
3870
3871 /* Predict branch probabilities and estimate profile of the tree CFG. */
3872
3873 namespace {
3874
3875 const pass_data pass_data_profile =
3876 {
3877   GIMPLE_PASS, /* type */
3878   "profile_estimate", /* name */
3879   OPTGROUP_NONE, /* optinfo_flags */
3880   TV_BRANCH_PROB, /* tv_id */
3881   PROP_cfg, /* properties_required */
3882   0, /* properties_provided */
3883   0, /* properties_destroyed */
3884   0, /* todo_flags_start */
3885   0, /* todo_flags_finish */
3886 };
3887
3888 class pass_profile : public gimple_opt_pass
3889 {
3890 public:
3891   pass_profile (gcc::context *ctxt)
3892     : gimple_opt_pass (pass_data_profile, ctxt)
3893   {}
3894
3895   /* opt_pass methods: */
3896   virtual bool gate (function *) { return flag_guess_branch_prob; }
3897   virtual unsigned int execute (function *);
3898
3899 }; // class pass_profile
3900
3901 unsigned int
3902 pass_profile::execute (function *fun)
3903 {
3904   unsigned nb_loops;
3905
3906   if (profile_status_for_fn (cfun) == PROFILE_GUESSED)
3907     return 0;
3908
3909   loop_optimizer_init (LOOPS_NORMAL);
3910   if (dump_file && (dump_flags & TDF_DETAILS))
3911     flow_loops_dump (dump_file, NULL, 0);
3912
3913   mark_irreducible_loops ();
3914
3915   nb_loops = number_of_loops (fun);
3916   if (nb_loops > 1)
3917     scev_initialize ();
3918
3919   tree_estimate_probability (false);
3920
3921   if (nb_loops > 1)
3922     scev_finalize ();
3923
3924   loop_optimizer_finalize ();
3925   if (dump_file && (dump_flags & TDF_DETAILS))
3926     gimple_dump_cfg (dump_file, dump_flags);
3927  if (profile_status_for_fn (fun) == PROFILE_ABSENT)
3928     profile_status_for_fn (fun) = PROFILE_GUESSED;
3929  if (dump_file && (dump_flags & TDF_DETAILS))
3930    {
3931      struct loop *loop;
3932      FOR_EACH_LOOP (loop, LI_FROM_INNERMOST)
3933        if (loop->header->count.initialized_p ())
3934          fprintf (dump_file, "Loop got predicted %d to iterate %i times.\n",
3935            loop->num,
3936            (int)expected_loop_iterations_unbounded (loop));
3937    }
3938   return 0;
3939 }
3940
3941 } // anon namespace
3942
3943 gimple_opt_pass *
3944 make_pass_profile (gcc::context *ctxt)
3945 {
3946   return new pass_profile (ctxt);
3947 }
3948
3949 /* Return true when PRED predictor should be removed after early
3950    tree passes.  Most of the predictors are beneficial to survive
3951    as early inlining can also distribute then into caller's bodies.  */
3952
3953 static bool
3954 strip_predictor_early (enum br_predictor pred)
3955 {
3956   switch (pred)
3957     {
3958     case PRED_TREE_EARLY_RETURN:
3959       return true;
3960     default:
3961       return false;
3962     }
3963 }
3964
3965 /* Get rid of all builtin_expect calls and GIMPLE_PREDICT statements
3966    we no longer need.  EARLY is set to true when called from early
3967    optimizations.  */
3968
3969 unsigned int
3970 strip_predict_hints (function *fun, bool early)
3971 {
3972   basic_block bb;
3973   gimple *ass_stmt;
3974   tree var;
3975   bool changed = false;
3976
3977   FOR_EACH_BB_FN (bb, fun)
3978     {
3979       gimple_stmt_iterator bi;
3980       for (bi = gsi_start_bb (bb); !gsi_end_p (bi);)
3981         {
3982           gimple *stmt = gsi_stmt (bi);
3983
3984           if (gimple_code (stmt) == GIMPLE_PREDICT)
3985             {
3986               if (!early
3987                   || strip_predictor_early (gimple_predict_predictor (stmt)))
3988                 {
3989                   gsi_remove (&bi, true);
3990                   changed = true;
3991                   continue;
3992                 }
3993             }
3994           else if (is_gimple_call (stmt))
3995             {
3996               tree fndecl = gimple_call_fndecl (stmt);
3997
3998               if (!early
3999                   && ((DECL_BUILT_IN_P (fndecl, BUILT_IN_NORMAL, BUILT_IN_EXPECT)
4000                        && gimple_call_num_args (stmt) == 2)
4001                       || (DECL_BUILT_IN_P (fndecl, BUILT_IN_NORMAL,
4002                                            BUILT_IN_EXPECT_WITH_PROBABILITY)
4003                           && gimple_call_num_args (stmt) == 3)
4004                       || (gimple_call_internal_p (stmt)
4005                           && gimple_call_internal_fn (stmt) == IFN_BUILTIN_EXPECT)))
4006                 {
4007                   var = gimple_call_lhs (stmt);
4008                   changed = true;
4009                   if (var)
4010                     {
4011                       ass_stmt
4012                         = gimple_build_assign (var, gimple_call_arg (stmt, 0));
4013                       gsi_replace (&bi, ass_stmt, true);
4014                     }
4015                   else
4016                     {
4017                       gsi_remove (&bi, true);
4018                       continue;
4019                     }
4020                 }
4021             }
4022           gsi_next (&bi);
4023         }
4024     }
4025   return changed ? TODO_cleanup_cfg : 0;
4026 }
4027
4028 namespace {
4029
4030 const pass_data pass_data_strip_predict_hints =
4031 {
4032   GIMPLE_PASS, /* type */
4033   "*strip_predict_hints", /* name */
4034   OPTGROUP_NONE, /* optinfo_flags */
4035   TV_BRANCH_PROB, /* tv_id */
4036   PROP_cfg, /* properties_required */
4037   0, /* properties_provided */
4038   0, /* properties_destroyed */
4039   0, /* todo_flags_start */
4040   0, /* todo_flags_finish */
4041 };
4042
4043 class pass_strip_predict_hints : public gimple_opt_pass
4044 {
4045 public:
4046   pass_strip_predict_hints (gcc::context *ctxt)
4047     : gimple_opt_pass (pass_data_strip_predict_hints, ctxt)
4048   {}
4049
4050   /* opt_pass methods: */
4051   opt_pass * clone () { return new pass_strip_predict_hints (m_ctxt); }
4052   void set_pass_param (unsigned int n, bool param)
4053     {
4054       gcc_assert (n == 0);
4055       early_p = param;
4056     }
4057
4058   virtual unsigned int execute (function *);
4059
4060 private:
4061   bool early_p;
4062
4063 }; // class pass_strip_predict_hints
4064
4065 unsigned int
4066 pass_strip_predict_hints::execute (function *fun)
4067 {
4068   return strip_predict_hints (fun, early_p);
4069 }
4070
4071 } // anon namespace
4072
4073 gimple_opt_pass *
4074 make_pass_strip_predict_hints (gcc::context *ctxt)
4075 {
4076   return new pass_strip_predict_hints (ctxt);
4077 }
4078
4079 /* Rebuild function frequencies.  Passes are in general expected to
4080    maintain profile by hand, however in some cases this is not possible:
4081    for example when inlining several functions with loops freuqencies might run
4082    out of scale and thus needs to be recomputed.  */
4083
4084 void
4085 rebuild_frequencies (void)
4086 {
4087   timevar_push (TV_REBUILD_FREQUENCIES);
4088
4089   /* When the max bb count in the function is small, there is a higher
4090      chance that there were truncation errors in the integer scaling
4091      of counts by inlining and other optimizations. This could lead
4092      to incorrect classification of code as being cold when it isn't.
4093      In that case, force the estimation of bb counts/frequencies from the
4094      branch probabilities, rather than computing frequencies from counts,
4095      which may also lead to frequencies incorrectly reduced to 0. There
4096      is less precision in the probabilities, so we only do this for small
4097      max counts.  */
4098   cfun->cfg->count_max = profile_count::uninitialized ();
4099   basic_block bb;
4100   FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (cfun), NULL, next_bb)
4101     cfun->cfg->count_max = cfun->cfg->count_max.max (bb->count);
4102
4103   if (profile_status_for_fn (cfun) == PROFILE_GUESSED)
4104     {
4105       loop_optimizer_init (0);
4106       add_noreturn_fake_exit_edges ();
4107       mark_irreducible_loops ();
4108       connect_infinite_loops_to_exit ();
4109       estimate_bb_frequencies (true);
4110       remove_fake_exit_edges ();
4111       loop_optimizer_finalize ();
4112     }
4113   else if (profile_status_for_fn (cfun) == PROFILE_READ)
4114     update_max_bb_count ();
4115   else if (profile_status_for_fn (cfun) == PROFILE_ABSENT
4116            && !flag_guess_branch_prob)
4117     ;
4118   else
4119     gcc_unreachable ();
4120   timevar_pop (TV_REBUILD_FREQUENCIES);
4121 }
4122
4123 /* Perform a dry run of the branch prediction pass and report comparsion of
4124    the predicted and real profile into the dump file.  */
4125
4126 void
4127 report_predictor_hitrates (void)
4128 {
4129   unsigned nb_loops;
4130
4131   loop_optimizer_init (LOOPS_NORMAL);
4132   if (dump_file && (dump_flags & TDF_DETAILS))
4133     flow_loops_dump (dump_file, NULL, 0);
4134
4135   mark_irreducible_loops ();
4136
4137   nb_loops = number_of_loops (cfun);
4138   if (nb_loops > 1)
4139     scev_initialize ();
4140
4141   tree_estimate_probability (true);
4142
4143   if (nb_loops > 1)
4144     scev_finalize ();
4145
4146   loop_optimizer_finalize ();
4147 }
4148
4149 /* Force edge E to be cold.
4150    If IMPOSSIBLE is true, for edge to have count and probability 0 otherwise
4151    keep low probability to represent possible error in a guess.  This is used
4152    i.e. in case we predict loop to likely iterate given number of times but
4153    we are not 100% sure.
4154
4155    This function locally updates profile without attempt to keep global
4156    consistency which can not be reached in full generality without full profile
4157    rebuild from probabilities alone.  Doing so is not necessarily a good idea
4158    because frequencies and counts may be more realistic then probabilities.
4159
4160    In some cases (such as for elimination of early exits during full loop
4161    unrolling) the caller can ensure that profile will get consistent
4162    afterwards.  */
4163
4164 void
4165 force_edge_cold (edge e, bool impossible)
4166 {
4167   profile_count count_sum = profile_count::zero ();
4168   profile_probability prob_sum = profile_probability::never ();
4169   edge_iterator ei;
4170   edge e2;
4171   bool uninitialized_exit = false;
4172
4173   /* When branch probability guesses are not known, then do nothing.  */
4174   if (!impossible && !e->count ().initialized_p ())
4175     return;
4176
4177   profile_probability goal = (impossible ? profile_probability::never ()
4178                               : profile_probability::very_unlikely ());
4179
4180   /* If edge is already improbably or cold, just return.  */
4181   if (e->probability <= goal
4182       && (!impossible || e->count () == profile_count::zero ()))
4183     return;
4184   FOR_EACH_EDGE (e2, ei, e->src->succs)
4185     if (e2 != e)
4186       {
4187         if (e->flags & EDGE_FAKE)
4188           continue;
4189         if (e2->count ().initialized_p ())
4190           count_sum += e2->count ();
4191         if (e2->probability.initialized_p ())
4192           prob_sum += e2->probability;
4193         else
4194           uninitialized_exit = true;
4195       }
4196
4197   /* If we are not guessing profiles but have some other edges out,
4198      just assume the control flow goes elsewhere.  */
4199   if (uninitialized_exit)
4200     e->probability = goal;
4201   /* If there are other edges out of e->src, redistribute probabilitity
4202      there.  */
4203   else if (prob_sum > profile_probability::never ())
4204     {
4205       if (!(e->probability < goal))
4206         e->probability = goal;
4207
4208       profile_probability prob_comp = prob_sum / e->probability.invert ();
4209
4210       if (dump_file && (dump_flags & TDF_DETAILS))
4211         fprintf (dump_file, "Making edge %i->%i %s by redistributing "
4212                  "probability to other edges.\n",
4213                  e->src->index, e->dest->index,
4214                  impossible ? "impossible" : "cold");
4215       FOR_EACH_EDGE (e2, ei, e->src->succs)
4216         if (e2 != e)
4217           {
4218             e2->probability /= prob_comp;
4219           }
4220       if (current_ir_type () != IR_GIMPLE
4221           && e->src != ENTRY_BLOCK_PTR_FOR_FN (cfun))
4222         update_br_prob_note (e->src);
4223     }
4224   /* If all edges out of e->src are unlikely, the basic block itself
4225      is unlikely.  */
4226   else
4227     {
4228       if (prob_sum == profile_probability::never ())
4229         e->probability = profile_probability::always ();
4230       else
4231         {
4232           if (impossible)
4233             e->probability = profile_probability::never ();
4234           /* If BB has some edges out that are not impossible, we can not
4235              assume that BB itself is.  */
4236           impossible = false;
4237         }
4238       if (current_ir_type () != IR_GIMPLE
4239           && e->src != ENTRY_BLOCK_PTR_FOR_FN (cfun))
4240         update_br_prob_note (e->src);
4241       if (e->src->count == profile_count::zero ())
4242         return;
4243       if (count_sum == profile_count::zero () && impossible)
4244         {
4245           bool found = false;
4246           if (e->src == ENTRY_BLOCK_PTR_FOR_FN (cfun))
4247             ;
4248           else if (current_ir_type () == IR_GIMPLE)
4249             for (gimple_stmt_iterator gsi = gsi_start_bb (e->src);
4250                  !gsi_end_p (gsi); gsi_next (&gsi))
4251               {
4252                 if (stmt_can_terminate_bb_p (gsi_stmt (gsi)))
4253                   {
4254                     found = true;
4255                     break;
4256                   }
4257               }
4258           /* FIXME: Implement RTL path.  */
4259           else
4260             found = true;
4261           if (!found)
4262             {
4263               if (dump_file && (dump_flags & TDF_DETAILS))
4264                 fprintf (dump_file,
4265                          "Making bb %i impossible and dropping count to 0.\n",
4266                          e->src->index);
4267               e->src->count = profile_count::zero ();
4268               FOR_EACH_EDGE (e2, ei, e->src->preds)
4269                 force_edge_cold (e2, impossible);
4270               return;
4271             }
4272         }
4273
4274       /* If we did not adjusting, the source basic block has no likely edeges
4275          leaving other direction. In that case force that bb cold, too.
4276          This in general is difficult task to do, but handle special case when
4277          BB has only one predecestor.  This is common case when we are updating
4278          after loop transforms.  */
4279       if (!(prob_sum > profile_probability::never ())
4280           && count_sum == profile_count::zero ()
4281           && single_pred_p (e->src) && e->src->count.to_frequency (cfun)
4282              > (impossible ? 0 : 1))
4283         {
4284           int old_frequency = e->src->count.to_frequency (cfun);
4285           if (dump_file && (dump_flags & TDF_DETAILS))
4286             fprintf (dump_file, "Making bb %i %s.\n", e->src->index,
4287                      impossible ? "impossible" : "cold");
4288           int new_frequency = MIN (e->src->count.to_frequency (cfun),
4289                                    impossible ? 0 : 1);
4290           if (impossible)
4291             e->src->count = profile_count::zero ();
4292           else
4293             e->src->count = e->count ().apply_scale (new_frequency,
4294                                                      old_frequency);
4295           force_edge_cold (single_pred_edge (e->src), impossible);
4296         }
4297       else if (dump_file && (dump_flags & TDF_DETAILS)
4298                && maybe_hot_bb_p (cfun, e->src))
4299         fprintf (dump_file, "Giving up on making bb %i %s.\n", e->src->index,
4300                  impossible ? "impossible" : "cold");
4301     }
4302 }
4303
#if CHECKING_P

namespace selftest {

/* Name and hit rate of one predictor, as listed in predict.def.  */

struct branch_predictor
{
  const char *name;
  int probability;
};

#define DEF_PREDICTOR(ENUM, NAME, HITRATE, FLAGS) { NAME, HITRATE },

/* Test that the predictor values defined in predict.def, converted to an
   integer percentage of REG_BR_PROB_BASE, lie within the range [50, 100].
   Predictors whose value is PROB_UNINITIALIZED are skipped.  */

static void
test_prediction_value_range ()
{
  /* The table is terminated by an entry with a NULL name.  */
  branch_predictor predictors[] = {
#include "predict.def"
    { NULL, PROB_UNINITIALIZED }
  };

  for (const branch_predictor *pred = predictors; pred->name != NULL; pred++)
    {
      if (pred->probability == PROB_UNINITIALIZED)
        continue;

      unsigned p = 100 * pred->probability / REG_BR_PROB_BASE;
      ASSERT_TRUE (p >= 50 && p <= 100);
    }
}

#undef DEF_PREDICTOR

/* Run all of the selftests within this file.  */

void
predict_c_tests ()
{
  test_prediction_value_range ();
}

} // namespace selftest
#endif /* CHECKING_P.  */