gcc/predict.c

   1 /* Branch prediction routines for the GNU compiler.
   2    Copyright (C) 2000-2017 Free Software Foundation, Inc.
   3
   4 This file is part of GCC.
   5
   6 GCC is free software; you can redistribute it and/or modify it under
   7 the terms of the GNU General Public License as published by the Free
   8 Software Foundation; either version 3, or (at your option) any later
   9 version.
  10
  11 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  13 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  14 for more details.
  15
  16 You should have received a copy of the GNU General Public License
  17 along with GCC; see the file COPYING3.  If not see
  18 <http://www.gnu.org/licenses/>.  */
  19
  20 /* References:
  21
  22    [1] "Branch Prediction for Free"
  23        Ball and Larus; PLDI '93.
  24    [2] "Static Branch Frequency and Program Profile Analysis"
  25        Wu and Larus; MICRO-27.
  26    [3] "Corpus-based Static Branch Prediction"
  27        Calder, Grunwald, Lindsay, Martin, Mozer, and Zorn; PLDI '95.  */
  28
  29
  30 #include "config.h"
  31 #include "system.h"
  32 #include "coretypes.h"
  33 #include "backend.h"
  34 #include "rtl.h"
  35 #include "tree.h"
  36 #include "gimple.h"
  37 #include "cfghooks.h"
  38 #include "tree-pass.h"
  39 #include "ssa.h"
  40 #include "memmodel.h"
  41 #include "emit-rtl.h"
  42 #include "cgraph.h"
  43 #include "coverage.h"
  44 #include "diagnostic-core.h"
  45 #include "gimple-predict.h"
  46 #include "fold-const.h"
  47 #include "calls.h"
  48 #include "cfganal.h"
  49 #include "profile.h"
  50 #include "sreal.h"
  51 #include "params.h"
  52 #include "cfgloop.h"
  53 #include "gimple-iterator.h"
  54 #include "tree-cfg.h"
  55 #include "tree-ssa-loop-niter.h"
  56 #include "tree-ssa-loop.h"
  57 #include "tree-scalar-evolution.h"
  58 #include "ipa-utils.h"
  59 #include "gimple-pretty-print.h"
  60 #include "selftest.h"
  61 #include "cfgrtl.h"
  62
  63 /* Enum with reasons why a predictor is ignored.  */
  64
  65 enum predictor_reason
  66 {
  67   REASON_NONE,
  68   REASON_IGNORED,
  69   REASON_SINGLE_EDGE_DUPLICATE,
  70   REASON_EDGE_PAIR_DUPLICATE
  71 };
  72
  73 /* String messages for the aforementioned enum.  */
  74
  75 static const char *reason_messages[] = {"", " (ignored)",
  76     " (single edge duplicate)", " (edge pair duplicate)"};
  77
  78 /* real constants: 0, 1, 1-1/REG_BR_PROB_BASE, REG_BR_PROB_BASE,
  79                    1/REG_BR_PROB_BASE, 0.5, BB_FREQ_MAX.  */
  80 static sreal real_almost_one, real_br_prob_base,
  81              real_inv_br_prob_base, real_one_half, real_bb_freq_max;
  82
  83 static void combine_predictions_for_insn (rtx_insn *, basic_block);
  84 static void dump_prediction (FILE *, enum br_predictor, int, basic_block,
  85                              enum predictor_reason, edge);
  86 static void predict_paths_leading_to (basic_block, enum br_predictor,
  87                                       enum prediction,
  88                                       struct loop *in_loop = NULL);
  89 static void predict_paths_leading_to_edge (edge, enum br_predictor,
  90                                            enum prediction,
  91                                            struct loop *in_loop = NULL);
  92 static bool can_predict_insn_p (const rtx_insn *);
  93
  94 /* Information we hold about each branch predictor.
  95    Filled using information from predict.def.  */
  96
  97 struct predictor_info
  98 {
  99   const char *const name;       /* Name used in the debugging dumps.  */
 100   const int hitrate;            /* Expected hitrate used by
 101                                    predict_insn_def call.  */
 102   const int flags;
 103 };
 104
 105 /* Use given predictor without Dempster-Shaffer theory if it matches
 106    using first_match heuristics.  */
 107 #define PRED_FLAG_FIRST_MATCH 1
 108
 109 /* Recompute hitrate in percent to our representation.  */
 110
 111 #define HITRATE(VAL) ((int) ((VAL) * REG_BR_PROB_BASE + 50) / 100)
 112
 113 #define DEF_PREDICTOR(ENUM, NAME, HITRATE, FLAGS) {NAME, HITRATE, FLAGS},
 114 static const struct predictor_info predictor_info[]= {
 115 #include "predict.def"
 116
 117   /* Upper bound on predictors.  */
 118   {NULL, 0, 0}
 119 };
 120 #undef DEF_PREDICTOR
 121
 122 /* Return TRUE if frequency FREQ is considered to be hot.  */
 123
 124 static inline bool
 125 maybe_hot_frequency_p (struct function *fun, int freq)
 126 {
 127   struct cgraph_node *node = cgraph_node::get (fun->decl);
 128   if (!profile_info || profile_status_for_fn (fun) != PROFILE_READ)
 129     {
 130       if (node->frequency == NODE_FREQUENCY_UNLIKELY_EXECUTED)
 131         return false;
 132       if (node->frequency == NODE_FREQUENCY_HOT)
 133         return true;
 134     }
 135   if (profile_status_for_fn (fun) == PROFILE_ABSENT)
 136     return true;
 137   if (node->frequency == NODE_FREQUENCY_EXECUTED_ONCE
 138       && freq < (ENTRY_BLOCK_PTR_FOR_FN (fun)->frequency * 2 / 3))
 139     return false;
 140   if (PARAM_VALUE (HOT_BB_FREQUENCY_FRACTION) == 0)
 141     return false;
 142   if (freq * PARAM_VALUE (HOT_BB_FREQUENCY_FRACTION)
 143       < ENTRY_BLOCK_PTR_FOR_FN (fun)->frequency)
 144     return false;
 145   return true;
 146 }
 147
 148 static gcov_type min_count = -1;
 149
 150 /* Determine the threshold for hot BB counts.  */
 151
 152 gcov_type
 153 get_hot_bb_threshold ()
 154 {
 155   gcov_working_set_t *ws;
 156   if (min_count == -1)
 157     {
 158       ws = find_working_set (PARAM_VALUE (HOT_BB_COUNT_WS_PERMILLE));
 159       gcc_assert (ws);
 160       min_count = ws->min_counter;
 161     }
 162   return min_count;
 163 }
 164
 165 /* Set the threshold for hot BB counts.  */
 166
 167 void
 168 set_hot_bb_threshold (gcov_type min)
 169 {
 170   min_count = min;
 171 }
 172
 173 /* Return TRUE if frequency FREQ is considered to be hot.  */
 174
 175 bool
 176 maybe_hot_count_p (struct function *, profile_count count)
 177 {
 178   if (!count.initialized_p ())
 179     return true;
 180   /* Code executed at most once is not hot.  */
 181   if (count <= MAX (profile_info ? profile_info->runs : 1, 1))
 182     return false;
 183   return (count.to_gcov_type () >= get_hot_bb_threshold ());
 184 }
 185
 186 /* Return true in case BB can be CPU intensive and should be optimized
 187    for maximal performance.  */
 188
 189 bool
 190 maybe_hot_bb_p (struct function *fun, const_basic_block bb)
 191 {
 192   gcc_checking_assert (fun);
 193   if (!maybe_hot_count_p (fun, bb->count))
 194     return false;
 195   return maybe_hot_frequency_p (fun, bb->frequency);
 196 }
 197
 198 /* Return true in case BB can be CPU intensive and should be optimized
 199    for maximal performance.  */
 200
 201 bool
 202 maybe_hot_edge_p (edge e)
 203 {
 204   if (!maybe_hot_count_p (cfun, e->count))
 205     return false;
 206   return maybe_hot_frequency_p (cfun, EDGE_FREQUENCY (e));
 207 }
 208
 209 /* Return true if profile COUNT and FREQUENCY, or function FUN static
 210    node frequency reflects never being executed.  */
 211
 212 static bool
 213 probably_never_executed (struct function *fun,
 214                          profile_count count, int)
 215 {
 216   gcc_checking_assert (fun);
 217   if (count == profile_count::zero ())
 218     return true;
 219   if (count.initialized_p () && profile_status_for_fn (fun) == PROFILE_READ)
 220     {
 221       int unlikely_count_fraction = PARAM_VALUE (UNLIKELY_BB_COUNT_FRACTION);
 222       if (count.apply_scale (unlikely_count_fraction, 1) >= profile_info->runs)
 223         return false;
 224       return true;
 225     }
 226   if ((!profile_info || profile_status_for_fn (fun) != PROFILE_READ)
 227       && (cgraph_node::get (fun->decl)->frequency
 228           == NODE_FREQUENCY_UNLIKELY_EXECUTED))
 229     return true;
 230   return false;
 231 }
 232
 233
 234 /* Return true in case BB is probably never executed.  */
 235
 236 bool
 237 probably_never_executed_bb_p (struct function *fun, const_basic_block bb)
 238 {
 239   return probably_never_executed (fun, bb->count, bb->frequency);
 240 }
 241
 242
 243 /* Return true if E is unlikely executed for obvious reasons.  */
 244
 245 static bool
 246 unlikely_executed_edge_p (edge e)
 247 {
 248   return (e->count == profile_count::zero ()
 249           || e->probability == profile_probability::never ())
 250          || (e->flags & (EDGE_EH | EDGE_FAKE));
 251 }
 252
 253 /* Return true in case edge E is probably never executed.  */
 254
 255 bool
 256 probably_never_executed_edge_p (struct function *fun, edge e)
 257 {
 258   if (unlikely_executed_edge_p (e))
 259     return true;
 260   return probably_never_executed (fun, e->count, EDGE_FREQUENCY (e));
 261 }
 262
 263 /* Return true when current function should always be optimized for size.  */
 264
 265 bool
 266 optimize_function_for_size_p (struct function *fun)
 267 {
 268   if (!fun || !fun->decl)
 269     return optimize_size;
 270   cgraph_node *n = cgraph_node::get (fun->decl);
 271   return n && n->optimize_for_size_p ();
 272 }
 273
 274 /* Return true when current function should always be optimized for speed.  */
 275
 276 bool
 277 optimize_function_for_speed_p (struct function *fun)
 278 {
 279   return !optimize_function_for_size_p (fun);
 280 }
 281
 282 /* Return the optimization type that should be used for the function FUN.  */
 283
 284 optimization_type
 285 function_optimization_type (struct function *fun)
 286 {
 287   return (optimize_function_for_speed_p (fun)
 288           ? OPTIMIZE_FOR_SPEED
 289           : OPTIMIZE_FOR_SIZE);
 290 }
 291
 292 /* Return TRUE when BB should be optimized for size.  */
 293
 294 bool
 295 optimize_bb_for_size_p (const_basic_block bb)
 296 {
 297   return (optimize_function_for_size_p (cfun)
 298           || (bb && !maybe_hot_bb_p (cfun, bb)));
 299 }
 300
 301 /* Return TRUE when BB should be optimized for speed.  */
 302
 303 bool
 304 optimize_bb_for_speed_p (const_basic_block bb)
 305 {
 306   return !optimize_bb_for_size_p (bb);
 307 }
 308
 309 /* Return the optimization type that should be used for block BB.  */
 310
 311 optimization_type
 312 bb_optimization_type (const_basic_block bb)
 313 {
 314   return (optimize_bb_for_speed_p (bb)
 315           ? OPTIMIZE_FOR_SPEED
 316           : OPTIMIZE_FOR_SIZE);
 317 }
 318
 319 /* Return TRUE when BB should be optimized for size.  */
 320
 321 bool
 322 optimize_edge_for_size_p (edge e)
 323 {
 324   return optimize_function_for_size_p (cfun) || !maybe_hot_edge_p (e);
 325 }
 326
 327 /* Return TRUE when BB should be optimized for speed.  */
 328
 329 bool
 330 optimize_edge_for_speed_p (edge e)
 331 {
 332   return !optimize_edge_for_size_p (e);
 333 }
 334
 335 /* Return TRUE when BB should be optimized for size.  */
 336
 337 bool
 338 optimize_insn_for_size_p (void)
 339 {
 340   return optimize_function_for_size_p (cfun) || !crtl->maybe_hot_insn_p;
 341 }
 342
 343 /* Return TRUE when BB should be optimized for speed.  */
 344
 345 bool
 346 optimize_insn_for_speed_p (void)
 347 {
 348   return !optimize_insn_for_size_p ();
 349 }
 350
 351 /* Return TRUE when LOOP should be optimized for size.  */
 352
 353 bool
 354 optimize_loop_for_size_p (struct loop *loop)
 355 {
 356   return optimize_bb_for_size_p (loop->header);
 357 }
 358
 359 /* Return TRUE when LOOP should be optimized for speed.  */
 360
 361 bool
 362 optimize_loop_for_speed_p (struct loop *loop)
 363 {
 364   return optimize_bb_for_speed_p (loop->header);
 365 }
 366
 367 /* Return TRUE when LOOP nest should be optimized for speed.  */
 368
 369 bool
 370 optimize_loop_nest_for_speed_p (struct loop *loop)
 371 {
 372   struct loop *l = loop;
 373   if (optimize_loop_for_speed_p (loop))
 374     return true;
 375   l = loop->inner;
 376   while (l && l != loop)
 377     {
 378       if (optimize_loop_for_speed_p (l))
 379         return true;
 380       if (l->inner)
 381         l = l->inner;
 382       else if (l->next)
 383         l = l->next;
 384       else
 385         {
 386           while (l != loop && !l->next)
 387             l = loop_outer (l);
 388           if (l != loop)
 389             l = l->next;
 390         }
 391     }
 392   return false;
 393 }
 394
 395 /* Return TRUE when LOOP nest should be optimized for size.  */
 396
 397 bool
 398 optimize_loop_nest_for_size_p (struct loop *loop)
 399 {
 400   return !optimize_loop_nest_for_speed_p (loop);
 401 }
 402
 403 /* Return true when edge E is likely to be well predictable by branch
 404    predictor.  */
 405
 406 bool
 407 predictable_edge_p (edge e)
 408 {
 409   if (!e->probability.initialized_p ())
 410     return false;
 411   if ((e->probability.to_reg_br_prob_base ()
 412        <= PARAM_VALUE (PARAM_PREDICTABLE_BRANCH_OUTCOME) * REG_BR_PROB_BASE / 100)
 413       || (REG_BR_PROB_BASE - e->probability.to_reg_br_prob_base ()
 414           <= PARAM_VALUE (PARAM_PREDICTABLE_BRANCH_OUTCOME) * REG_BR_PROB_BASE / 100))
 415     return true;
 416   return false;
 417 }
 418
 419
 420 /* Set RTL expansion for BB profile.  */
 421
 422 void
 423 rtl_profile_for_bb (basic_block bb)
 424 {
 425   crtl->maybe_hot_insn_p = maybe_hot_bb_p (cfun, bb);
 426 }
 427
 428 /* Set RTL expansion for edge profile.  */
 429
 430 void
 431 rtl_profile_for_edge (edge e)
 432 {
 433   crtl->maybe_hot_insn_p = maybe_hot_edge_p (e);
 434 }
 435
 436 /* Set RTL expansion to default mode (i.e. when profile info is not known).  */
 437 void
 438 default_rtl_profile (void)
 439 {
 440   crtl->maybe_hot_insn_p = true;
 441 }
 442
 443 /* Return true if the one of outgoing edges is already predicted by
 444    PREDICTOR.  */
 445
 446 bool
 447 rtl_predicted_by_p (const_basic_block bb, enum br_predictor predictor)
 448 {
 449   rtx note;
 450   if (!INSN_P (BB_END (bb)))
 451     return false;
 452   for (note = REG_NOTES (BB_END (bb)); note; note = XEXP (note, 1))
 453     if (REG_NOTE_KIND (note) == REG_BR_PRED
 454         && INTVAL (XEXP (XEXP (note, 0), 0)) == (int)predictor)
 455       return true;
 456   return false;
 457 }
 458
 459 /*  Structure representing predictions in tree level. */
 460
 461 struct edge_prediction {
 462     struct edge_prediction *ep_next;
 463     edge ep_edge;
 464     enum br_predictor ep_predictor;
 465     int ep_probability;
 466 };
 467
 468 /* This map contains for a basic block the list of predictions for the
 469    outgoing edges.  */
 470
 471 static hash_map<const_basic_block, edge_prediction *> *bb_predictions;
 472
 473 /* Return true if the one of outgoing edges is already predicted by
 474    PREDICTOR.  */
 475
 476 bool
 477 gimple_predicted_by_p (const_basic_block bb, enum br_predictor predictor)
 478 {
 479   struct edge_prediction *i;
 480   edge_prediction **preds = bb_predictions->get (bb);
 481
 482   if (!preds)
 483     return false;
 484
 485   for (i = *preds; i; i = i->ep_next)
 486     if (i->ep_predictor == predictor)
 487       return true;
 488   return false;
 489 }
 490
 491 /* Return true if the one of outgoing edges is already predicted by
 492    PREDICTOR for edge E predicted as TAKEN.  */
 493
 494 bool
 495 edge_predicted_by_p (edge e, enum br_predictor predictor, bool taken)
 496 {
 497   struct edge_prediction *i;
 498   basic_block bb = e->src;
 499   edge_prediction **preds = bb_predictions->get (bb);
 500   if (!preds)
 501     return false;
 502
 503   int probability = predictor_info[(int) predictor].hitrate;
 504
 505   if (taken != TAKEN)
 506     probability = REG_BR_PROB_BASE - probability;
 507
 508   for (i = *preds; i; i = i->ep_next)
 509     if (i->ep_predictor == predictor
 510         && i->ep_edge == e
 511         && i->ep_probability == probability)
 512       return true;
 513   return false;
 514 }
 515
 516 /* Same predicate as above, working on edges.  */
 517 bool
 518 edge_probability_reliable_p (const_edge e)
 519 {
 520   return e->probability.probably_reliable_p ();
 521 }
 522
 523 /* Same predicate as edge_probability_reliable_p, working on notes.  */
 524 bool
 525 br_prob_note_reliable_p (const_rtx note)
 526 {
 527   gcc_assert (REG_NOTE_KIND (note) == REG_BR_PROB);
 528   return profile_probability::from_reg_br_prob_note
 529                  (XINT (note, 0)).probably_reliable_p ();
 530 }
 531
 532 static void
 533 predict_insn (rtx_insn *insn, enum br_predictor predictor, int probability)
 534 {
 535   gcc_assert (any_condjump_p (insn));
 536   if (!flag_guess_branch_prob)
 537     return;
 538
 539   add_reg_note (insn, REG_BR_PRED,
 540                 gen_rtx_CONCAT (VOIDmode,
 541                                 GEN_INT ((int) predictor),
 542                                 GEN_INT ((int) probability)));
 543 }
 544
 545 /* Predict insn by given predictor.  */
 546
 547 void
 548 predict_insn_def (rtx_insn *insn, enum br_predictor predictor,
 549                   enum prediction taken)
 550 {
 551    int probability = predictor_info[(int) predictor].hitrate;
 552
 553    if (taken != TAKEN)
 554      probability = REG_BR_PROB_BASE - probability;
 555
 556    predict_insn (insn, predictor, probability);
 557 }
 558
 559 /* Predict edge E with given probability if possible.  */
 560
 561 void
 562 rtl_predict_edge (edge e, enum br_predictor predictor, int probability)
 563 {
 564   rtx_insn *last_insn;
 565   last_insn = BB_END (e->src);
 566
 567   /* We can store the branch prediction information only about
 568      conditional jumps.  */
 569   if (!any_condjump_p (last_insn))
 570     return;
 571
 572   /* We always store probability of branching.  */
 573   if (e->flags & EDGE_FALLTHRU)
 574     probability = REG_BR_PROB_BASE - probability;
 575
 576   predict_insn (last_insn, predictor, probability);
 577 }
 578
 579 /* Predict edge E with the given PROBABILITY.  */
 580 void
 581 gimple_predict_edge (edge e, enum br_predictor predictor, int probability)
 582 {
 583   if (e->src != ENTRY_BLOCK_PTR_FOR_FN (cfun)
 584       && EDGE_COUNT (e->src->succs) > 1
 585       && flag_guess_branch_prob
 586       && optimize)
 587     {
 588       struct edge_prediction *i = XNEW (struct edge_prediction);
 589       edge_prediction *&preds = bb_predictions->get_or_insert (e->src);
 590
 591       i->ep_next = preds;
 592       preds = i;
 593       i->ep_probability = probability;
 594       i->ep_predictor = predictor;
 595       i->ep_edge = e;
 596     }
 597 }
 598
 599 /* Filter edge predictions PREDS by a function FILTER.  DATA are passed
 600    to the filter function.  */
 601
 602 void
 603 filter_predictions (edge_prediction **preds,
 604                     bool (*filter) (edge_prediction *, void *), void *data)
 605 {
 606   if (!bb_predictions)
 607     return;
 608
 609   if (preds)
 610     {
 611       struct edge_prediction **prediction = preds;
 612       struct edge_prediction *next;
 613
 614       while (*prediction)
 615         {
 616           if ((*filter) (*prediction, data))
 617             prediction = &((*prediction)->ep_next);
 618           else
 619             {
 620               next = (*prediction)->ep_next;
 621               free (*prediction);
 622               *prediction = next;
 623             }
 624         }
 625     }
 626 }
 627
 628 /* Filter function predicate that returns true for a edge predicate P
 629    if its edge is equal to DATA.  */
 630
 631 bool
 632 equal_edge_p (edge_prediction *p, void *data)
 633 {
 634   return p->ep_edge == (edge)data;
 635 }
 636
 637 /* Remove all predictions on given basic block that are attached
 638    to edge E.  */
 639 void
 640 remove_predictions_associated_with_edge (edge e)
 641 {
 642   if (!bb_predictions)
 643     return;
 644
 645   edge_prediction **preds = bb_predictions->get (e->src);
 646   filter_predictions (preds, equal_edge_p, e);
 647 }
 648
 649 /* Clears the list of predictions stored for BB.  */
 650
 651 static void
 652 clear_bb_predictions (basic_block bb)
 653 {
 654   edge_prediction **preds = bb_predictions->get (bb);
 655   struct edge_prediction *pred, *next;
 656
 657   if (!preds)
 658     return;
 659
 660   for (pred = *preds; pred; pred = next)
 661     {
 662       next = pred->ep_next;
 663       free (pred);
 664     }
 665   *preds = NULL;
 666 }
 667
 668 /* Return true when we can store prediction on insn INSN.
 669    At the moment we represent predictions only on conditional
 670    jumps, not at computed jump or other complicated cases.  */
 671 static bool
 672 can_predict_insn_p (const rtx_insn *insn)
 673 {
 674   return (JUMP_P (insn)
 675           && any_condjump_p (insn)
 676           && EDGE_COUNT (BLOCK_FOR_INSN (insn)->succs) >= 2);
 677 }
 678
 679 /* Predict edge E by given predictor if possible.  */
 680
 681 void
 682 predict_edge_def (edge e, enum br_predictor predictor,
 683                   enum prediction taken)
 684 {
 685    int probability = predictor_info[(int) predictor].hitrate;
 686
 687    if (taken != TAKEN)
 688      probability = REG_BR_PROB_BASE - probability;
 689
 690    predict_edge (e, predictor, probability);
 691 }
 692
 693 /* Invert all branch predictions or probability notes in the INSN.  This needs
 694    to be done each time we invert the condition used by the jump.  */
 695
 696 void
 697 invert_br_probabilities (rtx insn)
 698 {
 699   rtx note;
 700
 701   for (note = REG_NOTES (insn); note; note = XEXP (note, 1))
 702     if (REG_NOTE_KIND (note) == REG_BR_PROB)
 703       XINT (note, 0) = profile_probability::from_reg_br_prob_note
 704                          (XINT (note, 0)).invert ().to_reg_br_prob_note ();
 705     else if (REG_NOTE_KIND (note) == REG_BR_PRED)
 706       XEXP (XEXP (note, 0), 1)
 707         = GEN_INT (REG_BR_PROB_BASE - INTVAL (XEXP (XEXP (note, 0), 1)));
 708 }
 709
 710 /* Dump information about the branch prediction to the output file.  */
 711
 712 static void
 713 dump_prediction (FILE *file, enum br_predictor predictor, int probability,
 714                  basic_block bb, enum predictor_reason reason = REASON_NONE,
 715                  edge ep_edge = NULL)
 716 {
 717   edge e = ep_edge;
 718   edge_iterator ei;
 719
 720   if (!file)
 721     return;
 722
 723   if (e == NULL)
 724     FOR_EACH_EDGE (e, ei, bb->succs)
 725       if (! (e->flags & EDGE_FALLTHRU))
 726         break;
 727
 728   char edge_info_str[128];
 729   if (ep_edge)
 730     sprintf (edge_info_str, " of edge %d->%d", ep_edge->src->index,
 731              ep_edge->dest->index);
 732   else
 733     edge_info_str[0] = '\0';
 734
 735   fprintf (file, "  %s heuristics%s%s: %.1f%%",
 736            predictor_info[predictor].name,
 737            edge_info_str, reason_messages[reason],
 738            probability * 100.0 / REG_BR_PROB_BASE);
 739
 740   if (bb->count.initialized_p ())
 741     {
 742       fprintf (file, "  exec ");
 743       bb->count.dump (file);
 744       if (e)
 745         {
 746           fprintf (file, " hit ");
 747           e->count.dump (file);
 748           fprintf (file, " (%.1f%%)", e->count.to_gcov_type() * 100.0
 749                    / bb->count.to_gcov_type ());
 750         }
 751     }
 752
 753   fprintf (file, "\n");
 754 }
 755
 756 /* Return true if STMT is known to be unlikely executed.  */
 757
 758 static bool
 759 unlikely_executed_stmt_p (gimple *stmt)
 760 {
 761   if (!is_gimple_call (stmt))
 762     return false;
 763   /* NORETURN attribute alone is not strong enough: exit() may be quite
 764      likely executed once during program run.  */
 765   if (gimple_call_fntype (stmt)
 766       && lookup_attribute ("cold",
 767                            TYPE_ATTRIBUTES (gimple_call_fntype (stmt)))
 768       && !lookup_attribute ("cold", DECL_ATTRIBUTES (current_function_decl)))
 769     return true;
 770   tree decl = gimple_call_fndecl (stmt);
 771   if (!decl)
 772     return false;
 773   if (lookup_attribute ("cold", DECL_ATTRIBUTES (decl))
 774       && !lookup_attribute ("cold", DECL_ATTRIBUTES (current_function_decl)))
 775     return true;
 776
 777   cgraph_node *n = cgraph_node::get (decl);
 778   if (!n)
 779     return false;
 780
 781   availability avail;
 782   n = n->ultimate_alias_target (&avail);
 783   if (avail < AVAIL_AVAILABLE)
 784     return false;
 785   if (!n->analyzed
 786       || n->decl == current_function_decl)
 787     return false;
 788   return n->frequency == NODE_FREQUENCY_UNLIKELY_EXECUTED;
 789 }
 790
 791 /* Return true if BB is unlikely executed.  */
 792
 793 static bool
 794 unlikely_executed_bb_p (basic_block bb)
 795 {
 796   if (bb->count == profile_count::zero ())
 797     return true;
 798   if (bb == ENTRY_BLOCK_PTR_FOR_FN (cfun) || bb == EXIT_BLOCK_PTR_FOR_FN (cfun))
 799     return false;
 800   for (gimple_stmt_iterator gsi = gsi_start_bb (bb);
 801        !gsi_end_p (gsi); gsi_next (&gsi))
 802     {
 803       if (unlikely_executed_stmt_p (gsi_stmt (gsi)))
 804         return true;
 805       if (stmt_can_terminate_bb_p (gsi_stmt (gsi)))
 806         return false;
 807     }
 808   return false;
 809 }
 810
 811 /* We can not predict the probabilities of outgoing edges of bb.  Set them
 812    evenly and hope for the best.  If UNLIKELY_EDGES is not null, distribute
 813    even probability for all edges not mentioned in the set.  These edges
 814    are given PROB_VERY_UNLIKELY probability.  */
 815
 816 static void
 817 set_even_probabilities (basic_block bb,
 818                         hash_set<edge> *unlikely_edges = NULL)
 819 {
 820   unsigned nedges = 0, unlikely_count = 0;
 821   edge e = NULL;
 822   edge_iterator ei;
 823   profile_probability all = profile_probability::always ();
 824
 825   FOR_EACH_EDGE (e, ei, bb->succs)
 826     if (e->probability.initialized_p ())
 827       all -= e->probability;
 828     else if (!unlikely_executed_edge_p (e))
 829       {
 830         nedges ++;
 831         if (unlikely_edges != NULL && unlikely_edges->contains (e))
 832           {
 833             all -= profile_probability::very_unlikely ();
 834             unlikely_count++;
 835           }
 836       }
 837
 838   /* Make the distribution even if all edges are unlikely.  */
 839   if (unlikely_count == nedges)
 840     {
 841       unlikely_edges = NULL;
 842       unlikely_count = 0;
 843     }
 844
 845   unsigned c = nedges - unlikely_count;
 846
 847   FOR_EACH_EDGE (e, ei, bb->succs)
 848     if (e->probability.initialized_p ())
 849       ;
 850     else if (!unlikely_executed_edge_p (e))
 851       {
 852         if (unlikely_edges != NULL && unlikely_edges->contains (e))
 853           e->probability = profile_probability::very_unlikely ();
 854         else
 855           e->probability = all.apply_scale (1, c).guessed ();
 856       }
 857     else
 858       e->probability = profile_probability::never ();
 859 }
 860
 861 /* Add REG_BR_PROB note to JUMP with PROB.  */
 862
 863 void
 864 add_reg_br_prob_note (rtx_insn *jump, profile_probability prob)
 865 {
 866   gcc_checking_assert (JUMP_P (jump) && !find_reg_note (jump, REG_BR_PROB, 0));
 867   add_int_reg_note (jump, REG_BR_PROB, prob.to_reg_br_prob_note ());
 868 }
 869
 870 /* Combine all REG_BR_PRED notes into single probability and attach REG_BR_PROB
 871    note if not already present.  Remove now useless REG_BR_PRED notes.  */
 872
 873 static void
 874 combine_predictions_for_insn (rtx_insn *insn, basic_block bb)
 875 {
 876   rtx prob_note;
 877   rtx *pnote;
 878   rtx note;
 879   int best_probability = PROB_EVEN;
 880   enum br_predictor best_predictor = END_PREDICTORS;
 881   int combined_probability = REG_BR_PROB_BASE / 2;
 882   int d;
 883   bool first_match = false;
 884   bool found = false;
 885
 886   if (!can_predict_insn_p (insn))
 887     {
 888       set_even_probabilities (bb);
 889       return;
 890     }
 891
 892   prob_note = find_reg_note (insn, REG_BR_PROB, 0);
 893   pnote = &REG_NOTES (insn);
 894   if (dump_file)
 895     fprintf (dump_file, "Predictions for insn %i bb %i\n", INSN_UID (insn),
 896              bb->index);
 897
 898   /* We implement "first match" heuristics and use probability guessed
 899      by predictor with smallest index.  */
 900   for (note = REG_NOTES (insn); note; note = XEXP (note, 1))
 901     if (REG_NOTE_KIND (note) == REG_BR_PRED)
 902       {
 903         enum br_predictor predictor = ((enum br_predictor)
 904                                        INTVAL (XEXP (XEXP (note, 0), 0)));
 905         int probability = INTVAL (XEXP (XEXP (note, 0), 1));
 906
 907         found = true;
 908         if (best_predictor > predictor
 909             && predictor_info[predictor].flags & PRED_FLAG_FIRST_MATCH)
 910           best_probability = probability, best_predictor = predictor;
 911
 912         d = (combined_probability * probability
 913              + (REG_BR_PROB_BASE - combined_probability)
 914              * (REG_BR_PROB_BASE - probability));
 915
 916         /* Use FP math to avoid overflows of 32bit integers.  */
 917         if (d == 0)
 918           /* If one probability is 0% and one 100%, avoid division by zero.  */
 919           combined_probability = REG_BR_PROB_BASE / 2;
 920         else
 921           combined_probability = (((double) combined_probability) * probability
 922                                   * REG_BR_PROB_BASE / d + 0.5);
 923       }
 924
 925   /* Decide which heuristic to use.  In case we didn't match anything,
 926      use no_prediction heuristic, in case we did match, use either
 927      first match or Dempster-Shaffer theory depending on the flags.  */
 928
 929   if (best_predictor != END_PREDICTORS)
 930     first_match = true;
 931
 932   if (!found)
 933     dump_prediction (dump_file, PRED_NO_PREDICTION,
 934                      combined_probability, bb);
 935   else
 936     {
 937       if (!first_match)
 938         dump_prediction (dump_file, PRED_DS_THEORY, combined_probability,
 939                          bb, !first_match ? REASON_NONE : REASON_IGNORED);
 940       else
 941         dump_prediction (dump_file, PRED_FIRST_MATCH, best_probability,
 942                          bb, first_match ? REASON_NONE : REASON_IGNORED);
 943     }
 944
 945   if (first_match)
 946     combined_probability = best_probability;
 947   dump_prediction (dump_file, PRED_COMBINED, combined_probability, bb);
 948
 949   while (*pnote)
 950     {
 951       if (REG_NOTE_KIND (*pnote) == REG_BR_PRED)
 952         {
 953           enum br_predictor predictor = ((enum br_predictor)
 954                                          INTVAL (XEXP (XEXP (*pnote, 0), 0)));
 955           int probability = INTVAL (XEXP (XEXP (*pnote, 0), 1));
 956
 957           dump_prediction (dump_file, predictor, probability, bb,
 958                            (!first_match || best_predictor == predictor)
 959                            ? REASON_NONE : REASON_IGNORED);
 960           *pnote = XEXP (*pnote, 1);
 961         }
 962       else
 963         pnote = &XEXP (*pnote, 1);
 964     }
 965
 966   if (!prob_note)
 967     {
 968       profile_probability p
 969          = profile_probability::from_reg_br_prob_base (combined_probability);
 970       add_reg_br_prob_note (insn, p);
 971
 972       /* Save the prediction into CFG in case we are seeing non-degenerated
 973          conditional jump.  */
 974       if (!single_succ_p (bb))
 975         {
 976           BRANCH_EDGE (bb)->probability = p;
 977           FALLTHRU_EDGE (bb)->probability
 978             = BRANCH_EDGE (bb)->probability.invert ();
 979         }
 980     }
 981   else if (!single_succ_p (bb))
 982     {
 983       profile_probability prob = profile_probability::from_reg_br_prob_note
 984                                         (XINT (prob_note, 0));
 985
 986       BRANCH_EDGE (bb)->probability = prob;
 987       FALLTHRU_EDGE (bb)->probability = prob.invert ();
 988     }
 989   else
 990     single_succ_edge (bb)->probability = profile_probability::always ();
 991 }
 992
 993 /* Edge prediction hash traits.  */
 994
 995 struct predictor_hash: pointer_hash <edge_prediction>
 996 {
 997
 998   static inline hashval_t hash (const edge_prediction *);
 999   static inline bool equal (const edge_prediction *, const edge_prediction *);
1000 };
1001
1002 /* Calculate hash value of an edge prediction P based on predictor and
1003    normalized probability.  */
1004
1005 inline hashval_t
1006 predictor_hash::hash (const edge_prediction *p)
1007 {
1008   inchash::hash hstate;
1009   hstate.add_int (p->ep_predictor);
1010
1011   int prob = p->ep_probability;
1012   if (prob > REG_BR_PROB_BASE / 2)
1013     prob = REG_BR_PROB_BASE - prob;
1014
1015   hstate.add_int (prob);
1016
1017   return hstate.end ();
1018 }
1019
1020 /* Return true whether edge predictions P1 and P2 use the same predictor and
1021    have equal (or opposed probability).  */
1022
1023 inline bool
1024 predictor_hash::equal (const edge_prediction *p1, const edge_prediction *p2)
1025 {
1026   return (p1->ep_predictor == p2->ep_predictor
1027           && (p1->ep_probability == p2->ep_probability
1028               || p1->ep_probability == REG_BR_PROB_BASE - p2->ep_probability));
1029 }
1030
1031 struct predictor_hash_traits: predictor_hash,
1032   typed_noop_remove <edge_prediction *> {};
1033
1034 /* Return true if edge prediction P is not in DATA hash set.  */
1035
1036 static bool
1037 not_removed_prediction_p (edge_prediction *p, void *data)
1038 {
1039   hash_set<edge_prediction *> *remove = (hash_set<edge_prediction *> *) data;
1040   return !remove->contains (p);
1041 }
1042
1043 /* Prune predictions for a basic block BB.  Currently we do following
1044    clean-up steps:
1045
1046    1) remove duplicate prediction that is guessed with the same probability
1047       (different than 1/2) to both edge
1048    2) remove duplicates for a prediction that belongs with the same probability
1049       to a single edge
1050
1051   */
1052
1053 static void
1054 prune_predictions_for_bb (basic_block bb)
1055 {
1056   edge_prediction **preds = bb_predictions->get (bb);
1057
1058   if (preds)
1059     {
1060       hash_table <predictor_hash_traits> s (13);
1061       hash_set <edge_prediction *> remove;
1062
1063       /* Step 1: identify predictors that should be removed.  */
1064       for (edge_prediction *pred = *preds; pred; pred = pred->ep_next)
1065         {
1066           edge_prediction *existing = s.find (pred);
1067           if (existing)
1068             {
1069               if (pred->ep_edge == existing->ep_edge
1070                   && pred->ep_probability == existing->ep_probability)
1071                 {
1072                   /* Remove a duplicate predictor.  */
1073                   dump_prediction (dump_file, pred->ep_predictor,
1074                                    pred->ep_probability, bb,
1075                                    REASON_SINGLE_EDGE_DUPLICATE, pred->ep_edge);
1076
1077                   remove.add (pred);
1078                 }
1079               else if (pred->ep_edge != existing->ep_edge
1080                        && pred->ep_probability == existing->ep_probability
1081                        && pred->ep_probability != REG_BR_PROB_BASE / 2)
1082                 {
1083                   /* Remove both predictors as they predict the same
1084                      for both edges.  */
1085                   dump_prediction (dump_file, existing->ep_predictor,
1086                                    pred->ep_probability, bb,
1087                                    REASON_EDGE_PAIR_DUPLICATE,
1088                                    existing->ep_edge);
1089                   dump_prediction (dump_file, pred->ep_predictor,
1090                                    pred->ep_probability, bb,
1091                                    REASON_EDGE_PAIR_DUPLICATE,
1092                                    pred->ep_edge);
1093
1094                   remove.add (existing);
1095                   remove.add (pred);
1096                 }
1097             }
1098
1099           edge_prediction **slot2 = s.find_slot (pred, INSERT);
1100           *slot2 = pred;
1101         }
1102
1103       /* Step 2: Remove predictors.  */
1104       filter_predictions (preds, not_removed_prediction_p, &remove);
1105     }
1106 }
1107
1108 /* Combine predictions into single probability and store them into CFG.
1109    Remove now useless prediction entries.
1110    If DRY_RUN is set, only produce dumps and do not modify profile.  */
1111
1112 static void
1113 combine_predictions_for_bb (basic_block bb, bool dry_run)
1114 {
1115   int best_probability = PROB_EVEN;
1116   enum br_predictor best_predictor = END_PREDICTORS;
1117   int combined_probability = REG_BR_PROB_BASE / 2;
1118   int d;
1119   bool first_match = false;
1120   bool found = false;
1121   struct edge_prediction *pred;
1122   int nedges = 0;
1123   edge e, first = NULL, second = NULL;
1124   edge_iterator ei;
1125
1126   FOR_EACH_EDGE (e, ei, bb->succs)
1127     if (!unlikely_executed_edge_p (e))
1128       {
1129         nedges ++;
1130         if (first && !second)
1131           second = e;
1132         if (!first)
1133           first = e;
1134       }
1135     else if (!e->probability.initialized_p ())
1136       e->probability = profile_probability::never ();
1137
1138   /* When there is no successor or only one choice, prediction is easy.
1139
1140      When we have a basic block with more than 2 successors, the situation
1141      is more complicated as DS theory cannot be used literally.
1142      More precisely, let's assume we predicted edge e1 with probability p1,
1143      thus: m1({b1}) = p1.  As we're going to combine more than 2 edges, we
1144      need to find probability of e.g. m1({b2}), which we don't know.
1145      The only approximation is to equally distribute 1-p1 to all edges
1146      different from b1.
1147
1148      According to numbers we've got from SPEC2006 benchark, there's only
1149      one interesting reliable predictor (noreturn call), which can be
1150      handled with a bit easier approach.  */
1151   if (nedges != 2)
1152     {
1153       hash_set<edge> unlikely_edges (4);
1154
1155       /* Identify all edges that have a probability close to very unlikely.
1156          Doing the approach for very unlikely doesn't worth for doing as
1157          there's no such probability in SPEC2006 benchmark.  */
1158       edge_prediction **preds = bb_predictions->get (bb);
1159       if (preds)
1160         for (pred = *preds; pred; pred = pred->ep_next)
1161           if (pred->ep_probability <= PROB_VERY_UNLIKELY)
1162             unlikely_edges.add (pred->ep_edge);
1163
1164       if (!dry_run)
1165         set_even_probabilities (bb, &unlikely_edges);
1166       clear_bb_predictions (bb);
1167       if (dump_file)
1168         {
1169           fprintf (dump_file, "Predictions for bb %i\n", bb->index);
1170           if (unlikely_edges.elements () == 0)
1171             fprintf (dump_file,
1172                      "%i edges in bb %i predicted to even probabilities\n",
1173                      nedges, bb->index);
1174           else
1175             {
1176               fprintf (dump_file,
1177                        "%i edges in bb %i predicted with some unlikely edges\n",
1178                        nedges, bb->index);
1179               FOR_EACH_EDGE (e, ei, bb->succs)
1180                 if (!unlikely_executed_edge_p (e))
1181                   dump_prediction (dump_file, PRED_COMBINED,
1182                    e->probability.to_reg_br_prob_base (), bb, REASON_NONE, e);
1183             }
1184         }
1185       return;
1186     }
1187
1188   if (dump_file)
1189     fprintf (dump_file, "Predictions for bb %i\n", bb->index);
1190
1191   prune_predictions_for_bb (bb);
1192
1193   edge_prediction **preds = bb_predictions->get (bb);
1194
1195   if (preds)
1196     {
1197       /* We implement "first match" heuristics and use probability guessed
1198          by predictor with smallest index.  */
1199       for (pred = *preds; pred; pred = pred->ep_next)
1200         {
1201           enum br_predictor predictor = pred->ep_predictor;
1202           int probability = pred->ep_probability;
1203
1204           if (pred->ep_edge != first)
1205             probability = REG_BR_PROB_BASE - probability;
1206
1207           found = true;
1208           /* First match heuristics would be widly confused if we predicted
1209              both directions.  */
1210           if (best_predictor > predictor
1211             && predictor_info[predictor].flags & PRED_FLAG_FIRST_MATCH)
1212             {
1213               struct edge_prediction *pred2;
1214               int prob = probability;
1215
1216               for (pred2 = (struct edge_prediction *) *preds;
1217                    pred2; pred2 = pred2->ep_next)
1218                if (pred2 != pred && pred2->ep_predictor == pred->ep_predictor)
1219                  {
1220                    int probability2 = pred2->ep_probability;
1221
1222                    if (pred2->ep_edge != first)
1223                      probability2 = REG_BR_PROB_BASE - probability2;
1224
1225                    if ((probability < REG_BR_PROB_BASE / 2) !=
1226                        (probability2 < REG_BR_PROB_BASE / 2))
1227                      break;
1228
1229                    /* If the same predictor later gave better result, go for it! */
1230                    if ((probability >= REG_BR_PROB_BASE / 2 && (probability2 > probability))
1231                        || (probability <= REG_BR_PROB_BASE / 2 && (probability2 < probability)))
1232                      prob = probability2;
1233                  }
1234               if (!pred2)
1235                 best_probability = prob, best_predictor = predictor;
1236             }
1237
1238           d = (combined_probability * probability
1239                + (REG_BR_PROB_BASE - combined_probability)
1240                * (REG_BR_PROB_BASE - probability));
1241
1242           /* Use FP math to avoid overflows of 32bit integers.  */
1243           if (d == 0)
1244             /* If one probability is 0% and one 100%, avoid division by zero.  */
1245             combined_probability = REG_BR_PROB_BASE / 2;
1246           else
1247             combined_probability = (((double) combined_probability)
1248                                     * probability
1249                                     * REG_BR_PROB_BASE / d + 0.5);
1250         }
1251     }
1252
1253   /* Decide which heuristic to use.  In case we didn't match anything,
1254      use no_prediction heuristic, in case we did match, use either
1255      first match or Dempster-Shaffer theory depending on the flags.  */
1256
1257   if (best_predictor != END_PREDICTORS)
1258     first_match = true;
1259
1260   if (!found)
1261     dump_prediction (dump_file, PRED_NO_PREDICTION, combined_probability, bb);
1262   else
1263     {
1264       if (!first_match)
1265         dump_prediction (dump_file, PRED_DS_THEORY, combined_probability, bb,
1266                          !first_match ? REASON_NONE : REASON_IGNORED);
1267       else
1268         dump_prediction (dump_file, PRED_FIRST_MATCH, best_probability, bb,
1269                          first_match ? REASON_NONE : REASON_IGNORED);
1270     }
1271
1272   if (first_match)
1273     combined_probability = best_probability;
1274   dump_prediction (dump_file, PRED_COMBINED, combined_probability, bb);
1275
1276   if (preds)
1277     {
1278       for (pred = (struct edge_prediction *) *preds; pred; pred = pred->ep_next)
1279         {
1280           enum br_predictor predictor = pred->ep_predictor;
1281           int probability = pred->ep_probability;
1282
1283           dump_prediction (dump_file, predictor, probability, bb,
1284                            (!first_match || best_predictor == predictor)
1285                            ? REASON_NONE : REASON_IGNORED, pred->ep_edge);
1286         }
1287     }
1288   clear_bb_predictions (bb);
1289
1290   if (!bb->count.initialized_p () && !dry_run)
1291     {
1292       first->probability
1293          = profile_probability::from_reg_br_prob_base (combined_probability);
1294       second->probability = first->probability.invert ();
1295     }
1296 }
1297
1298 /* Check if T1 and T2 satisfy the IV_COMPARE condition.
1299    Return the SSA_NAME if the condition satisfies, NULL otherwise.
1300
1301    T1 and T2 should be one of the following cases:
1302      1. T1 is SSA_NAME, T2 is NULL
1303      2. T1 is SSA_NAME, T2 is INTEGER_CST between [-4, 4]
1304      3. T2 is SSA_NAME, T1 is INTEGER_CST between [-4, 4]  */
1305
1306 static tree
1307 strips_small_constant (tree t1, tree t2)
1308 {
1309   tree ret = NULL;
1310   int value = 0;
1311
1312   if (!t1)
1313     return NULL;
1314   else if (TREE_CODE (t1) == SSA_NAME)
1315     ret = t1;
1316   else if (tree_fits_shwi_p (t1))
1317     value = tree_to_shwi (t1);
1318   else
1319     return NULL;
1320
1321   if (!t2)
1322     return ret;
1323   else if (tree_fits_shwi_p (t2))
1324     value = tree_to_shwi (t2);
1325   else if (TREE_CODE (t2) == SSA_NAME)
1326     {
1327       if (ret)
1328         return NULL;
1329       else
1330         ret = t2;
1331     }
1332
1333   if (value <= 4 && value >= -4)
1334     return ret;
1335   else
1336     return NULL;
1337 }
1338
1339 /* Return the SSA_NAME in T or T's operands.
1340    Return NULL if SSA_NAME cannot be found.  */
1341
1342 static tree
1343 get_base_value (tree t)
1344 {
1345   if (TREE_CODE (t) == SSA_NAME)
1346     return t;
1347
1348   if (!BINARY_CLASS_P (t))
1349     return NULL;
1350
1351   switch (TREE_OPERAND_LENGTH (t))
1352     {
1353     case 1:
1354       return strips_small_constant (TREE_OPERAND (t, 0), NULL);
1355     case 2:
1356       return strips_small_constant (TREE_OPERAND (t, 0),
1357                                     TREE_OPERAND (t, 1));
1358     default:
1359       return NULL;
1360     }
1361 }
1362
1363 /* Check the compare STMT in LOOP. If it compares an induction
1364    variable to a loop invariant, return true, and save
1365    LOOP_INVARIANT, COMPARE_CODE and LOOP_STEP.
1366    Otherwise return false and set LOOP_INVAIANT to NULL.  */
1367
1368 static bool
1369 is_comparison_with_loop_invariant_p (gcond *stmt, struct loop *loop,
1370                                      tree *loop_invariant,
1371                                      enum tree_code *compare_code,
1372                                      tree *loop_step,
1373                                      tree *loop_iv_base)
1374 {
1375   tree op0, op1, bound, base;
1376   affine_iv iv0, iv1;
1377   enum tree_code code;
1378   tree step;
1379
1380   code = gimple_cond_code (stmt);
1381   *loop_invariant = NULL;
1382
1383   switch (code)
1384     {
1385     case GT_EXPR:
1386     case GE_EXPR:
1387     case NE_EXPR:
1388     case LT_EXPR:
1389     case LE_EXPR:
1390     case EQ_EXPR:
1391       break;
1392
1393     default:
1394       return false;
1395     }
1396
1397   op0 = gimple_cond_lhs (stmt);
1398   op1 = gimple_cond_rhs (stmt);
1399
1400   if ((TREE_CODE (op0) != SSA_NAME && TREE_CODE (op0) != INTEGER_CST)
1401        || (TREE_CODE (op1) != SSA_NAME && TREE_CODE (op1) != INTEGER_CST))
1402     return false;
1403   if (!simple_iv (loop, loop_containing_stmt (stmt), op0, &iv0, true))
1404     return false;
1405   if (!simple_iv (loop, loop_containing_stmt (stmt), op1, &iv1, true))
1406     return false;
1407   if (TREE_CODE (iv0.step) != INTEGER_CST
1408       || TREE_CODE (iv1.step) != INTEGER_CST)
1409     return false;
1410   if ((integer_zerop (iv0.step) && integer_zerop (iv1.step))
1411       || (!integer_zerop (iv0.step) && !integer_zerop (iv1.step)))
1412     return false;
1413
1414   if (integer_zerop (iv0.step))
1415     {
1416       if (code != NE_EXPR && code != EQ_EXPR)
1417         code = invert_tree_comparison (code, false);
1418       bound = iv0.base;
1419       base = iv1.base;
1420       if (tree_fits_shwi_p (iv1.step))
1421         step = iv1.step;
1422       else
1423         return false;
1424     }
1425   else
1426     {
1427       bound = iv1.base;
1428       base = iv0.base;
1429       if (tree_fits_shwi_p (iv0.step))
1430         step = iv0.step;
1431       else
1432         return false;
1433     }
1434
1435   if (TREE_CODE (bound) != INTEGER_CST)
1436     bound = get_base_value (bound);
1437   if (!bound)
1438     return false;
1439   if (TREE_CODE (base) != INTEGER_CST)
1440     base = get_base_value (base);
1441   if (!base)
1442     return false;
1443
1444   *loop_invariant = bound;
1445   *compare_code = code;
1446   *loop_step = step;
1447   *loop_iv_base = base;
1448   return true;
1449 }
1450
1451 /* Compare two SSA_NAMEs: returns TRUE if T1 and T2 are value coherent.  */
1452
1453 static bool
1454 expr_coherent_p (tree t1, tree t2)
1455 {
1456   gimple *stmt;
1457   tree ssa_name_1 = NULL;
1458   tree ssa_name_2 = NULL;
1459
1460   gcc_assert (TREE_CODE (t1) == SSA_NAME || TREE_CODE (t1) == INTEGER_CST);
1461   gcc_assert (TREE_CODE (t2) == SSA_NAME || TREE_CODE (t2) == INTEGER_CST);
1462
1463   if (t1 == t2)
1464     return true;
1465
1466   if (TREE_CODE (t1) == INTEGER_CST && TREE_CODE (t2) == INTEGER_CST)
1467     return true;
1468   if (TREE_CODE (t1) == INTEGER_CST || TREE_CODE (t2) == INTEGER_CST)
1469     return false;
1470
1471   /* Check to see if t1 is expressed/defined with t2.  */
1472   stmt = SSA_NAME_DEF_STMT (t1);
1473   gcc_assert (stmt != NULL);
1474   if (is_gimple_assign (stmt))
1475     {
1476       ssa_name_1 = SINGLE_SSA_TREE_OPERAND (stmt, SSA_OP_USE);
1477       if (ssa_name_1 && ssa_name_1 == t2)
1478         return true;
1479     }
1480
1481   /* Check to see if t2 is expressed/defined with t1.  */
1482   stmt = SSA_NAME_DEF_STMT (t2);
1483   gcc_assert (stmt != NULL);
1484   if (is_gimple_assign (stmt))
1485     {
1486       ssa_name_2 = SINGLE_SSA_TREE_OPERAND (stmt, SSA_OP_USE);
1487       if (ssa_name_2 && ssa_name_2 == t1)
1488         return true;
1489     }
1490
1491   /* Compare if t1 and t2's def_stmts are identical.  */
1492   if (ssa_name_2 != NULL && ssa_name_1 == ssa_name_2)
1493     return true;
1494   else
1495     return false;
1496 }
1497
1498 /* Return true if E is predicted by one of loop heuristics.  */
1499
1500 static bool
1501 predicted_by_loop_heuristics_p (basic_block bb)
1502 {
1503   struct edge_prediction *i;
1504   edge_prediction **preds = bb_predictions->get (bb);
1505
1506   if (!preds)
1507     return false;
1508
1509   for (i = *preds; i; i = i->ep_next)
1510     if (i->ep_predictor == PRED_LOOP_ITERATIONS_GUESSED
1511         || i->ep_predictor == PRED_LOOP_ITERATIONS_MAX
1512         || i->ep_predictor == PRED_LOOP_ITERATIONS
1513         || i->ep_predictor == PRED_LOOP_EXIT
1514         || i->ep_predictor == PRED_LOOP_EXIT_WITH_RECURSION
1515         || i->ep_predictor == PRED_LOOP_EXTRA_EXIT)
1516       return true;
1517   return false;
1518 }
1519
1520 /* Predict branch probability of BB when BB contains a branch that compares
1521    an induction variable in LOOP with LOOP_IV_BASE_VAR to LOOP_BOUND_VAR. The
1522    loop exit is compared using LOOP_BOUND_CODE, with step of LOOP_BOUND_STEP.
1523
1524    E.g.
1525      for (int i = 0; i < bound; i++) {
1526        if (i < bound - 2)
1527          computation_1();
1528        else
1529          computation_2();
1530      }
1531
1532   In this loop, we will predict the branch inside the loop to be taken.  */
1533
1534 static void
1535 predict_iv_comparison (struct loop *loop, basic_block bb,
1536                        tree loop_bound_var,
1537                        tree loop_iv_base_var,
1538                        enum tree_code loop_bound_code,
1539                        int loop_bound_step)
1540 {
1541   gimple *stmt;
1542   tree compare_var, compare_base;
1543   enum tree_code compare_code;
1544   tree compare_step_var;
1545   edge then_edge;
1546   edge_iterator ei;
1547
1548   if (predicted_by_loop_heuristics_p (bb))
1549     return;
1550
1551   stmt = last_stmt (bb);
1552   if (!stmt || gimple_code (stmt) != GIMPLE_COND)
1553     return;
1554   if (!is_comparison_with_loop_invariant_p (as_a <gcond *> (stmt),
1555                                             loop, &compare_var,
1556                                             &compare_code,
1557                                             &compare_step_var,
1558                                             &compare_base))
1559     return;
1560
1561   /* Find the taken edge.  */
1562   FOR_EACH_EDGE (then_edge, ei, bb->succs)
1563     if (then_edge->flags & EDGE_TRUE_VALUE)
1564       break;
1565
1566   /* When comparing an IV to a loop invariant, NE is more likely to be
1567      taken while EQ is more likely to be not-taken.  */
1568   if (compare_code == NE_EXPR)
1569     {
1570       predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, TAKEN);
1571       return;
1572     }
1573   else if (compare_code == EQ_EXPR)
1574     {
1575       predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, NOT_TAKEN);
1576       return;
1577     }
1578
1579   if (!expr_coherent_p (loop_iv_base_var, compare_base))
1580     return;
1581
1582   /* If loop bound, base and compare bound are all constants, we can
1583      calculate the probability directly.  */
1584   if (tree_fits_shwi_p (loop_bound_var)
1585       && tree_fits_shwi_p (compare_var)
1586       && tree_fits_shwi_p (compare_base))
1587     {
1588       int probability;
1589       bool overflow, overall_overflow = false;
1590       widest_int compare_count, tem;
1591
1592       /* (loop_bound - base) / compare_step */
1593       tem = wi::sub (wi::to_widest (loop_bound_var),
1594                      wi::to_widest (compare_base), SIGNED, &overflow);
1595       overall_overflow |= overflow;
1596       widest_int loop_count = wi::div_trunc (tem,
1597                                              wi::to_widest (compare_step_var),
1598                                              SIGNED, &overflow);
1599       overall_overflow |= overflow;
1600
1601       if (!wi::neg_p (wi::to_widest (compare_step_var))
1602           ^ (compare_code == LT_EXPR || compare_code == LE_EXPR))
1603         {
1604           /* (loop_bound - compare_bound) / compare_step */
1605           tem = wi::sub (wi::to_widest (loop_bound_var),
1606                          wi::to_widest (compare_var), SIGNED, &overflow);
1607           overall_overflow |= overflow;
1608           compare_count = wi::div_trunc (tem, wi::to_widest (compare_step_var),
1609                                          SIGNED, &overflow);
1610           overall_overflow |= overflow;
1611         }
1612       else
1613         {
1614           /* (compare_bound - base) / compare_step */
1615           tem = wi::sub (wi::to_widest (compare_var),
1616                          wi::to_widest (compare_base), SIGNED, &overflow);
1617           overall_overflow |= overflow;
1618           compare_count = wi::div_trunc (tem, wi::to_widest (compare_step_var),
1619                                          SIGNED, &overflow);
1620           overall_overflow |= overflow;
1621         }
1622       if (compare_code == LE_EXPR || compare_code == GE_EXPR)
1623         ++compare_count;
1624       if (loop_bound_code == LE_EXPR || loop_bound_code == GE_EXPR)
1625         ++loop_count;
1626       if (wi::neg_p (compare_count))
1627         compare_count = 0;
1628       if (wi::neg_p (loop_count))
1629         loop_count = 0;
1630       if (loop_count == 0)
1631         probability = 0;
1632       else if (wi::cmps (compare_count, loop_count) == 1)
1633         probability = REG_BR_PROB_BASE;
1634       else
1635         {
1636           tem = compare_count * REG_BR_PROB_BASE;
1637           tem = wi::udiv_trunc (tem, loop_count);
1638           probability = tem.to_uhwi ();
1639         }
1640
1641       /* FIXME: The branch prediction seems broken. It has only 20% hitrate.  */
1642       if (!overall_overflow)
1643         predict_edge (then_edge, PRED_LOOP_IV_COMPARE, probability);
1644
1645       return;
1646     }
1647
1648   if (expr_coherent_p (loop_bound_var, compare_var))
1649     {
1650       if ((loop_bound_code == LT_EXPR || loop_bound_code == LE_EXPR)
1651           && (compare_code == LT_EXPR || compare_code == LE_EXPR))
1652         predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, TAKEN);
1653       else if ((loop_bound_code == GT_EXPR || loop_bound_code == GE_EXPR)
1654                && (compare_code == GT_EXPR || compare_code == GE_EXPR))
1655         predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, TAKEN);
1656       else if (loop_bound_code == NE_EXPR)
1657         {
1658           /* If the loop backedge condition is "(i != bound)", we do
1659              the comparison based on the step of IV:
1660              * step < 0 : backedge condition is like (i > bound)
1661              * step > 0 : backedge condition is like (i < bound)  */
1662           gcc_assert (loop_bound_step != 0);
1663           if (loop_bound_step > 0
1664               && (compare_code == LT_EXPR
1665                   || compare_code == LE_EXPR))
1666             predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, TAKEN);
1667           else if (loop_bound_step < 0
1668                    && (compare_code == GT_EXPR
1669                        || compare_code == GE_EXPR))
1670             predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, TAKEN);
1671           else
1672             predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, NOT_TAKEN);
1673         }
1674       else
1675         /* The branch is predicted not-taken if loop_bound_code is
1676            opposite with compare_code.  */
1677         predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, NOT_TAKEN);
1678     }
1679   else if (expr_coherent_p (loop_iv_base_var, compare_var))
1680     {
1681       /* For cases like:
1682            for (i = s; i < h; i++)
1683              if (i > s + 2) ....
1684          The branch should be predicted taken.  */
1685       if (loop_bound_step > 0
1686           && (compare_code == GT_EXPR || compare_code == GE_EXPR))
1687         predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, TAKEN);
1688       else if (loop_bound_step < 0
1689                && (compare_code == LT_EXPR || compare_code == LE_EXPR))
1690         predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, TAKEN);
1691       else
1692         predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, NOT_TAKEN);
1693     }
1694 }
1695
1696 /* Predict for extra loop exits that will lead to EXIT_EDGE. The extra loop
1697    exits are resulted from short-circuit conditions that will generate an
1698    if_tmp. E.g.:
1699
1700    if (foo() || global > 10)
1701      break;
1702
1703    This will be translated into:
1704
1705    BB3:
1706      loop header...
1707    BB4:
1708      if foo() goto BB6 else goto BB5
1709    BB5:
1710      if global > 10 goto BB6 else goto BB7
1711    BB6:
1712      goto BB7
1713    BB7:
1714      iftmp = (PHI 0(BB5), 1(BB6))
1715      if iftmp == 1 goto BB8 else goto BB3
1716    BB8:
1717      outside of the loop...
1718
1719    The edge BB7->BB8 is loop exit because BB8 is outside of the loop.
1720    From the dataflow, we can infer that BB4->BB6 and BB5->BB6 are also loop
1721    exits. This function takes BB7->BB8 as input, and finds out the extra loop
1722    exits to predict them using PRED_LOOP_EXTRA_EXIT.  */
1723
1724 static void
1725 predict_extra_loop_exits (edge exit_edge)
1726 {
1727   unsigned i;
1728   bool check_value_one;
1729   gimple *lhs_def_stmt;
1730   gphi *phi_stmt;
1731   tree cmp_rhs, cmp_lhs;
1732   gimple *last;
1733   gcond *cmp_stmt;
1734
1735   last = last_stmt (exit_edge->src);
1736   if (!last)
1737     return;
1738   cmp_stmt = dyn_cast <gcond *> (last);
1739   if (!cmp_stmt)
1740     return;
1741
1742   cmp_rhs = gimple_cond_rhs (cmp_stmt);
1743   cmp_lhs = gimple_cond_lhs (cmp_stmt);
1744   if (!TREE_CONSTANT (cmp_rhs)
1745       || !(integer_zerop (cmp_rhs) || integer_onep (cmp_rhs)))
1746     return;
1747   if (TREE_CODE (cmp_lhs) != SSA_NAME)
1748     return;
1749
1750   /* If check_value_one is true, only the phi_args with value '1' will lead
1751      to loop exit. Otherwise, only the phi_args with value '0' will lead to
1752      loop exit.  */
1753   check_value_one = (((integer_onep (cmp_rhs))
1754                     ^ (gimple_cond_code (cmp_stmt) == EQ_EXPR))
1755                     ^ ((exit_edge->flags & EDGE_TRUE_VALUE) != 0));
1756
1757   lhs_def_stmt = SSA_NAME_DEF_STMT (cmp_lhs);
1758   if (!lhs_def_stmt)
1759     return;
1760
1761   phi_stmt = dyn_cast <gphi *> (lhs_def_stmt);
1762   if (!phi_stmt)
1763     return;
1764
1765   for (i = 0; i < gimple_phi_num_args (phi_stmt); i++)
1766     {
1767       edge e1;
1768       edge_iterator ei;
1769       tree val = gimple_phi_arg_def (phi_stmt, i);
1770       edge e = gimple_phi_arg_edge (phi_stmt, i);
1771
1772       if (!TREE_CONSTANT (val) || !(integer_zerop (val) || integer_onep (val)))
1773         continue;
1774       if ((check_value_one ^ integer_onep (val)) == 1)
1775         continue;
1776       if (EDGE_COUNT (e->src->succs) != 1)
1777         {
1778           predict_paths_leading_to_edge (e, PRED_LOOP_EXTRA_EXIT, NOT_TAKEN);
1779           continue;
1780         }
1781
1782       FOR_EACH_EDGE (e1, ei, e->src->preds)
1783         predict_paths_leading_to_edge (e1, PRED_LOOP_EXTRA_EXIT, NOT_TAKEN);
1784     }
1785 }
1786
1787
1788 /* Predict edge probabilities by exploiting loop structure.  */
1789
1790 static void
1791 predict_loops (void)
1792 {
1793   struct loop *loop;
1794   basic_block bb;
1795   hash_set <struct loop *> with_recursion(10);
1796
1797   FOR_EACH_BB_FN (bb, cfun)
1798     {
1799       gimple_stmt_iterator gsi;
1800       tree decl;
1801
1802       for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
1803         if (is_gimple_call (gsi_stmt (gsi))
1804             && (decl = gimple_call_fndecl (gsi_stmt (gsi))) != NULL
1805             && recursive_call_p (current_function_decl, decl))
1806           {
1807             loop = bb->loop_father;
1808             while (loop && !with_recursion.add (loop))
1809               loop = loop_outer (loop);
1810           }
1811     }
1812
1813   /* Try to predict out blocks in a loop that are not part of a
1814      natural loop.  */
1815   FOR_EACH_LOOP (loop, LI_FROM_INNERMOST)
1816     {
1817       basic_block bb, *bbs;
1818       unsigned j, n_exits = 0;
1819       vec<edge> exits;
1820       struct tree_niter_desc niter_desc;
1821       edge ex;
1822       struct nb_iter_bound *nb_iter;
1823       enum tree_code loop_bound_code = ERROR_MARK;
1824       tree loop_bound_step = NULL;
1825       tree loop_bound_var = NULL;
1826       tree loop_iv_base = NULL;
1827       gcond *stmt = NULL;
1828       bool recursion = with_recursion.contains (loop);
1829
1830       exits = get_loop_exit_edges (loop);
1831       FOR_EACH_VEC_ELT (exits, j, ex)
1832         if (!unlikely_executed_edge_p (ex) && !(ex->flags & EDGE_ABNORMAL_CALL))
1833           n_exits ++;
1834       if (!n_exits)
1835         {
1836           exits.release ();
1837           continue;
1838         }
1839
1840       if (dump_file && (dump_flags & TDF_DETAILS))
1841         fprintf (dump_file, "Predicting loop %i%s with %i exits.\n",
1842                  loop->num, recursion ? " (with recursion)":"", n_exits);
1843       if (dump_file && (dump_flags & TDF_DETAILS)
1844           && max_loop_iterations_int (loop) >= 0)
1845         {
1846           fprintf (dump_file,
1847                    "Loop %d iterates at most %i times.\n", loop->num,
1848                    (int)max_loop_iterations_int (loop));
1849         }
1850       if (dump_file && (dump_flags & TDF_DETAILS)
1851           && likely_max_loop_iterations_int (loop) >= 0)
1852         {
1853           fprintf (dump_file, "Loop %d likely iterates at most %i times.\n",
1854                    loop->num, (int)likely_max_loop_iterations_int (loop));
1855         }
1856
1857       FOR_EACH_VEC_ELT (exits, j, ex)
1858         {
1859           tree niter = NULL;
1860           HOST_WIDE_INT nitercst;
1861           int max = PARAM_VALUE (PARAM_MAX_PREDICTED_ITERATIONS);
1862           int probability;
1863           enum br_predictor predictor;
1864           widest_int nit;
1865
1866           if (unlikely_executed_edge_p (ex)
1867               || (ex->flags & EDGE_ABNORMAL_CALL))
1868             continue;
1869           /* Loop heuristics do not expect exit conditional to be inside
1870              inner loop.  We predict from innermost to outermost loop.  */
1871           if (predicted_by_loop_heuristics_p (ex->src))
1872             {
1873               if (dump_file && (dump_flags & TDF_DETAILS))
1874                 fprintf (dump_file, "Skipping exit %i->%i because "
1875                          "it is already predicted.\n",
1876                          ex->src->index, ex->dest->index);
1877               continue;
1878             }
1879           predict_extra_loop_exits (ex);
1880
1881           if (number_of_iterations_exit (loop, ex, &niter_desc, false, false))
1882             niter = niter_desc.niter;
1883           if (!niter || TREE_CODE (niter_desc.niter) != INTEGER_CST)
1884             niter = loop_niter_by_eval (loop, ex);
1885           if (dump_file && (dump_flags & TDF_DETAILS)
1886               && TREE_CODE (niter) == INTEGER_CST)
1887             {
1888               fprintf (dump_file, "Exit %i->%i %d iterates ",
1889                        ex->src->index, ex->dest->index,
1890                        loop->num);
1891               print_generic_expr (dump_file, niter, TDF_SLIM);
1892               fprintf (dump_file, " times.\n");
1893             }
1894
1895           if (TREE_CODE (niter) == INTEGER_CST)
1896             {
1897               if (tree_fits_uhwi_p (niter)
1898                   && max
1899                   && compare_tree_int (niter, max - 1) == -1)
1900                 nitercst = tree_to_uhwi (niter) + 1;
1901               else
1902                 nitercst = max;
1903               predictor = PRED_LOOP_ITERATIONS;
1904             }
1905           /* If we have just one exit and we can derive some information about
1906              the number of iterations of the loop from the statements inside
1907              the loop, use it to predict this exit.  */
1908           else if (n_exits == 1
1909                    && estimated_stmt_executions (loop, &nit))
1910             {
1911               if (wi::gtu_p (nit, max))
1912                 nitercst = max;
1913               else
1914                 nitercst = nit.to_shwi ();
1915               predictor = PRED_LOOP_ITERATIONS_GUESSED;
1916             }
1917           /* If we have likely upper bound, trust it for very small iteration
1918              counts.  Such loops would otherwise get mispredicted by standard
1919              LOOP_EXIT heuristics.  */
1920           else if (n_exits == 1
1921                    && likely_max_stmt_executions (loop, &nit)
1922                    && wi::ltu_p (nit,
1923                                  RDIV (REG_BR_PROB_BASE,
1924                                        REG_BR_PROB_BASE
1925                                          - predictor_info
1926                                                  [recursion
1927                                                   ? PRED_LOOP_EXIT_WITH_RECURSION
1928                                                   : PRED_LOOP_EXIT].hitrate)))
1929             {
1930               nitercst = nit.to_shwi ();
1931               predictor = PRED_LOOP_ITERATIONS_MAX;
1932             }
1933           else
1934             {
1935               if (dump_file && (dump_flags & TDF_DETAILS))
1936                 fprintf (dump_file, "Nothing known about exit %i->%i.\n",
1937                          ex->src->index, ex->dest->index);
1938               continue;
1939             }
1940
1941           if (dump_file && (dump_flags & TDF_DETAILS))
1942             fprintf (dump_file, "Recording prediction to %i iterations by %s.\n",
1943                      (int)nitercst, predictor_info[predictor].name);
1944           /* If the prediction for number of iterations is zero, do not
1945              predict the exit edges.  */
1946           if (nitercst == 0)
1947             continue;
1948
1949           probability = RDIV (REG_BR_PROB_BASE, nitercst);
1950           predict_edge (ex, predictor, probability);
1951         }
1952       exits.release ();
1953
1954       /* Find information about loop bound variables.  */
1955       for (nb_iter = loop->bounds; nb_iter;
1956            nb_iter = nb_iter->next)
1957         if (nb_iter->stmt
1958             && gimple_code (nb_iter->stmt) == GIMPLE_COND)
1959           {
1960             stmt = as_a <gcond *> (nb_iter->stmt);
1961             break;
1962           }
1963       if (!stmt && last_stmt (loop->header)
1964           && gimple_code (last_stmt (loop->header)) == GIMPLE_COND)
1965         stmt = as_a <gcond *> (last_stmt (loop->header));
1966       if (stmt)
1967         is_comparison_with_loop_invariant_p (stmt, loop,
1968                                              &loop_bound_var,
1969                                              &loop_bound_code,
1970                                              &loop_bound_step,
1971                                              &loop_iv_base);
1972
1973       bbs = get_loop_body (loop);
1974
1975       for (j = 0; j < loop->num_nodes; j++)
1976         {
1977           edge e;
1978           edge_iterator ei;
1979
1980           bb = bbs[j];
1981
1982           /* Bypass loop heuristics on continue statement.  These
1983              statements construct loops via "non-loop" constructs
1984              in the source language and are better to be handled
1985              separately.  */
1986           if (predicted_by_p (bb, PRED_CONTINUE))
1987             {
1988               if (dump_file && (dump_flags & TDF_DETAILS))
1989                 fprintf (dump_file, "BB %i predicted by continue.\n",
1990                          bb->index);
1991               continue;
1992             }
1993
1994           /* If we already used more reliable loop exit predictors, do not
1995              bother with PRED_LOOP_EXIT.  */
1996           if (!predicted_by_loop_heuristics_p (bb))
1997             {
1998               /* For loop with many exits we don't want to predict all exits
1999                  with the pretty large probability, because if all exits are
2000                  considered in row, the loop would be predicted to iterate
2001                  almost never.  The code to divide probability by number of
2002                  exits is very rough.  It should compute the number of exits
2003                  taken in each patch through function (not the overall number
2004                  of exits that might be a lot higher for loops with wide switch
2005                  statements in them) and compute n-th square root.
2006
2007                  We limit the minimal probability by 2% to avoid
2008                  EDGE_PROBABILITY_RELIABLE from trusting the branch prediction
2009                  as this was causing regression in perl benchmark containing such
2010                  a wide loop.  */
2011
2012               int probability = ((REG_BR_PROB_BASE
2013                                   - predictor_info
2014                                      [recursion
2015                                       ? PRED_LOOP_EXIT_WITH_RECURSION
2016                                       : PRED_LOOP_EXIT].hitrate)
2017                                  / n_exits);
2018               if (probability < HITRATE (2))
2019                 probability = HITRATE (2);
2020               FOR_EACH_EDGE (e, ei, bb->succs)
2021                 if (e->dest->index < NUM_FIXED_BLOCKS
2022                     || !flow_bb_inside_loop_p (loop, e->dest))
2023                   {
2024                     if (dump_file && (dump_flags & TDF_DETAILS))
2025                       fprintf (dump_file,
2026                                "Predicting exit %i->%i with prob %i.\n",
2027                                e->src->index, e->dest->index, probability);
2028                     predict_edge (e,
2029                                   recursion ? PRED_LOOP_EXIT_WITH_RECURSION
2030                                   : PRED_LOOP_EXIT, probability);
2031                   }
2032             }
2033           if (loop_bound_var)
2034             predict_iv_comparison (loop, bb, loop_bound_var, loop_iv_base,
2035                                    loop_bound_code,
2036                                    tree_to_shwi (loop_bound_step));
2037         }
2038
2039       /* In the following code
2040          for (loop1)
2041            if (cond)
2042              for (loop2)
2043                body;
2044          guess that cond is unlikely.  */
2045       if (loop_outer (loop)->num)
2046         {
2047           basic_block bb = NULL;
2048           edge preheader_edge = loop_preheader_edge (loop);
2049
2050           if (single_pred_p (preheader_edge->src)
2051               && single_succ_p (preheader_edge->src))
2052             preheader_edge = single_pred_edge (preheader_edge->src);
2053
2054           gimple *stmt = last_stmt (preheader_edge->src);
2055           /* Pattern match fortran loop preheader:
2056              _16 = BUILTIN_EXPECT (_15, 1, PRED_FORTRAN_LOOP_PREHEADER);
2057              _17 = (logical(kind=4)) _16;
2058              if (_17 != 0)
2059                goto <bb 11>;
2060              else
2061                goto <bb 13>;
2062
2063              Loop guard branch prediction says nothing about duplicated loop
2064              headers produced by fortran frontend and in this case we want
2065              to predict paths leading to this preheader.  */
2066
2067           if (stmt
2068               && gimple_code (stmt) == GIMPLE_COND
2069               && gimple_cond_code (stmt) == NE_EXPR
2070               && TREE_CODE (gimple_cond_lhs (stmt)) == SSA_NAME
2071               && integer_zerop (gimple_cond_rhs (stmt)))
2072              {
2073                gimple *call_stmt = SSA_NAME_DEF_STMT (gimple_cond_lhs (stmt));
2074                if (gimple_code (call_stmt) == GIMPLE_ASSIGN
2075                    && gimple_expr_code (call_stmt) == NOP_EXPR
2076                    && TREE_CODE (gimple_assign_rhs1 (call_stmt)) == SSA_NAME)
2077                  call_stmt = SSA_NAME_DEF_STMT (gimple_assign_rhs1 (call_stmt));
2078                if (gimple_call_internal_p (call_stmt, IFN_BUILTIN_EXPECT)
2079                    && TREE_CODE (gimple_call_arg (call_stmt, 2)) == INTEGER_CST
2080                    && tree_fits_uhwi_p (gimple_call_arg (call_stmt, 2))
2081                    && tree_to_uhwi (gimple_call_arg (call_stmt, 2))
2082                         == PRED_FORTRAN_LOOP_PREHEADER)
2083                  bb = preheader_edge->src;
2084              }
2085           if (!bb)
2086             {
2087               if (!dominated_by_p (CDI_DOMINATORS,
2088                                    loop_outer (loop)->latch, loop->header))
2089                 predict_paths_leading_to_edge (loop_preheader_edge (loop),
2090                                                recursion
2091                                                ? PRED_LOOP_GUARD_WITH_RECURSION
2092                                                : PRED_LOOP_GUARD,
2093                                                NOT_TAKEN,
2094                                                loop_outer (loop));
2095             }
2096           else
2097             {
2098               if (!dominated_by_p (CDI_DOMINATORS,
2099                                    loop_outer (loop)->latch, bb))
2100                 predict_paths_leading_to (bb,
2101                                           recursion
2102                                           ? PRED_LOOP_GUARD_WITH_RECURSION
2103                                           : PRED_LOOP_GUARD,
2104                                           NOT_TAKEN,
2105                                           loop_outer (loop));
2106             }
2107         }
2108
2109       /* Free basic blocks from get_loop_body.  */
2110       free (bbs);
2111     }
2112 }
2113
2114 /* Attempt to predict probabilities of BB outgoing edges using local
2115    properties.  */
2116 static void
2117 bb_estimate_probability_locally (basic_block bb)
2118 {
2119   rtx_insn *last_insn = BB_END (bb);
2120   rtx cond;
2121
2122   if (! can_predict_insn_p (last_insn))
2123     return;
2124   cond = get_condition (last_insn, NULL, false, false);
2125   if (! cond)
2126     return;
2127
2128   /* Try "pointer heuristic."
2129      A comparison ptr == 0 is predicted as false.
2130      Similarly, a comparison ptr1 == ptr2 is predicted as false.  */
2131   if (COMPARISON_P (cond)
2132       && ((REG_P (XEXP (cond, 0)) && REG_POINTER (XEXP (cond, 0)))
2133           || (REG_P (XEXP (cond, 1)) && REG_POINTER (XEXP (cond, 1)))))
2134     {
2135       if (GET_CODE (cond) == EQ)
2136         predict_insn_def (last_insn, PRED_POINTER, NOT_TAKEN);
2137       else if (GET_CODE (cond) == NE)
2138         predict_insn_def (last_insn, PRED_POINTER, TAKEN);
2139     }
2140   else
2141
2142   /* Try "opcode heuristic."
2143      EQ tests are usually false and NE tests are usually true. Also,
2144      most quantities are positive, so we can make the appropriate guesses
2145      about signed comparisons against zero.  */
2146     switch (GET_CODE (cond))
2147       {
2148       case CONST_INT:
2149         /* Unconditional branch.  */
2150         predict_insn_def (last_insn, PRED_UNCONDITIONAL,
2151                           cond == const0_rtx ? NOT_TAKEN : TAKEN);
2152         break;
2153
2154       case EQ:
2155       case UNEQ:
2156         /* Floating point comparisons appears to behave in a very
2157            unpredictable way because of special role of = tests in
2158            FP code.  */
2159         if (FLOAT_MODE_P (GET_MODE (XEXP (cond, 0))))
2160           ;
2161         /* Comparisons with 0 are often used for booleans and there is
2162            nothing useful to predict about them.  */
2163         else if (XEXP (cond, 1) == const0_rtx
2164                  || XEXP (cond, 0) == const0_rtx)
2165           ;
2166         else
2167           predict_insn_def (last_insn, PRED_OPCODE_NONEQUAL, NOT_TAKEN);
2168         break;
2169
2170       case NE:
2171       case LTGT:
2172         /* Floating point comparisons appears to behave in a very
2173            unpredictable way because of special role of = tests in
2174            FP code.  */
2175         if (FLOAT_MODE_P (GET_MODE (XEXP (cond, 0))))
2176           ;
2177         /* Comparisons with 0 are often used for booleans and there is
2178            nothing useful to predict about them.  */
2179         else if (XEXP (cond, 1) == const0_rtx
2180                  || XEXP (cond, 0) == const0_rtx)
2181           ;
2182         else
2183           predict_insn_def (last_insn, PRED_OPCODE_NONEQUAL, TAKEN);
2184         break;
2185
2186       case ORDERED:
2187         predict_insn_def (last_insn, PRED_FPOPCODE, TAKEN);
2188         break;
2189
2190       case UNORDERED:
2191         predict_insn_def (last_insn, PRED_FPOPCODE, NOT_TAKEN);
2192         break;
2193
2194       case LE:
2195       case LT:
2196         if (XEXP (cond, 1) == const0_rtx || XEXP (cond, 1) == const1_rtx
2197             || XEXP (cond, 1) == constm1_rtx)
2198           predict_insn_def (last_insn, PRED_OPCODE_POSITIVE, NOT_TAKEN);
2199         break;
2200
2201       case GE:
2202       case GT:
2203         if (XEXP (cond, 1) == const0_rtx || XEXP (cond, 1) == const1_rtx
2204             || XEXP (cond, 1) == constm1_rtx)
2205           predict_insn_def (last_insn, PRED_OPCODE_POSITIVE, TAKEN);
2206         break;
2207
2208       default:
2209         break;
2210       }
2211 }
2212
2213 /* Set edge->probability for each successor edge of BB.  */
2214 void
2215 guess_outgoing_edge_probabilities (basic_block bb)
2216 {
2217   bb_estimate_probability_locally (bb);
2218   combine_predictions_for_insn (BB_END (bb), bb);
2219 }
2220 \f
2221 static tree expr_expected_value (tree, bitmap, enum br_predictor *predictor);
2222
2223 /* Helper function for expr_expected_value.  */
2224
2225 static tree
2226 expr_expected_value_1 (tree type, tree op0, enum tree_code code,
2227                        tree op1, bitmap visited, enum br_predictor *predictor)
2228 {
2229   gimple *def;
2230
2231   if (predictor)
2232     *predictor = PRED_UNCONDITIONAL;
2233
2234   if (get_gimple_rhs_class (code) == GIMPLE_SINGLE_RHS)
2235     {
2236       if (TREE_CONSTANT (op0))
2237         return op0;
2238
2239       if (code == IMAGPART_EXPR)
2240         {
2241           if (TREE_CODE (TREE_OPERAND (op0, 0)) == SSA_NAME)
2242             {
2243               def = SSA_NAME_DEF_STMT (TREE_OPERAND (op0, 0));
2244               if (is_gimple_call (def)
2245                   && gimple_call_internal_p (def)
2246                   && (gimple_call_internal_fn (def)
2247                       == IFN_ATOMIC_COMPARE_EXCHANGE))
2248                 {
2249                   /* Assume that any given atomic operation has low contention,
2250                      and thus the compare-and-swap operation succeeds.  */
2251                   if (predictor)
2252                     *predictor = PRED_COMPARE_AND_SWAP;
2253                   return build_one_cst (TREE_TYPE (op0));
2254                 }
2255             }
2256         }
2257
2258       if (code != SSA_NAME)
2259         return NULL_TREE;
2260
2261       def = SSA_NAME_DEF_STMT (op0);
2262
2263       /* If we were already here, break the infinite cycle.  */
2264       if (!bitmap_set_bit (visited, SSA_NAME_VERSION (op0)))
2265         return NULL;
2266
2267       if (gimple_code (def) == GIMPLE_PHI)
2268         {
2269           /* All the arguments of the PHI node must have the same constant
2270              length.  */
2271           int i, n = gimple_phi_num_args (def);
2272           tree val = NULL, new_val;
2273
2274           for (i = 0; i < n; i++)
2275             {
2276               tree arg = PHI_ARG_DEF (def, i);
2277               enum br_predictor predictor2;
2278
2279               /* If this PHI has itself as an argument, we cannot
2280                  determine the string length of this argument.  However,
2281                  if we can find an expected constant value for the other
2282                  PHI args then we can still be sure that this is
2283                  likely a constant.  So be optimistic and just
2284                  continue with the next argument.  */
2285               if (arg == PHI_RESULT (def))
2286                 continue;
2287
2288               new_val = expr_expected_value (arg, visited, &predictor2);
2289
2290               /* It is difficult to combine value predictors.  Simply assume
2291                  that later predictor is weaker and take its prediction.  */
2292               if (predictor && *predictor < predictor2)
2293                 *predictor = predictor2;
2294               if (!new_val)
2295                 return NULL;
2296               if (!val)
2297                 val = new_val;
2298               else if (!operand_equal_p (val, new_val, false))
2299                 return NULL;
2300             }
2301           return val;
2302         }
2303       if (is_gimple_assign (def))
2304         {
2305           if (gimple_assign_lhs (def) != op0)
2306             return NULL;
2307
2308           return expr_expected_value_1 (TREE_TYPE (gimple_assign_lhs (def)),
2309                                         gimple_assign_rhs1 (def),
2310                                         gimple_assign_rhs_code (def),
2311                                         gimple_assign_rhs2 (def),
2312                                         visited, predictor);
2313         }
2314
2315       if (is_gimple_call (def))
2316         {
2317           tree decl = gimple_call_fndecl (def);
2318           if (!decl)
2319             {
2320               if (gimple_call_internal_p (def)
2321                   && gimple_call_internal_fn (def) == IFN_BUILTIN_EXPECT)
2322                 {
2323                   gcc_assert (gimple_call_num_args (def) == 3);
2324                   tree val = gimple_call_arg (def, 0);
2325                   if (TREE_CONSTANT (val))
2326                     return val;
2327                   if (predictor)
2328                     {
2329                       tree val2 = gimple_call_arg (def, 2);
2330                       gcc_assert (TREE_CODE (val2) == INTEGER_CST
2331                                   && tree_fits_uhwi_p (val2)
2332                                   && tree_to_uhwi (val2) < END_PREDICTORS);
2333                       *predictor = (enum br_predictor) tree_to_uhwi (val2);
2334                     }
2335                   return gimple_call_arg (def, 1);
2336                 }
2337               return NULL;
2338             }
2339           if (DECL_BUILT_IN_CLASS (decl) == BUILT_IN_NORMAL)
2340             switch (DECL_FUNCTION_CODE (decl))
2341               {
2342               case BUILT_IN_EXPECT:
2343                 {
2344                   tree val;
2345                   if (gimple_call_num_args (def) != 2)
2346                     return NULL;
2347                   val = gimple_call_arg (def, 0);
2348                   if (TREE_CONSTANT (val))
2349                     return val;
2350                   if (predictor)
2351                     *predictor = PRED_BUILTIN_EXPECT;
2352                   return gimple_call_arg (def, 1);
2353                 }
2354
2355               case BUILT_IN_SYNC_BOOL_COMPARE_AND_SWAP_N:
2356               case BUILT_IN_SYNC_BOOL_COMPARE_AND_SWAP_1:
2357               case BUILT_IN_SYNC_BOOL_COMPARE_AND_SWAP_2:
2358               case BUILT_IN_SYNC_BOOL_COMPARE_AND_SWAP_4:
2359               case BUILT_IN_SYNC_BOOL_COMPARE_AND_SWAP_8:
2360               case BUILT_IN_SYNC_BOOL_COMPARE_AND_SWAP_16:
2361               case BUILT_IN_ATOMIC_COMPARE_EXCHANGE:
2362               case BUILT_IN_ATOMIC_COMPARE_EXCHANGE_N:
2363               case BUILT_IN_ATOMIC_COMPARE_EXCHANGE_1:
2364               case BUILT_IN_ATOMIC_COMPARE_EXCHANGE_2:
2365               case BUILT_IN_ATOMIC_COMPARE_EXCHANGE_4:
2366               case BUILT_IN_ATOMIC_COMPARE_EXCHANGE_8:
2367               case BUILT_IN_ATOMIC_COMPARE_EXCHANGE_16:
2368                 /* Assume that any given atomic operation has low contention,
2369                    and thus the compare-and-swap operation succeeds.  */
2370                 if (predictor)
2371                   *predictor = PRED_COMPARE_AND_SWAP;
2372                 return boolean_true_node;
2373               default:
2374                 break;
2375             }
2376         }
2377
2378       return NULL;
2379     }
2380
2381   if (get_gimple_rhs_class (code) == GIMPLE_BINARY_RHS)
2382     {
2383       tree res;
2384       enum br_predictor predictor2;
2385       op0 = expr_expected_value (op0, visited, predictor);
2386       if (!op0)
2387         return NULL;
2388       op1 = expr_expected_value (op1, visited, &predictor2);
2389       if (predictor && *predictor < predictor2)
2390         *predictor = predictor2;
2391       if (!op1)
2392         return NULL;
2393       res = fold_build2 (code, type, op0, op1);
2394       if (TREE_CONSTANT (res))
2395         return res;
2396       return NULL;
2397     }
2398   if (get_gimple_rhs_class (code) == GIMPLE_UNARY_RHS)
2399     {
2400       tree res;
2401       op0 = expr_expected_value (op0, visited, predictor);
2402       if (!op0)
2403         return NULL;
2404       res = fold_build1 (code, type, op0);
2405       if (TREE_CONSTANT (res))
2406         return res;
2407       return NULL;
2408     }
2409   return NULL;
2410 }
2411
2412 /* Return constant EXPR will likely have at execution time, NULL if unknown.
2413    The function is used by builtin_expect branch predictor so the evidence
2414    must come from this construct and additional possible constant folding.
2415
2416    We may want to implement more involved value guess (such as value range
2417    propagation based prediction), but such tricks shall go to new
2418    implementation.  */
2419
2420 static tree
2421 expr_expected_value (tree expr, bitmap visited,
2422                      enum br_predictor *predictor)
2423 {
2424   enum tree_code code;
2425   tree op0, op1;
2426
2427   if (TREE_CONSTANT (expr))
2428     {
2429       if (predictor)
2430         *predictor = PRED_UNCONDITIONAL;
2431       return expr;
2432     }
2433
2434   extract_ops_from_tree (expr, &code, &op0, &op1);
2435   return expr_expected_value_1 (TREE_TYPE (expr),
2436                                 op0, code, op1, visited, predictor);
2437 }
2438 \f
2439 /* Predict using opcode of the last statement in basic block.  */
2440 static void
2441 tree_predict_by_opcode (basic_block bb)
2442 {
2443   gimple *stmt = last_stmt (bb);
2444   edge then_edge;
2445   tree op0, op1;
2446   tree type;
2447   tree val;
2448   enum tree_code cmp;
2449   edge_iterator ei;
2450   enum br_predictor predictor;
2451
2452   if (!stmt || gimple_code (stmt) != GIMPLE_COND)
2453     return;
2454   FOR_EACH_EDGE (then_edge, ei, bb->succs)
2455     if (then_edge->flags & EDGE_TRUE_VALUE)
2456       break;
2457   op0 = gimple_cond_lhs (stmt);
2458   op1 = gimple_cond_rhs (stmt);
2459   cmp = gimple_cond_code (stmt);
2460   type = TREE_TYPE (op0);
2461   val = expr_expected_value_1 (boolean_type_node, op0, cmp, op1, auto_bitmap (),
2462                                &predictor);
2463   if (val && TREE_CODE (val) == INTEGER_CST)
2464     {
2465       if (predictor == PRED_BUILTIN_EXPECT)
2466         {
2467           int percent = PARAM_VALUE (BUILTIN_EXPECT_PROBABILITY);
2468
2469           gcc_assert (percent >= 0 && percent <= 100);
2470           if (integer_zerop (val))
2471             percent = 100 - percent;
2472           predict_edge (then_edge, PRED_BUILTIN_EXPECT, HITRATE (percent));
2473         }
2474       else
2475         predict_edge_def (then_edge, predictor,
2476                           integer_zerop (val) ? NOT_TAKEN : TAKEN);
2477     }
2478   /* Try "pointer heuristic."
2479      A comparison ptr == 0 is predicted as false.
2480      Similarly, a comparison ptr1 == ptr2 is predicted as false.  */
2481   if (POINTER_TYPE_P (type))
2482     {
2483       if (cmp == EQ_EXPR)
2484         predict_edge_def (then_edge, PRED_TREE_POINTER, NOT_TAKEN);
2485       else if (cmp == NE_EXPR)
2486         predict_edge_def (then_edge, PRED_TREE_POINTER, TAKEN);
2487     }
2488   else
2489
2490   /* Try "opcode heuristic."
2491      EQ tests are usually false and NE tests are usually true. Also,
2492      most quantities are positive, so we can make the appropriate guesses
2493      about signed comparisons against zero.  */
2494     switch (cmp)
2495       {
2496       case EQ_EXPR:
2497       case UNEQ_EXPR:
2498         /* Floating point comparisons appears to behave in a very
2499            unpredictable way because of special role of = tests in
2500            FP code.  */
2501         if (FLOAT_TYPE_P (type))
2502           ;
2503         /* Comparisons with 0 are often used for booleans and there is
2504            nothing useful to predict about them.  */
2505         else if (integer_zerop (op0) || integer_zerop (op1))
2506           ;
2507         else
2508           predict_edge_def (then_edge, PRED_TREE_OPCODE_NONEQUAL, NOT_TAKEN);
2509         break;
2510
2511       case NE_EXPR:
2512       case LTGT_EXPR:
2513         /* Floating point comparisons appears to behave in a very
2514            unpredictable way because of special role of = tests in
2515            FP code.  */
2516         if (FLOAT_TYPE_P (type))
2517           ;
2518         /* Comparisons with 0 are often used for booleans and there is
2519            nothing useful to predict about them.  */
2520         else if (integer_zerop (op0)
2521                  || integer_zerop (op1))
2522           ;
2523         else
2524           predict_edge_def (then_edge, PRED_TREE_OPCODE_NONEQUAL, TAKEN);
2525         break;
2526
2527       case ORDERED_EXPR:
2528         predict_edge_def (then_edge, PRED_TREE_FPOPCODE, TAKEN);
2529         break;
2530
2531       case UNORDERED_EXPR:
2532         predict_edge_def (then_edge, PRED_TREE_FPOPCODE, NOT_TAKEN);
2533         break;
2534
2535       case LE_EXPR:
2536       case LT_EXPR:
2537         if (integer_zerop (op1)
2538             || integer_onep (op1)
2539             || integer_all_onesp (op1)
2540             || real_zerop (op1)
2541             || real_onep (op1)
2542             || real_minus_onep (op1))
2543           predict_edge_def (then_edge, PRED_TREE_OPCODE_POSITIVE, NOT_TAKEN);
2544         break;
2545
2546       case GE_EXPR:
2547       case GT_EXPR:
2548         if (integer_zerop (op1)
2549             || integer_onep (op1)
2550             || integer_all_onesp (op1)
2551             || real_zerop (op1)
2552             || real_onep (op1)
2553             || real_minus_onep (op1))
2554           predict_edge_def (then_edge, PRED_TREE_OPCODE_POSITIVE, TAKEN);
2555         break;
2556
2557       default:
2558         break;
2559       }
2560 }
2561
2562 /* Returns TRUE if the STMT is exit(0) like statement. */
2563
2564 static bool
2565 is_exit_with_zero_arg (const gimple *stmt)
2566 {
2567   /* This is not exit, _exit or _Exit. */
2568   if (!gimple_call_builtin_p (stmt, BUILT_IN_EXIT)
2569       && !gimple_call_builtin_p (stmt, BUILT_IN__EXIT)
2570       && !gimple_call_builtin_p (stmt, BUILT_IN__EXIT2))
2571     return false;
2572
2573   /* Argument is an interger zero. */
2574   return integer_zerop (gimple_call_arg (stmt, 0));
2575 }
2576
2577 /* Try to guess whether the value of return means error code.  */
2578
2579 static enum br_predictor
2580 return_prediction (tree val, enum prediction *prediction)
2581 {
2582   /* VOID.  */
2583   if (!val)
2584     return PRED_NO_PREDICTION;
2585   /* Different heuristics for pointers and scalars.  */
2586   if (POINTER_TYPE_P (TREE_TYPE (val)))
2587     {
2588       /* NULL is usually not returned.  */
2589       if (integer_zerop (val))
2590         {
2591           *prediction = NOT_TAKEN;
2592           return PRED_NULL_RETURN;
2593         }
2594     }
2595   else if (INTEGRAL_TYPE_P (TREE_TYPE (val)))
2596     {
2597       /* Negative return values are often used to indicate
2598          errors.  */
2599       if (TREE_CODE (val) == INTEGER_CST
2600           && tree_int_cst_sgn (val) < 0)
2601         {
2602           *prediction = NOT_TAKEN;
2603           return PRED_NEGATIVE_RETURN;
2604         }
2605       /* Constant return values seems to be commonly taken.
2606          Zero/one often represent booleans so exclude them from the
2607          heuristics.  */
2608       if (TREE_CONSTANT (val)
2609           && (!integer_zerop (val) && !integer_onep (val)))
2610         {
2611           *prediction = NOT_TAKEN;
2612           return PRED_CONST_RETURN;
2613         }
2614     }
2615   return PRED_NO_PREDICTION;
2616 }
2617
2618 /* Find the basic block with return expression and look up for possible
2619    return value trying to apply RETURN_PREDICTION heuristics.  */
2620 static void
2621 apply_return_prediction (void)
2622 {
2623   greturn *return_stmt = NULL;
2624   tree return_val;
2625   edge e;
2626   gphi *phi;
2627   int phi_num_args, i;
2628   enum br_predictor pred;
2629   enum prediction direction;
2630   edge_iterator ei;
2631
2632   FOR_EACH_EDGE (e, ei, EXIT_BLOCK_PTR_FOR_FN (cfun)->preds)
2633     {
2634       gimple *last = last_stmt (e->src);
2635       if (last
2636           && gimple_code (last) == GIMPLE_RETURN)
2637         {
2638           return_stmt = as_a <greturn *> (last);
2639           break;
2640         }
2641     }
2642   if (!e)
2643     return;
2644   return_val = gimple_return_retval (return_stmt);
2645   if (!return_val)
2646     return;
2647   if (TREE_CODE (return_val) != SSA_NAME
2648       || !SSA_NAME_DEF_STMT (return_val)
2649       || gimple_code (SSA_NAME_DEF_STMT (return_val)) != GIMPLE_PHI)
2650     return;
2651   phi = as_a <gphi *> (SSA_NAME_DEF_STMT (return_val));
2652   phi_num_args = gimple_phi_num_args (phi);
2653   pred = return_prediction (PHI_ARG_DEF (phi, 0), &direction);
2654
2655   /* Avoid the degenerate case where all return values form the function
2656      belongs to same category (ie they are all positive constants)
2657      so we can hardly say something about them.  */
2658   for (i = 1; i < phi_num_args; i++)
2659     if (pred != return_prediction (PHI_ARG_DEF (phi, i), &direction))
2660       break;
2661   if (i != phi_num_args)
2662     for (i = 0; i < phi_num_args; i++)
2663       {
2664         pred = return_prediction (PHI_ARG_DEF (phi, i), &direction);
2665         if (pred != PRED_NO_PREDICTION)
2666           predict_paths_leading_to_edge (gimple_phi_arg_edge (phi, i), pred,
2667                                          direction);
2668       }
2669 }
2670
2671 /* Look for basic block that contains unlikely to happen events
2672    (such as noreturn calls) and mark all paths leading to execution
2673    of this basic blocks as unlikely.  */
2674
2675 static void
2676 tree_bb_level_predictions (void)
2677 {
2678   basic_block bb;
2679   bool has_return_edges = false;
2680   edge e;
2681   edge_iterator ei;
2682
2683   FOR_EACH_EDGE (e, ei, EXIT_BLOCK_PTR_FOR_FN (cfun)->preds)
2684     if (!unlikely_executed_edge_p (e) && !(e->flags & EDGE_ABNORMAL_CALL))
2685       {
2686         has_return_edges = true;
2687         break;
2688       }
2689
2690   apply_return_prediction ();
2691
2692   FOR_EACH_BB_FN (bb, cfun)
2693     {
2694       gimple_stmt_iterator gsi;
2695
2696       for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
2697         {
2698           gimple *stmt = gsi_stmt (gsi);
2699           tree decl;
2700
2701           if (is_gimple_call (stmt))
2702             {
2703               if (gimple_call_noreturn_p (stmt)
2704                   && has_return_edges
2705                   && !is_exit_with_zero_arg (stmt))
2706                 predict_paths_leading_to (bb, PRED_NORETURN,
2707                                           NOT_TAKEN);
2708               decl = gimple_call_fndecl (stmt);
2709               if (decl
2710                   && lookup_attribute ("cold",
2711                                        DECL_ATTRIBUTES (decl)))
2712                 predict_paths_leading_to (bb, PRED_COLD_FUNCTION,
2713                                           NOT_TAKEN);
2714               if (decl && recursive_call_p (current_function_decl, decl))
2715                 predict_paths_leading_to (bb, PRED_RECURSIVE_CALL,
2716                                           NOT_TAKEN);
2717             }
2718           else if (gimple_code (stmt) == GIMPLE_PREDICT)
2719             {
2720               predict_paths_leading_to (bb, gimple_predict_predictor (stmt),
2721                                         gimple_predict_outcome (stmt));
2722               /* Keep GIMPLE_PREDICT around so early inlining will propagate
2723                  hints to callers.  */
2724             }
2725         }
2726     }
2727 }
2728
2729 /* Callback for hash_map::traverse, asserts that the pointer map is
2730    empty.  */
2731
2732 bool
2733 assert_is_empty (const_basic_block const &, edge_prediction *const &value,
2734                  void *)
2735 {
2736   gcc_assert (!value);
2737   return false;
2738 }
2739
2740 /* Predict branch probabilities and estimate profile for basic block BB.
2741    When LOCAL_ONLY is set do not use any global properties of CFG.  */
2742
2743 static void
2744 tree_estimate_probability_bb (basic_block bb, bool local_only)
2745 {
2746   edge e;
2747   edge_iterator ei;
2748
2749   FOR_EACH_EDGE (e, ei, bb->succs)
2750     {
2751       /* Look for block we are guarding (ie we dominate it,
2752          but it doesn't postdominate us).  */
2753       if (e->dest != EXIT_BLOCK_PTR_FOR_FN (cfun) && e->dest != bb
2754           && !local_only
2755           && dominated_by_p (CDI_DOMINATORS, e->dest, e->src)
2756           && !dominated_by_p (CDI_POST_DOMINATORS, e->src, e->dest))
2757         {
2758           gimple_stmt_iterator bi;
2759
2760           /* The call heuristic claims that a guarded function call
2761              is improbable.  This is because such calls are often used
2762              to signal exceptional situations such as printing error
2763              messages.  */
2764           for (bi = gsi_start_bb (e->dest); !gsi_end_p (bi);
2765                gsi_next (&bi))
2766             {
2767               gimple *stmt = gsi_stmt (bi);
2768               if (is_gimple_call (stmt)
2769                   && !gimple_inexpensive_call_p (as_a <gcall *>  (stmt))
2770                   /* Constant and pure calls are hardly used to signalize
2771                      something exceptional.  */
2772                   && gimple_has_side_effects (stmt))
2773                 {
2774                   if (gimple_call_fndecl (stmt))
2775                     predict_edge_def (e, PRED_CALL, NOT_TAKEN);
2776                   else if (virtual_method_call_p (gimple_call_fn (stmt)))
2777                     predict_edge_def (e, PRED_POLYMORPHIC_CALL, NOT_TAKEN);
2778                   else
2779                     predict_edge_def (e, PRED_INDIR_CALL, TAKEN);
2780                   break;
2781                 }
2782             }
2783         }
2784     }
2785   tree_predict_by_opcode (bb);
2786 }
2787
2788 /* Predict branch probabilities and estimate profile of the tree CFG.
2789    This function can be called from the loop optimizers to recompute
2790    the profile information.
2791    If DRY_RUN is set, do not modify CFG and only produce dump files.  */
2792
2793 void
2794 tree_estimate_probability (bool dry_run)
2795 {
2796   basic_block bb;
2797
2798   add_noreturn_fake_exit_edges ();
2799   connect_infinite_loops_to_exit ();
2800   /* We use loop_niter_by_eval, which requires that the loops have
2801      preheaders.  */
2802   create_preheaders (CP_SIMPLE_PREHEADERS);
2803   calculate_dominance_info (CDI_POST_DOMINATORS);
2804
2805   bb_predictions = new hash_map<const_basic_block, edge_prediction *>;
2806   tree_bb_level_predictions ();
2807   record_loop_exits ();
2808
2809   if (number_of_loops (cfun) > 1)
2810     predict_loops ();
2811
2812   FOR_EACH_BB_FN (bb, cfun)
2813     tree_estimate_probability_bb (bb, false);
2814
2815   FOR_EACH_BB_FN (bb, cfun)
2816     combine_predictions_for_bb (bb, dry_run);
2817
2818   if (flag_checking)
2819     bb_predictions->traverse<void *, assert_is_empty> (NULL);
2820
2821   delete bb_predictions;
2822   bb_predictions = NULL;
2823
2824   if (!dry_run)
2825     estimate_bb_frequencies (false);
2826   free_dominance_info (CDI_POST_DOMINATORS);
2827   remove_fake_exit_edges ();
2828 }
2829
2830 /* Set edge->probability for each successor edge of BB.  */
2831 void
2832 tree_guess_outgoing_edge_probabilities (basic_block bb)
2833 {
2834   bb_predictions = new hash_map<const_basic_block, edge_prediction *>;
2835   tree_estimate_probability_bb (bb, true);
2836   combine_predictions_for_bb (bb, false);
2837   if (flag_checking)
2838     bb_predictions->traverse<void *, assert_is_empty> (NULL);
2839   delete bb_predictions;
2840   bb_predictions = NULL;
2841 }
2842 \f
2843 /* Predict edges to successors of CUR whose sources are not postdominated by
2844    BB by PRED and recurse to all postdominators.  */
2845
2846 static void
2847 predict_paths_for_bb (basic_block cur, basic_block bb,
2848                       enum br_predictor pred,
2849                       enum prediction taken,
2850                       bitmap visited, struct loop *in_loop = NULL)
2851 {
2852   edge e;
2853   edge_iterator ei;
2854   basic_block son;
2855
2856   /* If we exited the loop or CUR is unconditional in the loop, there is
2857      nothing to do.  */
2858   if (in_loop
2859       && (!flow_bb_inside_loop_p (in_loop, cur)
2860           || dominated_by_p (CDI_DOMINATORS, in_loop->latch, cur)))
2861     return;
2862
2863   /* We are looking for all edges forming edge cut induced by
2864      set of all blocks postdominated by BB.  */
2865   FOR_EACH_EDGE (e, ei, cur->preds)
2866     if (e->src->index >= NUM_FIXED_BLOCKS
2867         && !dominated_by_p (CDI_POST_DOMINATORS, e->src, bb))
2868     {
2869       edge e2;
2870       edge_iterator ei2;
2871       bool found = false;
2872
2873       /* Ignore fake edges and eh, we predict them as not taken anyway.  */
2874       if (unlikely_executed_edge_p (e))
2875         continue;
2876       gcc_assert (bb == cur || dominated_by_p (CDI_POST_DOMINATORS, cur, bb));
2877
2878       /* See if there is an edge from e->src that is not abnormal
2879          and does not lead to BB and does not exit the loop.  */
2880       FOR_EACH_EDGE (e2, ei2, e->src->succs)
2881         if (e2 != e
2882             && !unlikely_executed_edge_p (e2)
2883             && !dominated_by_p (CDI_POST_DOMINATORS, e2->dest, bb)
2884             && (!in_loop || !loop_exit_edge_p (in_loop, e2)))
2885           {
2886             found = true;
2887             break;
2888           }
2889
2890       /* If there is non-abnormal path leaving e->src, predict edge
2891          using predictor.  Otherwise we need to look for paths
2892          leading to e->src.
2893
2894          The second may lead to infinite loop in the case we are predicitng
2895          regions that are only reachable by abnormal edges.  We simply
2896          prevent visiting given BB twice.  */
2897       if (found)
2898         {
2899           if (!edge_predicted_by_p (e, pred, taken))
2900             predict_edge_def (e, pred, taken);
2901         }
2902       else if (bitmap_set_bit (visited, e->src->index))
2903         predict_paths_for_bb (e->src, e->src, pred, taken, visited, in_loop);
2904     }
2905   for (son = first_dom_son (CDI_POST_DOMINATORS, cur);
2906        son;
2907        son = next_dom_son (CDI_POST_DOMINATORS, son))
2908     predict_paths_for_bb (son, bb, pred, taken, visited, in_loop);
2909 }
2910
2911 /* Sets branch probabilities according to PREDiction and
2912    FLAGS.  */
2913
2914 static void
2915 predict_paths_leading_to (basic_block bb, enum br_predictor pred,
2916                           enum prediction taken, struct loop *in_loop)
2917 {
2918   predict_paths_for_bb (bb, bb, pred, taken, auto_bitmap (), in_loop);
2919 }
2920
2921 /* Like predict_paths_leading_to but take edge instead of basic block.  */
2922
2923 static void
2924 predict_paths_leading_to_edge (edge e, enum br_predictor pred,
2925                                enum prediction taken, struct loop *in_loop)
2926 {
2927   bool has_nonloop_edge = false;
2928   edge_iterator ei;
2929   edge e2;
2930
2931   basic_block bb = e->src;
2932   FOR_EACH_EDGE (e2, ei, bb->succs)
2933     if (e2->dest != e->src && e2->dest != e->dest
2934         && !unlikely_executed_edge_p (e)
2935         && !dominated_by_p (CDI_POST_DOMINATORS, e->src, e2->dest))
2936       {
2937         has_nonloop_edge = true;
2938         break;
2939       }
2940   if (!has_nonloop_edge)
2941     {
2942       predict_paths_for_bb (bb, bb, pred, taken, auto_bitmap (), in_loop);
2943     }
2944   else
2945     predict_edge_def (e, pred, taken);
2946 }
2947 \f
2948 /* This is used to carry information about basic blocks.  It is
2949    attached to the AUX field of the standard CFG block.  */
2950
2951 struct block_info
2952 {
2953   /* Estimated frequency of execution of basic_block.  */
2954   sreal frequency;
2955
2956   /* To keep queue of basic blocks to process.  */
2957   basic_block next;
2958
2959   /* Number of predecessors we need to visit first.  */
2960   int npredecessors;
2961 };
2962
2963 /* Similar information for edges.  */
2964 struct edge_prob_info
2965 {
2966   /* In case edge is a loopback edge, the probability edge will be reached
2967      in case header is.  Estimated number of iterations of the loop can be
2968      then computed as 1 / (1 - back_edge_prob).  */
2969   sreal back_edge_prob;
2970   /* True if the edge is a loopback edge in the natural loop.  */
2971   unsigned int back_edge:1;
2972 };
2973
2974 #define BLOCK_INFO(B)   ((block_info *) (B)->aux)
2975 #undef EDGE_INFO
2976 #define EDGE_INFO(E)    ((edge_prob_info *) (E)->aux)
2977
2978 /* Helper function for estimate_bb_frequencies.
2979    Propagate the frequencies in blocks marked in
2980    TOVISIT, starting in HEAD.  */
2981
2982 static void
2983 propagate_freq (basic_block head, bitmap tovisit)
2984 {
2985   basic_block bb;
2986   basic_block last;
2987   unsigned i;
2988   edge e;
2989   basic_block nextbb;
2990   bitmap_iterator bi;
2991
2992   /* For each basic block we need to visit count number of his predecessors
2993      we need to visit first.  */
2994   EXECUTE_IF_SET_IN_BITMAP (tovisit, 0, i, bi)
2995     {
2996       edge_iterator ei;
2997       int count = 0;
2998
2999       bb = BASIC_BLOCK_FOR_FN (cfun, i);
3000
3001       FOR_EACH_EDGE (e, ei, bb->preds)
3002         {
3003           bool visit = bitmap_bit_p (tovisit, e->src->index);
3004
3005           if (visit && !(e->flags & EDGE_DFS_BACK))
3006             count++;
3007           else if (visit && dump_file && !EDGE_INFO (e)->back_edge)
3008             fprintf (dump_file,
3009                      "Irreducible region hit, ignoring edge to %i->%i\n",
3010                      e->src->index, bb->index);
3011         }
3012       BLOCK_INFO (bb)->npredecessors = count;
3013       /* When function never returns, we will never process exit block.  */
3014       if (!count && bb == EXIT_BLOCK_PTR_FOR_FN (cfun))
3015         {
3016           bb->count = profile_count::zero ();
3017           bb->frequency = 0;
3018         }
3019     }
3020
3021   BLOCK_INFO (head)->frequency = 1;
3022   last = head;
3023   for (bb = head; bb; bb = nextbb)
3024     {
3025       edge_iterator ei;
3026       sreal cyclic_probability = 0;
3027       sreal frequency = 0;
3028
3029       nextbb = BLOCK_INFO (bb)->next;
3030       BLOCK_INFO (bb)->next = NULL;
3031
3032       /* Compute frequency of basic block.  */
3033       if (bb != head)
3034         {
3035           if (flag_checking)
3036             FOR_EACH_EDGE (e, ei, bb->preds)
3037               gcc_assert (!bitmap_bit_p (tovisit, e->src->index)
3038                           || (e->flags & EDGE_DFS_BACK));
3039
3040           FOR_EACH_EDGE (e, ei, bb->preds)
3041             if (EDGE_INFO (e)->back_edge)
3042               {
3043                 cyclic_probability += EDGE_INFO (e)->back_edge_prob;
3044               }
3045             else if (!(e->flags & EDGE_DFS_BACK))
3046               {
3047                 /*  frequency += (e->probability
3048                                   * BLOCK_INFO (e->src)->frequency /
3049                                   REG_BR_PROB_BASE);  */
3050
3051                 sreal tmp = e->probability.to_reg_br_prob_base ();
3052                 tmp *= BLOCK_INFO (e->src)->frequency;
3053                 tmp *= real_inv_br_prob_base;
3054                 frequency += tmp;
3055               }
3056
3057           if (cyclic_probability == 0)
3058             {
3059               BLOCK_INFO (bb)->frequency = frequency;
3060             }
3061           else
3062             {
3063               if (cyclic_probability > real_almost_one)
3064                 cyclic_probability = real_almost_one;
3065
3066               /* BLOCK_INFO (bb)->frequency = frequency
3067                                               / (1 - cyclic_probability) */
3068
3069               cyclic_probability = sreal (1) - cyclic_probability;
3070               BLOCK_INFO (bb)->frequency = frequency / cyclic_probability;
3071             }
3072         }
3073
3074       bitmap_clear_bit (tovisit, bb->index);
3075
3076       e = find_edge (bb, head);
3077       if (e)
3078         {
3079           /* EDGE_INFO (e)->back_edge_prob
3080              = ((e->probability * BLOCK_INFO (bb)->frequency)
3081              / REG_BR_PROB_BASE); */
3082
3083           sreal tmp = e->probability.to_reg_br_prob_base ();
3084           tmp *= BLOCK_INFO (bb)->frequency;
3085           EDGE_INFO (e)->back_edge_prob = tmp * real_inv_br_prob_base;
3086         }
3087
3088       /* Propagate to successor blocks.  */
3089       FOR_EACH_EDGE (e, ei, bb->succs)
3090         if (!(e->flags & EDGE_DFS_BACK)
3091             && BLOCK_INFO (e->dest)->npredecessors)
3092           {
3093             BLOCK_INFO (e->dest)->npredecessors--;
3094             if (!BLOCK_INFO (e->dest)->npredecessors)
3095               {
3096                 if (!nextbb)
3097                   nextbb = e->dest;
3098                 else
3099                   BLOCK_INFO (last)->next = e->dest;
3100
3101                 last = e->dest;
3102               }
3103           }
3104     }
3105 }
3106
3107 /* Estimate frequencies in loops at same nest level.  */
3108
3109 static void
3110 estimate_loops_at_level (struct loop *first_loop)
3111 {
3112   struct loop *loop;
3113
3114   for (loop = first_loop; loop; loop = loop->next)
3115     {
3116       edge e;
3117       basic_block *bbs;
3118       unsigned i;
3119       auto_bitmap tovisit;
3120
3121       estimate_loops_at_level (loop->inner);
3122
3123       /* Find current loop back edge and mark it.  */
3124       e = loop_latch_edge (loop);
3125       EDGE_INFO (e)->back_edge = 1;
3126
3127       bbs = get_loop_body (loop);
3128       for (i = 0; i < loop->num_nodes; i++)
3129         bitmap_set_bit (tovisit, bbs[i]->index);
3130       free (bbs);
3131       propagate_freq (loop->header, tovisit);
3132     }
3133 }
3134
3135 /* Propagates frequencies through structure of loops.  */
3136
3137 static void
3138 estimate_loops (void)
3139 {
3140   auto_bitmap tovisit;
3141   basic_block bb;
3142
3143   /* Start by estimating the frequencies in the loops.  */
3144   if (number_of_loops (cfun) > 1)
3145     estimate_loops_at_level (current_loops->tree_root->inner);
3146
3147   /* Now propagate the frequencies through all the blocks.  */
3148   FOR_ALL_BB_FN (bb, cfun)
3149     {
3150       bitmap_set_bit (tovisit, bb->index);
3151     }
3152   propagate_freq (ENTRY_BLOCK_PTR_FOR_FN (cfun), tovisit);
3153 }
3154
3155 /* Drop the profile for NODE to guessed, and update its frequency based on
3156    whether it is expected to be hot given the CALL_COUNT.  */
3157
3158 static void
3159 drop_profile (struct cgraph_node *node, profile_count call_count)
3160 {
3161   struct function *fn = DECL_STRUCT_FUNCTION (node->decl);
3162   /* In the case where this was called by another function with a
3163      dropped profile, call_count will be 0. Since there are no
3164      non-zero call counts to this function, we don't know for sure
3165      whether it is hot, and therefore it will be marked normal below.  */
3166   bool hot = maybe_hot_count_p (NULL, call_count);
3167
3168   if (dump_file)
3169     fprintf (dump_file,
3170              "Dropping 0 profile for %s. %s based on calls.\n",
3171              node->dump_name (),
3172              hot ? "Function is hot" : "Function is normal");
3173   /* We only expect to miss profiles for functions that are reached
3174      via non-zero call edges in cases where the function may have
3175      been linked from another module or library (COMDATs and extern
3176      templates). See the comments below for handle_missing_profiles.
3177      Also, only warn in cases where the missing counts exceed the
3178      number of training runs. In certain cases with an execv followed
3179      by a no-return call the profile for the no-return call is not
3180      dumped and there can be a mismatch.  */
3181   if (!DECL_COMDAT (node->decl) && !DECL_EXTERNAL (node->decl)
3182       && call_count > profile_info->runs)
3183     {
3184       if (flag_profile_correction)
3185         {
3186           if (dump_file)
3187             fprintf (dump_file,
3188                      "Missing counts for called function %s\n",
3189                      node->dump_name ());
3190         }
3191       else
3192         warning (0, "Missing counts for called function %s",
3193                  node->dump_name ());
3194     }
3195
3196   basic_block bb;
3197   FOR_ALL_BB_FN (bb, fn)
3198     {
3199       bb->count = profile_count::uninitialized ();
3200
3201       edge_iterator ei;
3202       edge e;
3203       FOR_EACH_EDGE (e, ei, bb->preds)
3204         e->count = profile_count::uninitialized ();
3205     }
3206
3207   struct cgraph_edge *e;
3208   for (e = node->callees; e; e = e->next_caller)
3209     {
3210       e->count = profile_count::uninitialized ();
3211       e->frequency = compute_call_stmt_bb_frequency (e->caller->decl,
3212                                                      gimple_bb (e->call_stmt));
3213     }
3214   node->count = profile_count::uninitialized ();
3215
3216   profile_status_for_fn (fn)
3217       = (flag_guess_branch_prob ? PROFILE_GUESSED : PROFILE_ABSENT);
3218   node->frequency
3219       = hot ? NODE_FREQUENCY_HOT : NODE_FREQUENCY_NORMAL;
3220 }
3221
3222 /* In the case of COMDAT routines, multiple object files will contain the same
3223    function and the linker will select one for the binary. In that case
3224    all the other copies from the profile instrument binary will be missing
3225    profile counts. Look for cases where this happened, due to non-zero
3226    call counts going to 0-count functions, and drop the profile to guessed
3227    so that we can use the estimated probabilities and avoid optimizing only
3228    for size.
3229
3230    The other case where the profile may be missing is when the routine
3231    is not going to be emitted to the object file, e.g. for "extern template"
3232    class methods. Those will be marked DECL_EXTERNAL. Emit a warning in
3233    all other cases of non-zero calls to 0-count functions.  */
3234
3235 void
3236 handle_missing_profiles (void)
3237 {
3238   struct cgraph_node *node;
3239   int unlikely_count_fraction = PARAM_VALUE (UNLIKELY_BB_COUNT_FRACTION);
3240   auto_vec<struct cgraph_node *, 64> worklist;
3241
3242   /* See if 0 count function has non-0 count callers.  In this case we
3243      lost some profile.  Drop its function profile to PROFILE_GUESSED.  */
3244   FOR_EACH_DEFINED_FUNCTION (node)
3245     {
3246       struct cgraph_edge *e;
3247       profile_count call_count = profile_count::zero ();
3248       gcov_type max_tp_first_run = 0;
3249       struct function *fn = DECL_STRUCT_FUNCTION (node->decl);
3250
3251       if (!(node->count == profile_count::zero ()))
3252         continue;
3253       for (e = node->callers; e; e = e->next_caller)
3254         if (e->count.initialized_p () && e->count > 0)
3255           {
3256             call_count = call_count + e->count;
3257
3258             if (e->caller->tp_first_run > max_tp_first_run)
3259               max_tp_first_run = e->caller->tp_first_run;
3260           }
3261
3262       /* If time profile is missing, let assign the maximum that comes from
3263          caller functions.  */
3264       if (!node->tp_first_run && max_tp_first_run)
3265         node->tp_first_run = max_tp_first_run + 1;
3266
3267       if (call_count > 0
3268           && fn && fn->cfg
3269           && (call_count.apply_scale (unlikely_count_fraction, 1)
3270               >= profile_info->runs))
3271         {
3272           drop_profile (node, call_count);
3273           worklist.safe_push (node);
3274         }
3275     }
3276
3277   /* Propagate the profile dropping to other 0-count COMDATs that are
3278      potentially called by COMDATs we already dropped the profile on.  */
3279   while (worklist.length () > 0)
3280     {
3281       struct cgraph_edge *e;
3282
3283       node = worklist.pop ();
3284       for (e = node->callees; e; e = e->next_caller)
3285         {
3286           struct cgraph_node *callee = e->callee;
3287           struct function *fn = DECL_STRUCT_FUNCTION (callee->decl);
3288
3289           if (callee->count > 0)
3290             continue;
3291           if ((DECL_COMDAT (callee->decl) || DECL_EXTERNAL (callee->decl))
3292               && fn && fn->cfg
3293               && profile_status_for_fn (fn) == PROFILE_READ)
3294             {
3295               drop_profile (node, profile_count::zero ());
3296               worklist.safe_push (callee);
3297             }
3298         }
3299     }
3300 }
3301
3302 /* Convert counts measured by profile driven feedback to frequencies.
3303    Return nonzero iff there was any nonzero execution count.  */
3304
3305 bool
3306 counts_to_freqs (void)
3307 {
3308   gcov_type count_max;
3309   profile_count true_count_max = profile_count::zero ();
3310   basic_block bb;
3311
3312   /* Don't overwrite the estimated frequencies when the profile for
3313      the function is missing.  We may drop this function PROFILE_GUESSED
3314      later in drop_profile ().  */
3315   if (!ENTRY_BLOCK_PTR_FOR_FN (cfun)->count.initialized_p ()
3316       || ENTRY_BLOCK_PTR_FOR_FN (cfun)->count == profile_count::zero ())
3317     return false;
3318
3319   FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (cfun), NULL, next_bb)
3320     if (bb->count > true_count_max)
3321       true_count_max = bb->count;
3322
3323   /* If we have no counts to base frequencies on, keep those that are
3324      already there.  */
3325   if (!(true_count_max > 0))
3326     return false;
3327
3328   count_max = true_count_max.to_gcov_type ();
3329
3330   FOR_ALL_BB_FN (bb, cfun)
3331     if (bb->count.initialized_p ())
3332       bb->frequency = RDIV (bb->count.to_gcov_type () * BB_FREQ_MAX, count_max);
3333
3334   return true;
3335 }
3336
3337 /* Return true if function is likely to be expensive, so there is no point to
3338    optimize performance of prologue, epilogue or do inlining at the expense
3339    of code size growth.  THRESHOLD is the limit of number of instructions
3340    function can execute at average to be still considered not expensive.  */
3341
3342 bool
3343 expensive_function_p (int threshold)
3344 {
3345   unsigned int sum = 0;
3346   basic_block bb;
3347   unsigned int limit;
3348
3349   /* We can not compute accurately for large thresholds due to scaled
3350      frequencies.  */
3351   gcc_assert (threshold <= BB_FREQ_MAX);
3352
3353   /* Frequencies are out of range.  This either means that function contains
3354      internal loop executing more than BB_FREQ_MAX times or profile feedback
3355      is available and function has not been executed at all.  */
3356   if (ENTRY_BLOCK_PTR_FOR_FN (cfun)->frequency == 0)
3357     return true;
3358
3359   /* Maximally BB_FREQ_MAX^2 so overflow won't happen.  */
3360   limit = ENTRY_BLOCK_PTR_FOR_FN (cfun)->frequency * threshold;
3361   FOR_EACH_BB_FN (bb, cfun)
3362     {
3363       rtx_insn *insn;
3364
3365       FOR_BB_INSNS (bb, insn)
3366         if (active_insn_p (insn))
3367           {
3368             sum += bb->frequency;
3369             if (sum > limit)
3370               return true;
3371         }
3372     }
3373
3374   return false;
3375 }
3376
3377 /* All basic blocks that are reachable only from unlikely basic blocks are
3378    unlikely.  */
3379
3380 void
3381 propagate_unlikely_bbs_forward (void)
3382 {
3383   auto_vec<basic_block, 64> worklist;
3384   basic_block bb;
3385   edge_iterator ei;
3386   edge e;
3387
3388   if (!(ENTRY_BLOCK_PTR_FOR_FN (cfun)->count == profile_count::zero ()))
3389     {
3390       ENTRY_BLOCK_PTR_FOR_FN (cfun)->aux = (void *)(size_t) 1;
3391       worklist.safe_push (ENTRY_BLOCK_PTR_FOR_FN (cfun));
3392
3393       while (worklist.length () > 0)
3394         {
3395           bb = worklist.pop ();
3396           FOR_EACH_EDGE (e, ei, bb->succs)
3397             if (!(e->count == profile_count::zero ())
3398                 && !(e->dest->count == profile_count::zero ())
3399                 && !e->dest->aux)
3400               {
3401                 e->dest->aux = (void *)(size_t) 1;
3402                 worklist.safe_push (e->dest);
3403               }
3404         }
3405     }
3406
3407   FOR_ALL_BB_FN (bb, cfun)
3408     {
3409       if (!bb->aux)
3410         {
3411           if (!(bb->count == profile_count::zero ())
3412               && (dump_file && (dump_flags & TDF_DETAILS)))
3413             fprintf (dump_file,
3414                      "Basic block %i is marked unlikely by forward prop\n",
3415                      bb->index);
3416           bb->count = profile_count::zero ();
3417           bb->frequency = 0;
3418           FOR_EACH_EDGE (e, ei, bb->succs)
3419             e->count = profile_count::zero ();
3420         }
3421       else
3422         bb->aux = NULL;
3423     }
3424 }
3425
3426 /* Determine basic blocks/edges that are known to be unlikely executed and set
3427    their counters to zero.
3428    This is done with first identifying obviously unlikely BBs/edges and then
3429    propagating in both directions.  */
3430
3431 static void
3432 determine_unlikely_bbs ()
3433 {
3434   basic_block bb;
3435   auto_vec<basic_block, 64> worklist;
3436   edge_iterator ei;
3437   edge e;
3438
3439   FOR_EACH_BB_FN (bb, cfun)
3440     {
3441       if (!(bb->count == profile_count::zero ())
3442           && unlikely_executed_bb_p (bb))
3443         {
3444           if (dump_file && (dump_flags & TDF_DETAILS))
3445             fprintf (dump_file, "Basic block %i is locally unlikely\n",
3446                      bb->index);
3447           bb->count = profile_count::zero ();
3448         }
3449
3450       if (bb->count == profile_count::zero ())
3451         {
3452           bb->frequency = 0;
3453           FOR_EACH_EDGE (e, ei, bb->preds)
3454             e->count = profile_count::zero ();
3455         }
3456
3457       FOR_EACH_EDGE (e, ei, bb->succs)
3458         if (!(e->count == profile_count::zero ())
3459             && unlikely_executed_edge_p (e))
3460           {
3461             if (dump_file && (dump_flags & TDF_DETAILS))
3462               fprintf (dump_file, "Edge %i->%i is locally unlikely\n",
3463                        bb->index, e->dest->index);
3464             e->count = profile_count::zero ();
3465           }
3466
3467       gcc_checking_assert (!bb->aux);
3468     }
3469
3470   auto_vec<int, 64> nsuccs;
3471   nsuccs.safe_grow_cleared (last_basic_block_for_fn (cfun));
3472   FOR_ALL_BB_FN (bb, cfun)
3473     if (!(bb->count == profile_count::zero ())
3474         && bb != EXIT_BLOCK_PTR_FOR_FN (cfun))
3475       {
3476         nsuccs[bb->index] = 0;
3477         FOR_EACH_EDGE (e, ei, bb->succs)
3478           if (!(e->count == profile_count::zero ()))
3479             nsuccs[bb->index]++;
3480         if (!nsuccs[bb->index])
3481           worklist.safe_push (bb);
3482       }
3483   while (worklist.length () > 0)
3484     {
3485       bb = worklist.pop ();
3486       if (bb != ENTRY_BLOCK_PTR_FOR_FN (cfun))
3487         {
3488           bool found = false;
3489           for (gimple_stmt_iterator gsi = gsi_start_bb (bb);
3490                !gsi_end_p (gsi); gsi_next (&gsi))
3491             if (stmt_can_terminate_bb_p (gsi_stmt (gsi))
3492                 /* stmt_can_terminate_bb_p special cases noreturns because it
3493                    assumes that fake edges are created.  We want to know that
3494                    noreturn alone does not imply BB to be unlikely.  */
3495                 || (is_gimple_call (gsi_stmt (gsi))
3496                     && (gimple_call_flags (gsi_stmt (gsi)) & ECF_NORETURN)))
3497               {
3498                 found = true;
3499                 break;
3500               }
3501           if (found)
3502             continue;
3503         }
3504       if (!(bb->count == profile_count::zero ())
3505           && (dump_file && (dump_flags & TDF_DETAILS)))
3506         fprintf (dump_file,
3507                  "Basic block %i is marked unlikely by backward prop\n",
3508                  bb->index);
3509       bb->count = profile_count::zero ();
3510       bb->frequency = 0;
3511       FOR_EACH_EDGE (e, ei, bb->preds)
3512         if (!(e->count == profile_count::zero ()))
3513           {
3514             e->count = profile_count::zero ();
3515             if (!(e->src->count == profile_count::zero ()))
3516               {
3517                 nsuccs[e->src->index]--;
3518                 if (!nsuccs[e->src->index])
3519                   worklist.safe_push (e->src);
3520               }
3521           }
3522     }
3523 }
3524
3525 /* Estimate and propagate basic block frequencies using the given branch
3526    probabilities.  If FORCE is true, the frequencies are used to estimate
3527    the counts even when there are already non-zero profile counts.  */
3528
3529 void
3530 estimate_bb_frequencies (bool force)
3531 {
3532   basic_block bb;
3533   sreal freq_max;
3534
3535   determine_unlikely_bbs ();
3536
3537   if (force || profile_status_for_fn (cfun) != PROFILE_READ
3538       || !counts_to_freqs ())
3539     {
3540       static int real_values_initialized = 0;
3541
3542       if (!real_values_initialized)
3543         {
3544           real_values_initialized = 1;
3545           real_br_prob_base = REG_BR_PROB_BASE;
3546           real_bb_freq_max = BB_FREQ_MAX;
3547           real_one_half = sreal (1, -1);
3548           real_inv_br_prob_base = sreal (1) / real_br_prob_base;
3549           real_almost_one = sreal (1) - real_inv_br_prob_base;
3550         }
3551
3552       mark_dfs_back_edges ();
3553
3554       single_succ_edge (ENTRY_BLOCK_PTR_FOR_FN (cfun))->probability =
3555          profile_probability::always ();
3556
3557       /* Set up block info for each basic block.  */
3558       alloc_aux_for_blocks (sizeof (block_info));
3559       alloc_aux_for_edges (sizeof (edge_prob_info));
3560       FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (cfun), NULL, next_bb)
3561         {
3562           edge e;
3563           edge_iterator ei;
3564
3565           FOR_EACH_EDGE (e, ei, bb->succs)
3566             {
3567               EDGE_INFO (e)->back_edge_prob
3568                  = e->probability.to_reg_br_prob_base ();
3569               EDGE_INFO (e)->back_edge_prob *= real_inv_br_prob_base;
3570             }
3571         }
3572
3573       /* First compute frequencies locally for each loop from innermost
3574          to outermost to examine frequencies for back edges.  */
3575       estimate_loops ();
3576
3577       freq_max = 0;
3578       FOR_EACH_BB_FN (bb, cfun)
3579         if (freq_max < BLOCK_INFO (bb)->frequency)
3580           freq_max = BLOCK_INFO (bb)->frequency;
3581
3582       freq_max = real_bb_freq_max / freq_max;
3583       FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (cfun), NULL, next_bb)
3584         {
3585           sreal tmp = BLOCK_INFO (bb)->frequency * freq_max + real_one_half;
3586           bb->frequency = tmp.to_int ();
3587         }
3588
3589       free_aux_for_blocks ();
3590       free_aux_for_edges ();
3591     }
3592   compute_function_frequency ();
3593 }
3594
3595 /* Decide whether function is hot, cold or unlikely executed.  */
3596 void
3597 compute_function_frequency (void)
3598 {
3599   basic_block bb;
3600   struct cgraph_node *node = cgraph_node::get (current_function_decl);
3601
3602   if (DECL_STATIC_CONSTRUCTOR (current_function_decl)
3603       || MAIN_NAME_P (DECL_NAME (current_function_decl)))
3604     node->only_called_at_startup = true;
3605   if (DECL_STATIC_DESTRUCTOR (current_function_decl))
3606     node->only_called_at_exit = true;
3607
3608   if (profile_status_for_fn (cfun) != PROFILE_READ)
3609     {
3610       int flags = flags_from_decl_or_type (current_function_decl);
3611       if (ENTRY_BLOCK_PTR_FOR_FN (cfun)->count == profile_count::zero ()
3612           || lookup_attribute ("cold", DECL_ATTRIBUTES (current_function_decl))
3613              != NULL)
3614         node->frequency = NODE_FREQUENCY_UNLIKELY_EXECUTED;
3615       else if (lookup_attribute ("hot", DECL_ATTRIBUTES (current_function_decl))
3616                != NULL)
3617         node->frequency = NODE_FREQUENCY_HOT;
3618       else if (flags & ECF_NORETURN)
3619         node->frequency = NODE_FREQUENCY_EXECUTED_ONCE;
3620       else if (MAIN_NAME_P (DECL_NAME (current_function_decl)))
3621         node->frequency = NODE_FREQUENCY_EXECUTED_ONCE;
3622       else if (DECL_STATIC_CONSTRUCTOR (current_function_decl)
3623                || DECL_STATIC_DESTRUCTOR (current_function_decl))
3624         node->frequency = NODE_FREQUENCY_EXECUTED_ONCE;
3625       return;
3626     }
3627
3628   /* Only first time try to drop function into unlikely executed.
3629      After inlining the roundoff errors may confuse us.
3630      Ipa-profile pass will drop functions only called from unlikely
3631      functions to unlikely and that is most of what we care about.  */
3632   if (!cfun->after_inlining)
3633     node->frequency = NODE_FREQUENCY_UNLIKELY_EXECUTED;
3634   FOR_EACH_BB_FN (bb, cfun)
3635     {
3636       if (maybe_hot_bb_p (cfun, bb))
3637         {
3638           node->frequency = NODE_FREQUENCY_HOT;
3639           return;
3640         }
3641       if (!probably_never_executed_bb_p (cfun, bb))
3642         node->frequency = NODE_FREQUENCY_NORMAL;
3643     }
3644 }
3645
3646 /* Build PREDICT_EXPR.  */
3647 tree
3648 build_predict_expr (enum br_predictor predictor, enum prediction taken)
3649 {
3650   tree t = build1 (PREDICT_EXPR, void_type_node,
3651                    build_int_cst (integer_type_node, predictor));
3652   SET_PREDICT_EXPR_OUTCOME (t, taken);
3653   return t;
3654 }
3655
3656 const char *
3657 predictor_name (enum br_predictor predictor)
3658 {
3659   return predictor_info[predictor].name;
3660 }
3661
3662 /* Predict branch probabilities and estimate profile of the tree CFG. */
3663
3664 namespace {
3665
3666 const pass_data pass_data_profile =
3667 {
3668   GIMPLE_PASS, /* type */
3669   "profile_estimate", /* name */
3670   OPTGROUP_NONE, /* optinfo_flags */
3671   TV_BRANCH_PROB, /* tv_id */
3672   PROP_cfg, /* properties_required */
3673   0, /* properties_provided */
3674   0, /* properties_destroyed */
3675   0, /* todo_flags_start */
3676   0, /* todo_flags_finish */
3677 };
3678
3679 class pass_profile : public gimple_opt_pass
3680 {
3681 public:
3682   pass_profile (gcc::context *ctxt)
3683     : gimple_opt_pass (pass_data_profile, ctxt)
3684   {}
3685
3686   /* opt_pass methods: */
3687   virtual bool gate (function *) { return flag_guess_branch_prob; }
3688   virtual unsigned int execute (function *);
3689
3690 }; // class pass_profile
3691
3692 unsigned int
3693 pass_profile::execute (function *fun)
3694 {
3695   unsigned nb_loops;
3696
3697   if (profile_status_for_fn (cfun) == PROFILE_GUESSED)
3698     return 0;
3699
3700   loop_optimizer_init (LOOPS_NORMAL);
3701   if (dump_file && (dump_flags & TDF_DETAILS))
3702     flow_loops_dump (dump_file, NULL, 0);
3703
3704   mark_irreducible_loops ();
3705
3706   nb_loops = number_of_loops (fun);
3707   if (nb_loops > 1)
3708     scev_initialize ();
3709
3710   tree_estimate_probability (false);
3711
3712   if (nb_loops > 1)
3713     scev_finalize ();
3714
3715   loop_optimizer_finalize ();
3716   if (dump_file && (dump_flags & TDF_DETAILS))
3717     gimple_dump_cfg (dump_file, dump_flags);
3718  if (profile_status_for_fn (fun) == PROFILE_ABSENT)
3719     profile_status_for_fn (fun) = PROFILE_GUESSED;
3720  if (dump_file && (dump_flags & TDF_DETAILS))
3721    {
3722      struct loop *loop;
3723      FOR_EACH_LOOP (loop, LI_FROM_INNERMOST)
3724        if (loop->header->frequency)
3725          fprintf (dump_file, "Loop got predicted %d to iterate %i times.\n",
3726            loop->num,
3727            (int)expected_loop_iterations_unbounded (loop));
3728    }
3729   return 0;
3730 }
3731
3732 } // anon namespace
3733
3734 gimple_opt_pass *
3735 make_pass_profile (gcc::context *ctxt)
3736 {
3737   return new pass_profile (ctxt);
3738 }
3739
3740 namespace {
3741
3742 const pass_data pass_data_strip_predict_hints =
3743 {
3744   GIMPLE_PASS, /* type */
3745   "*strip_predict_hints", /* name */
3746   OPTGROUP_NONE, /* optinfo_flags */
3747   TV_BRANCH_PROB, /* tv_id */
3748   PROP_cfg, /* properties_required */
3749   0, /* properties_provided */
3750   0, /* properties_destroyed */
3751   0, /* todo_flags_start */
3752   0, /* todo_flags_finish */
3753 };
3754
3755 class pass_strip_predict_hints : public gimple_opt_pass
3756 {
3757 public:
3758   pass_strip_predict_hints (gcc::context *ctxt)
3759     : gimple_opt_pass (pass_data_strip_predict_hints, ctxt)
3760   {}
3761
3762   /* opt_pass methods: */
3763   opt_pass * clone () { return new pass_strip_predict_hints (m_ctxt); }
3764   virtual unsigned int execute (function *);
3765
3766 }; // class pass_strip_predict_hints
3767
3768 /* Get rid of all builtin_expect calls and GIMPLE_PREDICT statements
3769    we no longer need.  */
3770 unsigned int
3771 pass_strip_predict_hints::execute (function *fun)
3772 {
3773   basic_block bb;
3774   gimple *ass_stmt;
3775   tree var;
3776   bool changed = false;
3777
3778   FOR_EACH_BB_FN (bb, fun)
3779     {
3780       gimple_stmt_iterator bi;
3781       for (bi = gsi_start_bb (bb); !gsi_end_p (bi);)
3782         {
3783           gimple *stmt = gsi_stmt (bi);
3784
3785           if (gimple_code (stmt) == GIMPLE_PREDICT)
3786             {
3787               gsi_remove (&bi, true);
3788               changed = true;
3789               continue;
3790             }
3791           else if (is_gimple_call (stmt))
3792             {
3793               tree fndecl = gimple_call_fndecl (stmt);
3794
3795               if ((fndecl
3796                    && DECL_BUILT_IN_CLASS (fndecl) == BUILT_IN_NORMAL
3797                    && DECL_FUNCTION_CODE (fndecl) == BUILT_IN_EXPECT
3798                    && gimple_call_num_args (stmt) == 2)
3799                   || (gimple_call_internal_p (stmt)
3800                       && gimple_call_internal_fn (stmt) == IFN_BUILTIN_EXPECT))
3801                 {
3802                   var = gimple_call_lhs (stmt);
3803                   changed = true;
3804                   if (var)
3805                     {
3806                       ass_stmt
3807                         = gimple_build_assign (var, gimple_call_arg (stmt, 0));
3808                       gsi_replace (&bi, ass_stmt, true);
3809                     }
3810                   else
3811                     {
3812                       gsi_remove (&bi, true);
3813                       continue;
3814                     }
3815                 }
3816             }
3817           gsi_next (&bi);
3818         }
3819     }
3820   return changed ? TODO_cleanup_cfg : 0;
3821 }
3822
3823 } // anon namespace
3824
3825 gimple_opt_pass *
3826 make_pass_strip_predict_hints (gcc::context *ctxt)
3827 {
3828   return new pass_strip_predict_hints (ctxt);
3829 }
3830
3831 /* Rebuild function frequencies.  Passes are in general expected to
3832    maintain profile by hand, however in some cases this is not possible:
3833    for example when inlining several functions with loops freuqencies might run
3834    out of scale and thus needs to be recomputed.  */
3835
3836 void
3837 rebuild_frequencies (void)
3838 {
3839   timevar_push (TV_REBUILD_FREQUENCIES);
3840
3841   /* When the max bb count in the function is small, there is a higher
3842      chance that there were truncation errors in the integer scaling
3843      of counts by inlining and other optimizations. This could lead
3844      to incorrect classification of code as being cold when it isn't.
3845      In that case, force the estimation of bb counts/frequencies from the
3846      branch probabilities, rather than computing frequencies from counts,
3847      which may also lead to frequencies incorrectly reduced to 0. There
3848      is less precision in the probabilities, so we only do this for small
3849      max counts.  */
3850   profile_count count_max = profile_count::zero ();
3851   basic_block bb;
3852   FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (cfun), NULL, next_bb)
3853     if (bb->count > count_max)
3854       count_max = bb->count;
3855
3856   if (profile_status_for_fn (cfun) == PROFILE_GUESSED
3857       || (!flag_auto_profile && profile_status_for_fn (cfun) == PROFILE_READ
3858           && count_max < REG_BR_PROB_BASE / 10))
3859     {
3860       loop_optimizer_init (0);
3861       add_noreturn_fake_exit_edges ();
3862       mark_irreducible_loops ();
3863       connect_infinite_loops_to_exit ();
3864       estimate_bb_frequencies (true);
3865       remove_fake_exit_edges ();
3866       loop_optimizer_finalize ();
3867     }
3868   else if (profile_status_for_fn (cfun) == PROFILE_READ)
3869     counts_to_freqs ();
3870   else
3871     gcc_unreachable ();
3872   timevar_pop (TV_REBUILD_FREQUENCIES);
3873 }
3874
3875 /* Perform a dry run of the branch prediction pass and report comparsion of
3876    the predicted and real profile into the dump file.  */
3877
3878 void
3879 report_predictor_hitrates (void)
3880 {
3881   unsigned nb_loops;
3882
3883   loop_optimizer_init (LOOPS_NORMAL);
3884   if (dump_file && (dump_flags & TDF_DETAILS))
3885     flow_loops_dump (dump_file, NULL, 0);
3886
3887   mark_irreducible_loops ();
3888
3889   nb_loops = number_of_loops (cfun);
3890   if (nb_loops > 1)
3891     scev_initialize ();
3892
3893   tree_estimate_probability (true);
3894
3895   if (nb_loops > 1)
3896     scev_finalize ();
3897
3898   loop_optimizer_finalize ();
3899 }
3900
3901 /* Force edge E to be cold.
3902    If IMPOSSIBLE is true, for edge to have count and probability 0 otherwise
3903    keep low probability to represent possible error in a guess.  This is used
3904    i.e. in case we predict loop to likely iterate given number of times but
3905    we are not 100% sure.
3906
3907    This function locally updates profile without attempt to keep global
3908    consistency which can not be reached in full generality without full profile
3909    rebuild from probabilities alone.  Doing so is not necessarily a good idea
3910    because frequencies and counts may be more realistic then probabilities.
3911
3912    In some cases (such as for elimination of early exits during full loop
3913    unrolling) the caller can ensure that profile will get consistent
3914    afterwards.  */
3915
3916 void
3917 force_edge_cold (edge e, bool impossible)
3918 {
3919   profile_count count_sum = profile_count::zero ();
3920   profile_probability prob_sum = profile_probability::never ();
3921   edge_iterator ei;
3922   edge e2;
3923   profile_count old_count = e->count;
3924   profile_probability old_probability = e->probability;
3925   bool uninitialized_exit = false;
3926
3927   profile_probability goal = (impossible ? profile_probability::never ()
3928                               : profile_probability::very_unlikely ());
3929
3930   /* If edge is already improbably or cold, just return.  */
3931   if (e->probability <= goal
3932       && (!impossible || e->count == profile_count::zero ()))
3933     return;
3934   FOR_EACH_EDGE (e2, ei, e->src->succs)
3935     if (e2 != e)
3936       {
3937         if (e2->count.initialized_p ())
3938           count_sum += e2->count;
3939         else
3940           uninitialized_exit = true;
3941         if (e2->probability.initialized_p ())
3942           prob_sum += e2->probability;
3943       }
3944
3945   /* If there are other edges out of e->src, redistribute probabilitity
3946      there.  */
3947   if (prob_sum > profile_probability::never ())
3948     {
3949       if (!(e->probability < goal))
3950         e->probability = goal;
3951       if (impossible)
3952         e->count = profile_count::zero ();
3953       else if (old_probability > profile_probability::never ())
3954         e->count = e->count.apply_probability (e->probability
3955                                                / old_probability);
3956       else
3957         e->count = e->count.apply_scale (1, REG_BR_PROB_BASE);
3958
3959       profile_probability prob_comp = prob_sum / e->probability.invert ();
3960
3961       if (dump_file && (dump_flags & TDF_DETAILS))
3962         fprintf (dump_file, "Making edge %i->%i %s by redistributing "
3963                  "probability to other edges.\n",
3964                  e->src->index, e->dest->index,
3965                  impossible ? "impossible" : "cold");
3966       profile_count count_sum2 = count_sum + old_count - e->count;
3967       FOR_EACH_EDGE (e2, ei, e->src->succs)
3968         if (e2 != e)
3969           {
3970             if (count_sum > 0)
3971               e2->count.apply_scale (count_sum2, count_sum);
3972             e2->probability /= prob_comp;
3973           }
3974       if (current_ir_type () != IR_GIMPLE
3975           && e->src != ENTRY_BLOCK_PTR_FOR_FN (cfun))
3976         update_br_prob_note (e->src);
3977     }
3978   /* If all edges out of e->src are unlikely, the basic block itself
3979      is unlikely.  */
3980   else
3981     {
3982       if (prob_sum == profile_probability::never ())
3983         e->probability = profile_probability::always ();
3984       else
3985         {
3986           if (impossible)
3987             e->probability = profile_probability::never ();
3988           /* If BB has some edges out that are not impossible, we can not
3989              assume that BB itself is.  */
3990           impossible = false;
3991         }
3992       if (current_ir_type () != IR_GIMPLE
3993           && e->src != ENTRY_BLOCK_PTR_FOR_FN (cfun))
3994         update_br_prob_note (e->src);
3995       if (e->src->count == profile_count::zero ())
3996         return;
3997       if (count_sum == profile_count::zero () && !uninitialized_exit
3998           && impossible)
3999         {
4000           bool found = false;
4001           if (e->src == ENTRY_BLOCK_PTR_FOR_FN (cfun))
4002             ;
4003           else if (current_ir_type () == IR_GIMPLE)
4004             for (gimple_stmt_iterator gsi = gsi_start_bb (e->src);
4005                  !gsi_end_p (gsi); gsi_next (&gsi))
4006               {
4007                 if (stmt_can_terminate_bb_p (gsi_stmt (gsi)))
4008                   {
4009                     found = true;
4010                     break;
4011                   }
4012               }
4013           /* FIXME: Implement RTL path.  */
4014           else
4015             found = true;
4016           if (!found)
4017             {
4018               if (dump_file && (dump_flags & TDF_DETAILS))
4019                 fprintf (dump_file,
4020                          "Making bb %i impossible and dropping count to 0.\n",
4021                          e->src->index);
4022               e->count = profile_count::zero ();
4023               e->src->count = profile_count::zero ();
4024               FOR_EACH_EDGE (e2, ei, e->src->preds)
4025                 force_edge_cold (e2, impossible);
4026               return;
4027             }
4028         }
4029
4030       /* If we did not adjusting, the source basic block has no likely edeges
4031          leaving other direction. In that case force that bb cold, too.
4032          This in general is difficult task to do, but handle special case when
4033          BB has only one predecestor.  This is common case when we are updating
4034          after loop transforms.  */
4035       if (!(prob_sum > profile_probability::never ())
4036           && count_sum == profile_count::zero ()
4037           && single_pred_p (e->src) && e->src->frequency > (impossible ? 0 : 1))
4038         {
4039           int old_frequency = e->src->frequency;
4040           if (dump_file && (dump_flags & TDF_DETAILS))
4041             fprintf (dump_file, "Making bb %i %s.\n", e->src->index,
4042                      impossible ? "impossible" : "cold");
4043           e->src->frequency = MIN (e->src->frequency, impossible ? 0 : 1);
4044           if (impossible)
4045             e->src->count = e->count = profile_count::zero ();
4046           else
4047             e->src->count = e->count = e->count.apply_scale (e->src->frequency,
4048                                                              old_frequency);
4049           force_edge_cold (single_pred_edge (e->src), impossible);
4050         }
4051       else if (dump_file && (dump_flags & TDF_DETAILS)
4052                && maybe_hot_bb_p (cfun, e->src))
4053         fprintf (dump_file, "Giving up on making bb %i %s.\n", e->src->index,
4054                  impossible ? "impossible" : "cold");
4055     }
4056 }
4057
4058 #if CHECKING_P
4059
4060 namespace selftest {
4061
4062 /* Test that value range of predictor values defined in predict.def is
4063    within range (50, 100].  */
4064
4065 struct branch_predictor
4066 {
4067   const char *name;
4068   unsigned probability;
4069 };
4070
4071 #define DEF_PREDICTOR(ENUM, NAME, HITRATE, FLAGS) { NAME, HITRATE },
4072
4073 static void
4074 test_prediction_value_range ()
4075 {
4076   branch_predictor predictors[] = {
4077 #include "predict.def"
4078     {NULL, -1U}
4079   };
4080
4081   for (unsigned i = 0; predictors[i].name != NULL; i++)
4082     {
4083       unsigned p = 100 * predictors[i].probability / REG_BR_PROB_BASE;
4084       ASSERT_TRUE (p > 50 && p <= 100);
4085     }
4086 }
4087
4088 #undef DEF_PREDICTOR
4089
4090 /* Run all of the selfests within this file.  */
4091
4092 void
4093 predict_c_tests ()
4094 {
4095   test_prediction_value_range ();
4096 }
4097
4098 } // namespace selftest
4099 #endif /* CHECKING_P.  */