main/gcc/predict.c

   1 /* Branch prediction routines for the GNU compiler.
   2    Copyright (C) 2000-2014 Free Software Foundation, Inc.
   3
   4 This file is part of GCC.
   5
   6 GCC is free software; you can redistribute it and/or modify it under
   7 the terms of the GNU General Public License as published by the Free
   8 Software Foundation; either version 3, or (at your option) any later
   9 version.
  10
  11 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  13 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  14 for more details.
  15
  16 You should have received a copy of the GNU General Public License
  17 along with GCC; see the file COPYING3.  If not see
  18 <http://www.gnu.org/licenses/>.  */
  19
  20 /* References:
  21
  22    [1] "Branch Prediction for Free"
  23        Ball and Larus; PLDI '93.
  24    [2] "Static Branch Frequency and Program Profile Analysis"
  25        Wu and Larus; MICRO-27.
  26    [3] "Corpus-based Static Branch Prediction"
  27        Calder, Grunwald, Lindsay, Martin, Mozer, and Zorn; PLDI '95.  */
  28
  29
  30 #include "config.h"
  31 #include "system.h"
  32 #include "coretypes.h"
  33 #include "tm.h"
  34 #include "tree.h"
  35 #include "calls.h"
  36 #include "rtl.h"
  37 #include "tm_p.h"
  38 #include "hard-reg-set.h"
  39 #include "basic-block.h"
  40 #include "insn-config.h"
  41 #include "regs.h"
  42 #include "flags.h"
  43 #include "function.h"
  44 #include "except.h"
  45 #include "diagnostic-core.h"
  46 #include "recog.h"
  47 #include "expr.h"
  48 #include "predict.h"
  49 #include "coverage.h"
  50 #include "sreal.h"
  51 #include "params.h"
  52 #include "target.h"
  53 #include "cfgloop.h"
  54 #include "pointer-set.h"
  55 #include "tree-ssa-alias.h"
  56 #include "internal-fn.h"
  57 #include "gimple-expr.h"
  58 #include "is-a.h"
  59 #include "gimple.h"
  60 #include "gimple-iterator.h"
  61 #include "gimple-ssa.h"
  62 #include "cgraph.h"
  63 #include "tree-cfg.h"
  64 #include "tree-phinodes.h"
  65 #include "ssa-iterators.h"
  66 #include "tree-ssa-loop-niter.h"
  67 #include "tree-ssa-loop.h"
  68 #include "tree-pass.h"
  69 #include "tree-scalar-evolution.h"
  70 #include "cfgloop.h"
  71
  72 /* real constants: 0, 1, 1-1/REG_BR_PROB_BASE, REG_BR_PROB_BASE,
  73                    1/REG_BR_PROB_BASE, 0.5, BB_FREQ_MAX.  */
  74 static sreal real_zero, real_one, real_almost_one, real_br_prob_base,
  75              real_inv_br_prob_base, real_one_half, real_bb_freq_max;
  76
  77 static void combine_predictions_for_insn (rtx, basic_block);
  78 static void dump_prediction (FILE *, enum br_predictor, int, basic_block, int);
  79 static void predict_paths_leading_to (basic_block, enum br_predictor, enum prediction);
  80 static void predict_paths_leading_to_edge (edge, enum br_predictor, enum prediction);
  81 static bool can_predict_insn_p (const_rtx);
  82
  83 /* Information we hold about each branch predictor.
  84    Filled using information from predict.def.  */
  85
  86 struct predictor_info
  87 {
  88   const char *const name;       /* Name used in the debugging dumps.  */
  89   const int hitrate;            /* Expected hitrate used by
  90                                    predict_insn_def call.  */
  91   const int flags;
  92 };
  93
  94 /* Use given predictor without Dempster-Shaffer theory if it matches
  95    using first_match heuristics.  */
  96 #define PRED_FLAG_FIRST_MATCH 1
  97
  98 /* Recompute hitrate in percent to our representation.  */
  99
 100 #define HITRATE(VAL) ((int) ((VAL) * REG_BR_PROB_BASE + 50) / 100)
 101
 102 #define DEF_PREDICTOR(ENUM, NAME, HITRATE, FLAGS) {NAME, HITRATE, FLAGS},
 103 static const struct predictor_info predictor_info[]= {
 104 #include "predict.def"
 105
 106   /* Upper bound on predictors.  */
 107   {NULL, 0, 0}
 108 };
 109 #undef DEF_PREDICTOR
 110
 111 /* Return TRUE if frequency FREQ is considered to be hot.  */
 112
 113 static inline bool
 114 maybe_hot_frequency_p (struct function *fun, int freq)
 115 {
 116   struct cgraph_node *node = cgraph_get_node (fun->decl);
 117   if (!profile_info || !flag_branch_probabilities)
 118     {
 119       if (node->frequency == NODE_FREQUENCY_UNLIKELY_EXECUTED)
 120         return false;
 121       if (node->frequency == NODE_FREQUENCY_HOT)
 122         return true;
 123     }
 124   if (profile_status_for_fn (fun) == PROFILE_ABSENT)
 125     return true;
 126   if (node->frequency == NODE_FREQUENCY_EXECUTED_ONCE
 127       && freq < (ENTRY_BLOCK_PTR_FOR_FN (fun)->frequency * 2 / 3))
 128     return false;
 129   if (PARAM_VALUE (HOT_BB_FREQUENCY_FRACTION) == 0)
 130     return false;
 131   if (freq < (ENTRY_BLOCK_PTR_FOR_FN (fun)->frequency
 132               / PARAM_VALUE (HOT_BB_FREQUENCY_FRACTION)))
 133     return false;
 134   return true;
 135 }
 136
 137 static gcov_type min_count = -1;
 138
 139 /* Determine the threshold for hot BB counts.  */
 140
 141 gcov_type
 142 get_hot_bb_threshold ()
 143 {
 144   gcov_working_set_t *ws;
 145   if (min_count == -1)
 146     {
 147       ws = find_working_set (PARAM_VALUE (HOT_BB_COUNT_WS_PERMILLE));
 148       gcc_assert (ws);
 149       min_count = ws->min_counter;
 150     }
 151   return min_count;
 152 }
 153
 154 /* Set the threshold for hot BB counts.  */
 155
 156 void
 157 set_hot_bb_threshold (gcov_type min)
 158 {
 159   min_count = min;
 160 }
 161
 162 /* Return TRUE if frequency FREQ is considered to be hot.  */
 163
 164 bool
 165 maybe_hot_count_p (struct function *fun, gcov_type count)
 166 {
 167   if (fun && profile_status_for_fn (fun) != PROFILE_READ)
 168     return true;
 169   if (!profile_info)
 170     return false;
 171   /* Code executed at most once is not hot.  */
 172   if (profile_info->runs >= count)
 173     return false;
 174   return (count >= get_hot_bb_threshold ());
 175 }
 176
 177 /* Return true in case BB can be CPU intensive and should be optimized
 178    for maximal performance.  */
 179
 180 bool
 181 maybe_hot_bb_p (struct function *fun, const_basic_block bb)
 182 {
 183   gcc_checking_assert (fun);
 184   if (profile_status_for_fn (fun) == PROFILE_READ)
 185     return maybe_hot_count_p (fun, bb->count);
 186   return maybe_hot_frequency_p (fun, bb->frequency);
 187 }
 188
 189 /* Return true if the call can be hot.  */
 190
 191 bool
 192 cgraph_maybe_hot_edge_p (struct cgraph_edge *edge)
 193 {
 194   if (profile_info && flag_branch_probabilities
 195       && !maybe_hot_count_p (NULL,
 196                              edge->count))
 197     return false;
 198   if (edge->caller->frequency == NODE_FREQUENCY_UNLIKELY_EXECUTED
 199       || (edge->callee
 200           && edge->callee->frequency == NODE_FREQUENCY_UNLIKELY_EXECUTED))
 201     return false;
 202   if (edge->caller->frequency > NODE_FREQUENCY_UNLIKELY_EXECUTED
 203       && (edge->callee
 204           && edge->callee->frequency <= NODE_FREQUENCY_EXECUTED_ONCE))
 205     return false;
 206   if (optimize_size)
 207     return false;
 208   if (edge->caller->frequency == NODE_FREQUENCY_HOT)
 209     return true;
 210   if (edge->caller->frequency == NODE_FREQUENCY_EXECUTED_ONCE
 211       && edge->frequency < CGRAPH_FREQ_BASE * 3 / 2)
 212     return false;
 213   if (flag_guess_branch_prob)
 214     {
 215       if (PARAM_VALUE (HOT_BB_FREQUENCY_FRACTION) == 0
 216           || edge->frequency <= (CGRAPH_FREQ_BASE
 217                                  / PARAM_VALUE (HOT_BB_FREQUENCY_FRACTION)))
 218         return false;
 219     }
 220   return true;
 221 }
 222
 223 /* Return true in case BB can be CPU intensive and should be optimized
 224    for maximal performance.  */
 225
 226 bool
 227 maybe_hot_edge_p (edge e)
 228 {
 229   if (profile_status_for_fn (cfun) == PROFILE_READ)
 230     return maybe_hot_count_p (cfun, e->count);
 231   return maybe_hot_frequency_p (cfun, EDGE_FREQUENCY (e));
 232 }
 233
 234
 235
 236 /* Return true if profile COUNT and FREQUENCY, or function FUN static
 237    node frequency reflects never being executed.  */
 238
 239 static bool
 240 probably_never_executed (struct function *fun,
 241                          gcov_type count, int frequency)
 242 {
 243   gcc_checking_assert (fun);
 244   if (profile_status_for_fn (cfun) == PROFILE_READ)
 245     {
 246       int unlikely_count_fraction = PARAM_VALUE (UNLIKELY_BB_COUNT_FRACTION);
 247       if (count * unlikely_count_fraction >= profile_info->runs)
 248         return false;
 249       if (!frequency)
 250         return true;
 251       if (!ENTRY_BLOCK_PTR_FOR_FN (cfun)->frequency)
 252         return false;
 253       if (ENTRY_BLOCK_PTR_FOR_FN (cfun)->count)
 254         {
 255           gcov_type computed_count;
 256           /* Check for possibility of overflow, in which case entry bb count
 257              is large enough to do the division first without losing much
 258              precision.  */
 259           if (ENTRY_BLOCK_PTR_FOR_FN (cfun)->count < REG_BR_PROB_BASE *
 260               REG_BR_PROB_BASE)
 261             {
 262               gcov_type scaled_count
 263                   = frequency * ENTRY_BLOCK_PTR_FOR_FN (cfun)->count *
 264              unlikely_count_fraction;
 265               computed_count = RDIV (scaled_count,
 266                                      ENTRY_BLOCK_PTR_FOR_FN (cfun)->frequency);
 267             }
 268           else
 269             {
 270               computed_count = RDIV (ENTRY_BLOCK_PTR_FOR_FN (cfun)->count,
 271                                      ENTRY_BLOCK_PTR_FOR_FN (cfun)->frequency);
 272               computed_count *= frequency * unlikely_count_fraction;
 273             }
 274           if (computed_count >= profile_info->runs)
 275             return false;
 276         }
 277       return true;
 278     }
 279   if ((!profile_info || !flag_branch_probabilities)
 280       && (cgraph_get_node (fun->decl)->frequency
 281           == NODE_FREQUENCY_UNLIKELY_EXECUTED))
 282     return true;
 283   return false;
 284 }
 285
 286
 287 /* Return true in case BB is probably never executed.  */
 288
 289 bool
 290 probably_never_executed_bb_p (struct function *fun, const_basic_block bb)
 291 {
 292   return probably_never_executed (fun, bb->count, bb->frequency);
 293 }
 294
 295
 296 /* Return true in case edge E is probably never executed.  */
 297
 298 bool
 299 probably_never_executed_edge_p (struct function *fun, edge e)
 300 {
 301   return probably_never_executed (fun, e->count, EDGE_FREQUENCY (e));
 302 }
 303
 304 /* Return true if NODE should be optimized for size.  */
 305
 306 bool
 307 cgraph_optimize_for_size_p (struct cgraph_node *node)
 308 {
 309   if (optimize_size)
 310     return true;
 311   if (node && (node->frequency == NODE_FREQUENCY_UNLIKELY_EXECUTED))
 312     return true;
 313   else
 314     return false;
 315 }
 316
 317 /* Return true when current function should always be optimized for size.  */
 318
 319 bool
 320 optimize_function_for_size_p (struct function *fun)
 321 {
 322   if (optimize_size)
 323     return true;
 324   if (!fun || !fun->decl)
 325     return false;
 326   return cgraph_optimize_for_size_p (cgraph_get_node (fun->decl));
 327 }
 328
 329 /* Return true when current function should always be optimized for speed.  */
 330
 331 bool
 332 optimize_function_for_speed_p (struct function *fun)
 333 {
 334   return !optimize_function_for_size_p (fun);
 335 }
 336
 337 /* Return TRUE when BB should be optimized for size.  */
 338
 339 bool
 340 optimize_bb_for_size_p (const_basic_block bb)
 341 {
 342   return optimize_function_for_size_p (cfun) || !maybe_hot_bb_p (cfun, bb);
 343 }
 344
 345 /* Return TRUE when BB should be optimized for speed.  */
 346
 347 bool
 348 optimize_bb_for_speed_p (const_basic_block bb)
 349 {
 350   return !optimize_bb_for_size_p (bb);
 351 }
 352
 353 /* Return TRUE when BB should be optimized for size.  */
 354
 355 bool
 356 optimize_edge_for_size_p (edge e)
 357 {
 358   return optimize_function_for_size_p (cfun) || !maybe_hot_edge_p (e);
 359 }
 360
 361 /* Return TRUE when BB should be optimized for speed.  */
 362
 363 bool
 364 optimize_edge_for_speed_p (edge e)
 365 {
 366   return !optimize_edge_for_size_p (e);
 367 }
 368
 369 /* Return TRUE when BB should be optimized for size.  */
 370
 371 bool
 372 optimize_insn_for_size_p (void)
 373 {
 374   return optimize_function_for_size_p (cfun) || !crtl->maybe_hot_insn_p;
 375 }
 376
 377 /* Return TRUE when BB should be optimized for speed.  */
 378
 379 bool
 380 optimize_insn_for_speed_p (void)
 381 {
 382   return !optimize_insn_for_size_p ();
 383 }
 384
 385 /* Return TRUE when LOOP should be optimized for size.  */
 386
 387 bool
 388 optimize_loop_for_size_p (struct loop *loop)
 389 {
 390   return optimize_bb_for_size_p (loop->header);
 391 }
 392
 393 /* Return TRUE when LOOP should be optimized for speed.  */
 394
 395 bool
 396 optimize_loop_for_speed_p (struct loop *loop)
 397 {
 398   return optimize_bb_for_speed_p (loop->header);
 399 }
 400
 401 /* Return TRUE when LOOP nest should be optimized for speed.  */
 402
 403 bool
 404 optimize_loop_nest_for_speed_p (struct loop *loop)
 405 {
 406   struct loop *l = loop;
 407   if (optimize_loop_for_speed_p (loop))
 408     return true;
 409   l = loop->inner;
 410   while (l && l != loop)
 411     {
 412       if (optimize_loop_for_speed_p (l))
 413         return true;
 414       if (l->inner)
 415         l = l->inner;
 416       else if (l->next)
 417         l = l->next;
 418       else
 419         {
 420           while (l != loop && !l->next)
 421             l = loop_outer (l);
 422           if (l != loop)
 423             l = l->next;
 424         }
 425     }
 426   return false;
 427 }
 428
 429 /* Return TRUE when LOOP nest should be optimized for size.  */
 430
 431 bool
 432 optimize_loop_nest_for_size_p (struct loop *loop)
 433 {
 434   return !optimize_loop_nest_for_speed_p (loop);
 435 }
 436
 437 /* Return true when edge E is likely to be well predictable by branch
 438    predictor.  */
 439
 440 bool
 441 predictable_edge_p (edge e)
 442 {
 443   if (profile_status_for_fn (cfun) == PROFILE_ABSENT)
 444     return false;
 445   if ((e->probability
 446        <= PARAM_VALUE (PARAM_PREDICTABLE_BRANCH_OUTCOME) * REG_BR_PROB_BASE / 100)
 447       || (REG_BR_PROB_BASE - e->probability
 448           <= PARAM_VALUE (PARAM_PREDICTABLE_BRANCH_OUTCOME) * REG_BR_PROB_BASE / 100))
 449     return true;
 450   return false;
 451 }
 452
 453
 454 /* Set RTL expansion for BB profile.  */
 455
 456 void
 457 rtl_profile_for_bb (basic_block bb)
 458 {
 459   crtl->maybe_hot_insn_p = maybe_hot_bb_p (cfun, bb);
 460 }
 461
 462 /* Set RTL expansion for edge profile.  */
 463
 464 void
 465 rtl_profile_for_edge (edge e)
 466 {
 467   crtl->maybe_hot_insn_p = maybe_hot_edge_p (e);
 468 }
 469
 470 /* Set RTL expansion to default mode (i.e. when profile info is not known).  */
 471 void
 472 default_rtl_profile (void)
 473 {
 474   crtl->maybe_hot_insn_p = true;
 475 }
 476
 477 /* Return true if the one of outgoing edges is already predicted by
 478    PREDICTOR.  */
 479
 480 bool
 481 rtl_predicted_by_p (const_basic_block bb, enum br_predictor predictor)
 482 {
 483   rtx note;
 484   if (!INSN_P (BB_END (bb)))
 485     return false;
 486   for (note = REG_NOTES (BB_END (bb)); note; note = XEXP (note, 1))
 487     if (REG_NOTE_KIND (note) == REG_BR_PRED
 488         && INTVAL (XEXP (XEXP (note, 0), 0)) == (int)predictor)
 489       return true;
 490   return false;
 491 }
 492
 493 /* This map contains for a basic block the list of predictions for the
 494    outgoing edges.  */
 495
 496 static struct pointer_map_t *bb_predictions;
 497
 498 /*  Structure representing predictions in tree level. */
 499
 500 struct edge_prediction {
 501     struct edge_prediction *ep_next;
 502     edge ep_edge;
 503     enum br_predictor ep_predictor;
 504     int ep_probability;
 505 };
 506
 507 /* Return true if the one of outgoing edges is already predicted by
 508    PREDICTOR.  */
 509
 510 bool
 511 gimple_predicted_by_p (const_basic_block bb, enum br_predictor predictor)
 512 {
 513   struct edge_prediction *i;
 514   void **preds = pointer_map_contains (bb_predictions, bb);
 515
 516   if (!preds)
 517     return false;
 518
 519   for (i = (struct edge_prediction *) *preds; i; i = i->ep_next)
 520     if (i->ep_predictor == predictor)
 521       return true;
 522   return false;
 523 }
 524
 525 /* Return true when the probability of edge is reliable.
 526
 527    The profile guessing code is good at predicting branch outcome (ie.
 528    taken/not taken), that is predicted right slightly over 75% of time.
 529    It is however notoriously poor on predicting the probability itself.
 530    In general the profile appear a lot flatter (with probabilities closer
 531    to 50%) than the reality so it is bad idea to use it to drive optimization
 532    such as those disabling dynamic branch prediction for well predictable
 533    branches.
 534
 535    There are two exceptions - edges leading to noreturn edges and edges
 536    predicted by number of iterations heuristics are predicted well.  This macro
 537    should be able to distinguish those, but at the moment it simply check for
 538    noreturn heuristic that is only one giving probability over 99% or bellow
 539    1%.  In future we might want to propagate reliability information across the
 540    CFG if we find this information useful on multiple places.   */
 541 static bool
 542 probability_reliable_p (int prob)
 543 {
 544   return (profile_status_for_fn (cfun) == PROFILE_READ
 545           || (profile_status_for_fn (cfun) == PROFILE_GUESSED
 546               && (prob <= HITRATE (1) || prob >= HITRATE (99))));
 547 }
 548
 549 /* Same predicate as above, working on edges.  */
 550 bool
 551 edge_probability_reliable_p (const_edge e)
 552 {
 553   return probability_reliable_p (e->probability);
 554 }
 555
 556 /* Same predicate as edge_probability_reliable_p, working on notes.  */
 557 bool
 558 br_prob_note_reliable_p (const_rtx note)
 559 {
 560   gcc_assert (REG_NOTE_KIND (note) == REG_BR_PROB);
 561   return probability_reliable_p (XINT (note, 0));
 562 }
 563
 564 static void
 565 predict_insn (rtx insn, enum br_predictor predictor, int probability)
 566 {
 567   gcc_assert (any_condjump_p (insn));
 568   if (!flag_guess_branch_prob)
 569     return;
 570
 571   add_reg_note (insn, REG_BR_PRED,
 572                 gen_rtx_CONCAT (VOIDmode,
 573                                 GEN_INT ((int) predictor),
 574                                 GEN_INT ((int) probability)));
 575 }
 576
 577 /* Predict insn by given predictor.  */
 578
 579 void
 580 predict_insn_def (rtx insn, enum br_predictor predictor,
 581                   enum prediction taken)
 582 {
 583    int probability = predictor_info[(int) predictor].hitrate;
 584
 585    if (taken != TAKEN)
 586      probability = REG_BR_PROB_BASE - probability;
 587
 588    predict_insn (insn, predictor, probability);
 589 }
 590
 591 /* Predict edge E with given probability if possible.  */
 592
 593 void
 594 rtl_predict_edge (edge e, enum br_predictor predictor, int probability)
 595 {
 596   rtx last_insn;
 597   last_insn = BB_END (e->src);
 598
 599   /* We can store the branch prediction information only about
 600      conditional jumps.  */
 601   if (!any_condjump_p (last_insn))
 602     return;
 603
 604   /* We always store probability of branching.  */
 605   if (e->flags & EDGE_FALLTHRU)
 606     probability = REG_BR_PROB_BASE - probability;
 607
 608   predict_insn (last_insn, predictor, probability);
 609 }
 610
 611 /* Predict edge E with the given PROBABILITY.  */
 612 void
 613 gimple_predict_edge (edge e, enum br_predictor predictor, int probability)
 614 {
 615   gcc_assert (profile_status_for_fn (cfun) != PROFILE_GUESSED);
 616   if ((e->src != ENTRY_BLOCK_PTR_FOR_FN (cfun) && EDGE_COUNT (e->src->succs) >
 617        1)
 618       && flag_guess_branch_prob && optimize)
 619     {
 620       struct edge_prediction *i = XNEW (struct edge_prediction);
 621       void **preds = pointer_map_insert (bb_predictions, e->src);
 622
 623       i->ep_next = (struct edge_prediction *) *preds;
 624       *preds = i;
 625       i->ep_probability = probability;
 626       i->ep_predictor = predictor;
 627       i->ep_edge = e;
 628     }
 629 }
 630
 631 /* Remove all predictions on given basic block that are attached
 632    to edge E.  */
 633 void
 634 remove_predictions_associated_with_edge (edge e)
 635 {
 636   void **preds;
 637
 638   if (!bb_predictions)
 639     return;
 640
 641   preds = pointer_map_contains (bb_predictions, e->src);
 642
 643   if (preds)
 644     {
 645       struct edge_prediction **prediction = (struct edge_prediction **) preds;
 646       struct edge_prediction *next;
 647
 648       while (*prediction)
 649         {
 650           if ((*prediction)->ep_edge == e)
 651             {
 652               next = (*prediction)->ep_next;
 653               free (*prediction);
 654               *prediction = next;
 655             }
 656           else
 657             prediction = &((*prediction)->ep_next);
 658         }
 659     }
 660 }
 661
 662 /* Clears the list of predictions stored for BB.  */
 663
 664 static void
 665 clear_bb_predictions (basic_block bb)
 666 {
 667   void **preds = pointer_map_contains (bb_predictions, bb);
 668   struct edge_prediction *pred, *next;
 669
 670   if (!preds)
 671     return;
 672
 673   for (pred = (struct edge_prediction *) *preds; pred; pred = next)
 674     {
 675       next = pred->ep_next;
 676       free (pred);
 677     }
 678   *preds = NULL;
 679 }
 680
 681 /* Return true when we can store prediction on insn INSN.
 682    At the moment we represent predictions only on conditional
 683    jumps, not at computed jump or other complicated cases.  */
 684 static bool
 685 can_predict_insn_p (const_rtx insn)
 686 {
 687   return (JUMP_P (insn)
 688           && any_condjump_p (insn)
 689           && EDGE_COUNT (BLOCK_FOR_INSN (insn)->succs) >= 2);
 690 }
 691
 692 /* Predict edge E by given predictor if possible.  */
 693
 694 void
 695 predict_edge_def (edge e, enum br_predictor predictor,
 696                   enum prediction taken)
 697 {
 698    int probability = predictor_info[(int) predictor].hitrate;
 699
 700    if (taken != TAKEN)
 701      probability = REG_BR_PROB_BASE - probability;
 702
 703    predict_edge (e, predictor, probability);
 704 }
 705
 706 /* Invert all branch predictions or probability notes in the INSN.  This needs
 707    to be done each time we invert the condition used by the jump.  */
 708
 709 void
 710 invert_br_probabilities (rtx insn)
 711 {
 712   rtx note;
 713
 714   for (note = REG_NOTES (insn); note; note = XEXP (note, 1))
 715     if (REG_NOTE_KIND (note) == REG_BR_PROB)
 716       XINT (note, 0) = REG_BR_PROB_BASE - XINT (note, 0);
 717     else if (REG_NOTE_KIND (note) == REG_BR_PRED)
 718       XEXP (XEXP (note, 0), 1)
 719         = GEN_INT (REG_BR_PROB_BASE - INTVAL (XEXP (XEXP (note, 0), 1)));
 720 }
 721
 722 /* Dump information about the branch prediction to the output file.  */
 723
 724 static void
 725 dump_prediction (FILE *file, enum br_predictor predictor, int probability,
 726                  basic_block bb, int used)
 727 {
 728   edge e;
 729   edge_iterator ei;
 730
 731   if (!file)
 732     return;
 733
 734   FOR_EACH_EDGE (e, ei, bb->succs)
 735     if (! (e->flags & EDGE_FALLTHRU))
 736       break;
 737
 738   fprintf (file, "  %s heuristics%s: %.1f%%",
 739            predictor_info[predictor].name,
 740            used ? "" : " (ignored)", probability * 100.0 / REG_BR_PROB_BASE);
 741
 742   if (bb->count)
 743     {
 744       fprintf (file, "  exec ");
 745       fprintf (file, HOST_WIDEST_INT_PRINT_DEC, bb->count);
 746       if (e)
 747         {
 748           fprintf (file, " hit ");
 749           fprintf (file, HOST_WIDEST_INT_PRINT_DEC, e->count);
 750           fprintf (file, " (%.1f%%)", e->count * 100.0 / bb->count);
 751         }
 752     }
 753
 754   fprintf (file, "\n");
 755 }
 756
 757 /* We can not predict the probabilities of outgoing edges of bb.  Set them
 758    evenly and hope for the best.  */
 759 static void
 760 set_even_probabilities (basic_block bb)
 761 {
 762   int nedges = 0;
 763   edge e;
 764   edge_iterator ei;
 765
 766   FOR_EACH_EDGE (e, ei, bb->succs)
 767     if (!(e->flags & (EDGE_EH | EDGE_FAKE)))
 768       nedges ++;
 769   FOR_EACH_EDGE (e, ei, bb->succs)
 770     if (!(e->flags & (EDGE_EH | EDGE_FAKE)))
 771       e->probability = (REG_BR_PROB_BASE + nedges / 2) / nedges;
 772     else
 773       e->probability = 0;
 774 }
 775
 776 /* Combine all REG_BR_PRED notes into single probability and attach REG_BR_PROB
 777    note if not already present.  Remove now useless REG_BR_PRED notes.  */
 778
 779 static void
 780 combine_predictions_for_insn (rtx insn, basic_block bb)
 781 {
 782   rtx prob_note;
 783   rtx *pnote;
 784   rtx note;
 785   int best_probability = PROB_EVEN;
 786   enum br_predictor best_predictor = END_PREDICTORS;
 787   int combined_probability = REG_BR_PROB_BASE / 2;
 788   int d;
 789   bool first_match = false;
 790   bool found = false;
 791
 792   if (!can_predict_insn_p (insn))
 793     {
 794       set_even_probabilities (bb);
 795       return;
 796     }
 797
 798   prob_note = find_reg_note (insn, REG_BR_PROB, 0);
 799   pnote = &REG_NOTES (insn);
 800   if (dump_file)
 801     fprintf (dump_file, "Predictions for insn %i bb %i\n", INSN_UID (insn),
 802              bb->index);
 803
 804   /* We implement "first match" heuristics and use probability guessed
 805      by predictor with smallest index.  */
 806   for (note = REG_NOTES (insn); note; note = XEXP (note, 1))
 807     if (REG_NOTE_KIND (note) == REG_BR_PRED)
 808       {
 809         enum br_predictor predictor = ((enum br_predictor)
 810                                        INTVAL (XEXP (XEXP (note, 0), 0)));
 811         int probability = INTVAL (XEXP (XEXP (note, 0), 1));
 812
 813         found = true;
 814         if (best_predictor > predictor)
 815           best_probability = probability, best_predictor = predictor;
 816
 817         d = (combined_probability * probability
 818              + (REG_BR_PROB_BASE - combined_probability)
 819              * (REG_BR_PROB_BASE - probability));
 820
 821         /* Use FP math to avoid overflows of 32bit integers.  */
 822         if (d == 0)
 823           /* If one probability is 0% and one 100%, avoid division by zero.  */
 824           combined_probability = REG_BR_PROB_BASE / 2;
 825         else
 826           combined_probability = (((double) combined_probability) * probability
 827                                   * REG_BR_PROB_BASE / d + 0.5);
 828       }
 829
 830   /* Decide which heuristic to use.  In case we didn't match anything,
 831      use no_prediction heuristic, in case we did match, use either
 832      first match or Dempster-Shaffer theory depending on the flags.  */
 833
 834   if (predictor_info [best_predictor].flags & PRED_FLAG_FIRST_MATCH)
 835     first_match = true;
 836
 837   if (!found)
 838     dump_prediction (dump_file, PRED_NO_PREDICTION,
 839                      combined_probability, bb, true);
 840   else
 841     {
 842       dump_prediction (dump_file, PRED_DS_THEORY, combined_probability,
 843                        bb, !first_match);
 844       dump_prediction (dump_file, PRED_FIRST_MATCH, best_probability,
 845                        bb, first_match);
 846     }
 847
 848   if (first_match)
 849     combined_probability = best_probability;
 850   dump_prediction (dump_file, PRED_COMBINED, combined_probability, bb, true);
 851
 852   while (*pnote)
 853     {
 854       if (REG_NOTE_KIND (*pnote) == REG_BR_PRED)
 855         {
 856           enum br_predictor predictor = ((enum br_predictor)
 857                                          INTVAL (XEXP (XEXP (*pnote, 0), 0)));
 858           int probability = INTVAL (XEXP (XEXP (*pnote, 0), 1));
 859
 860           dump_prediction (dump_file, predictor, probability, bb,
 861                            !first_match || best_predictor == predictor);
 862           *pnote = XEXP (*pnote, 1);
 863         }
 864       else
 865         pnote = &XEXP (*pnote, 1);
 866     }
 867
 868   if (!prob_note)
 869     {
 870       add_int_reg_note (insn, REG_BR_PROB, combined_probability);
 871
 872       /* Save the prediction into CFG in case we are seeing non-degenerated
 873          conditional jump.  */
 874       if (!single_succ_p (bb))
 875         {
 876           BRANCH_EDGE (bb)->probability = combined_probability;
 877           FALLTHRU_EDGE (bb)->probability
 878             = REG_BR_PROB_BASE - combined_probability;
 879         }
 880     }
 881   else if (!single_succ_p (bb))
 882     {
 883       int prob = XINT (prob_note, 0);
 884
 885       BRANCH_EDGE (bb)->probability = prob;
 886       FALLTHRU_EDGE (bb)->probability = REG_BR_PROB_BASE - prob;
 887     }
 888   else
 889     single_succ_edge (bb)->probability = REG_BR_PROB_BASE;
 890 }
 891
 892 /* Combine predictions into single probability and store them into CFG.
 893    Remove now useless prediction entries.  */
 894
 895 static void
 896 combine_predictions_for_bb (basic_block bb)
 897 {
 898   int best_probability = PROB_EVEN;
 899   enum br_predictor best_predictor = END_PREDICTORS;
 900   int combined_probability = REG_BR_PROB_BASE / 2;
 901   int d;
 902   bool first_match = false;
 903   bool found = false;
 904   struct edge_prediction *pred;
 905   int nedges = 0;
 906   edge e, first = NULL, second = NULL;
 907   edge_iterator ei;
 908   void **preds;
 909
 910   FOR_EACH_EDGE (e, ei, bb->succs)
 911     if (!(e->flags & (EDGE_EH | EDGE_FAKE)))
 912       {
 913         nedges ++;
 914         if (first && !second)
 915           second = e;
 916         if (!first)
 917           first = e;
 918       }
 919
 920   /* When there is no successor or only one choice, prediction is easy.
 921
 922      We are lazy for now and predict only basic blocks with two outgoing
 923      edges.  It is possible to predict generic case too, but we have to
 924      ignore first match heuristics and do more involved combining.  Implement
 925      this later.  */
 926   if (nedges != 2)
 927     {
 928       if (!bb->count)
 929         set_even_probabilities (bb);
 930       clear_bb_predictions (bb);
 931       if (dump_file)
 932         fprintf (dump_file, "%i edges in bb %i predicted to even probabilities\n",
 933                  nedges, bb->index);
 934       return;
 935     }
 936
 937   if (dump_file)
 938     fprintf (dump_file, "Predictions for bb %i\n", bb->index);
 939
 940   preds = pointer_map_contains (bb_predictions, bb);
 941   if (preds)
 942     {
 943       /* We implement "first match" heuristics and use probability guessed
 944          by predictor with smallest index.  */
 945       for (pred = (struct edge_prediction *) *preds; pred; pred = pred->ep_next)
 946         {
 947           enum br_predictor predictor = pred->ep_predictor;
 948           int probability = pred->ep_probability;
 949
 950           if (pred->ep_edge != first)
 951             probability = REG_BR_PROB_BASE - probability;
 952
 953           found = true;
 954           /* First match heuristics would be widly confused if we predicted
 955              both directions.  */
 956           if (best_predictor > predictor)
 957             {
 958               struct edge_prediction *pred2;
 959               int prob = probability;
 960
 961               for (pred2 = (struct edge_prediction *) *preds;
 962                    pred2; pred2 = pred2->ep_next)
 963                if (pred2 != pred && pred2->ep_predictor == pred->ep_predictor)
 964                  {
 965                    int probability2 = pred->ep_probability;
 966
 967                    if (pred2->ep_edge != first)
 968                      probability2 = REG_BR_PROB_BASE - probability2;
 969
 970                    if ((probability < REG_BR_PROB_BASE / 2) !=
 971                        (probability2 < REG_BR_PROB_BASE / 2))
 972                      break;
 973
 974                    /* If the same predictor later gave better result, go for it! */
 975                    if ((probability >= REG_BR_PROB_BASE / 2 && (probability2 > probability))
 976                        || (probability <= REG_BR_PROB_BASE / 2 && (probability2 < probability)))
 977                      prob = probability2;
 978                  }
 979               if (!pred2)
 980                 best_probability = prob, best_predictor = predictor;
 981             }
 982
 983           d = (combined_probability * probability
 984                + (REG_BR_PROB_BASE - combined_probability)
 985                * (REG_BR_PROB_BASE - probability));
 986
 987           /* Use FP math to avoid overflows of 32bit integers.  */
 988           if (d == 0)
 989             /* If one probability is 0% and one 100%, avoid division by zero.  */
 990             combined_probability = REG_BR_PROB_BASE / 2;
 991           else
 992             combined_probability = (((double) combined_probability)
 993                                     * probability
 994                                     * REG_BR_PROB_BASE / d + 0.5);
 995         }
 996     }
 997
 998   /* Decide which heuristic to use.  In case we didn't match anything,
 999      use no_prediction heuristic, in case we did match, use either
1000      first match or Dempster-Shaffer theory depending on the flags.  */
1001
1002   if (predictor_info [best_predictor].flags & PRED_FLAG_FIRST_MATCH)
1003     first_match = true;
1004
1005   if (!found)
1006     dump_prediction (dump_file, PRED_NO_PREDICTION, combined_probability, bb, true);
1007   else
1008     {
1009       dump_prediction (dump_file, PRED_DS_THEORY, combined_probability, bb,
1010                        !first_match);
1011       dump_prediction (dump_file, PRED_FIRST_MATCH, best_probability, bb,
1012                        first_match);
1013     }
1014
1015   if (first_match)
1016     combined_probability = best_probability;
1017   dump_prediction (dump_file, PRED_COMBINED, combined_probability, bb, true);
1018
1019   if (preds)
1020     {
1021       for (pred = (struct edge_prediction *) *preds; pred; pred = pred->ep_next)
1022         {
1023           enum br_predictor predictor = pred->ep_predictor;
1024           int probability = pred->ep_probability;
1025
1026           if (pred->ep_edge != EDGE_SUCC (bb, 0))
1027             probability = REG_BR_PROB_BASE - probability;
1028           dump_prediction (dump_file, predictor, probability, bb,
1029                            !first_match || best_predictor == predictor);
1030         }
1031     }
1032   clear_bb_predictions (bb);
1033
1034   if (!bb->count)
1035     {
1036       first->probability = combined_probability;
1037       second->probability = REG_BR_PROB_BASE - combined_probability;
1038     }
1039 }
1040
1041 /* Check if T1 and T2 satisfy the IV_COMPARE condition.
1042    Return the SSA_NAME if the condition satisfies, NULL otherwise.
1043
1044    T1 and T2 should be one of the following cases:
1045      1. T1 is SSA_NAME, T2 is NULL
1046      2. T1 is SSA_NAME, T2 is INTEGER_CST between [-4, 4]
1047      3. T2 is SSA_NAME, T1 is INTEGER_CST between [-4, 4]  */
1048
1049 static tree
1050 strips_small_constant (tree t1, tree t2)
1051 {
1052   tree ret = NULL;
1053   int value = 0;
1054
1055   if (!t1)
1056     return NULL;
1057   else if (TREE_CODE (t1) == SSA_NAME)
1058     ret = t1;
1059   else if (tree_fits_shwi_p (t1))
1060     value = tree_to_shwi (t1);
1061   else
1062     return NULL;
1063
1064   if (!t2)
1065     return ret;
1066   else if (tree_fits_shwi_p (t2))
1067     value = tree_to_shwi (t2);
1068   else if (TREE_CODE (t2) == SSA_NAME)
1069     {
1070       if (ret)
1071         return NULL;
1072       else
1073         ret = t2;
1074     }
1075
1076   if (value <= 4 && value >= -4)
1077     return ret;
1078   else
1079     return NULL;
1080 }
1081
1082 /* Return the SSA_NAME in T or T's operands.
1083    Return NULL if SSA_NAME cannot be found.  */
1084
1085 static tree
1086 get_base_value (tree t)
1087 {
1088   if (TREE_CODE (t) == SSA_NAME)
1089     return t;
1090
1091   if (!BINARY_CLASS_P (t))
1092     return NULL;
1093
1094   switch (TREE_OPERAND_LENGTH (t))
1095     {
1096     case 1:
1097       return strips_small_constant (TREE_OPERAND (t, 0), NULL);
1098     case 2:
1099       return strips_small_constant (TREE_OPERAND (t, 0),
1100                                     TREE_OPERAND (t, 1));
1101     default:
1102       return NULL;
1103     }
1104 }
1105
1106 /* Check the compare STMT in LOOP. If it compares an induction
1107    variable to a loop invariant, return true, and save
1108    LOOP_INVARIANT, COMPARE_CODE and LOOP_STEP.
1109    Otherwise return false and set LOOP_INVAIANT to NULL.  */
1110
1111 static bool
1112 is_comparison_with_loop_invariant_p (gimple stmt, struct loop *loop,
1113                                      tree *loop_invariant,
1114                                      enum tree_code *compare_code,
1115                                      tree *loop_step,
1116                                      tree *loop_iv_base)
1117 {
1118   tree op0, op1, bound, base;
1119   affine_iv iv0, iv1;
1120   enum tree_code code;
1121   tree step;
1122
1123   code = gimple_cond_code (stmt);
1124   *loop_invariant = NULL;
1125
1126   switch (code)
1127     {
1128     case GT_EXPR:
1129     case GE_EXPR:
1130     case NE_EXPR:
1131     case LT_EXPR:
1132     case LE_EXPR:
1133     case EQ_EXPR:
1134       break;
1135
1136     default:
1137       return false;
1138     }
1139
1140   op0 = gimple_cond_lhs (stmt);
1141   op1 = gimple_cond_rhs (stmt);
1142
1143   if ((TREE_CODE (op0) != SSA_NAME && TREE_CODE (op0) != INTEGER_CST)
1144        || (TREE_CODE (op1) != SSA_NAME && TREE_CODE (op1) != INTEGER_CST))
1145     return false;
1146   if (!simple_iv (loop, loop_containing_stmt (stmt), op0, &iv0, true))
1147     return false;
1148   if (!simple_iv (loop, loop_containing_stmt (stmt), op1, &iv1, true))
1149     return false;
1150   if (TREE_CODE (iv0.step) != INTEGER_CST
1151       || TREE_CODE (iv1.step) != INTEGER_CST)
1152     return false;
1153   if ((integer_zerop (iv0.step) && integer_zerop (iv1.step))
1154       || (!integer_zerop (iv0.step) && !integer_zerop (iv1.step)))
1155     return false;
1156
1157   if (integer_zerop (iv0.step))
1158     {
1159       if (code != NE_EXPR && code != EQ_EXPR)
1160         code = invert_tree_comparison (code, false);
1161       bound = iv0.base;
1162       base = iv1.base;
1163       if (tree_fits_shwi_p (iv1.step))
1164         step = iv1.step;
1165       else
1166         return false;
1167     }
1168   else
1169     {
1170       bound = iv1.base;
1171       base = iv0.base;
1172       if (tree_fits_shwi_p (iv0.step))
1173         step = iv0.step;
1174       else
1175         return false;
1176     }
1177
1178   if (TREE_CODE (bound) != INTEGER_CST)
1179     bound = get_base_value (bound);
1180   if (!bound)
1181     return false;
1182   if (TREE_CODE (base) != INTEGER_CST)
1183     base = get_base_value (base);
1184   if (!base)
1185     return false;
1186
1187   *loop_invariant = bound;
1188   *compare_code = code;
1189   *loop_step = step;
1190   *loop_iv_base = base;
1191   return true;
1192 }
1193
1194 /* Compare two SSA_NAMEs: returns TRUE if T1 and T2 are value coherent.  */
1195
1196 static bool
1197 expr_coherent_p (tree t1, tree t2)
1198 {
1199   gimple stmt;
1200   tree ssa_name_1 = NULL;
1201   tree ssa_name_2 = NULL;
1202
1203   gcc_assert (TREE_CODE (t1) == SSA_NAME || TREE_CODE (t1) == INTEGER_CST);
1204   gcc_assert (TREE_CODE (t2) == SSA_NAME || TREE_CODE (t2) == INTEGER_CST);
1205
1206   if (t1 == t2)
1207     return true;
1208
1209   if (TREE_CODE (t1) == INTEGER_CST && TREE_CODE (t2) == INTEGER_CST)
1210     return true;
1211   if (TREE_CODE (t1) == INTEGER_CST || TREE_CODE (t2) == INTEGER_CST)
1212     return false;
1213
1214   /* Check to see if t1 is expressed/defined with t2.  */
1215   stmt = SSA_NAME_DEF_STMT (t1);
1216   gcc_assert (stmt != NULL);
1217   if (is_gimple_assign (stmt))
1218     {
1219       ssa_name_1 = SINGLE_SSA_TREE_OPERAND (stmt, SSA_OP_USE);
1220       if (ssa_name_1 && ssa_name_1 == t2)
1221         return true;
1222     }
1223
1224   /* Check to see if t2 is expressed/defined with t1.  */
1225   stmt = SSA_NAME_DEF_STMT (t2);
1226   gcc_assert (stmt != NULL);
1227   if (is_gimple_assign (stmt))
1228     {
1229       ssa_name_2 = SINGLE_SSA_TREE_OPERAND (stmt, SSA_OP_USE);
1230       if (ssa_name_2 && ssa_name_2 == t1)
1231         return true;
1232     }
1233
1234   /* Compare if t1 and t2's def_stmts are identical.  */
1235   if (ssa_name_2 != NULL && ssa_name_1 == ssa_name_2)
1236     return true;
1237   else
1238     return false;
1239 }
1240
1241 /* Predict branch probability of BB when BB contains a branch that compares
1242    an induction variable in LOOP with LOOP_IV_BASE_VAR to LOOP_BOUND_VAR. The
1243    loop exit is compared using LOOP_BOUND_CODE, with step of LOOP_BOUND_STEP.
1244
1245    E.g.
1246      for (int i = 0; i < bound; i++) {
1247        if (i < bound - 2)
1248          computation_1();
1249        else
1250          computation_2();
1251      }
1252
1253   In this loop, we will predict the branch inside the loop to be taken.  */
1254
1255 static void
1256 predict_iv_comparison (struct loop *loop, basic_block bb,
1257                        tree loop_bound_var,
1258                        tree loop_iv_base_var,
1259                        enum tree_code loop_bound_code,
1260                        int loop_bound_step)
1261 {
1262   gimple stmt;
1263   tree compare_var, compare_base;
1264   enum tree_code compare_code;
1265   tree compare_step_var;
1266   edge then_edge;
1267   edge_iterator ei;
1268
1269   if (predicted_by_p (bb, PRED_LOOP_ITERATIONS_GUESSED)
1270       || predicted_by_p (bb, PRED_LOOP_ITERATIONS)
1271       || predicted_by_p (bb, PRED_LOOP_EXIT))
1272     return;
1273
1274   stmt = last_stmt (bb);
1275   if (!stmt || gimple_code (stmt) != GIMPLE_COND)
1276     return;
1277   if (!is_comparison_with_loop_invariant_p (stmt, loop, &compare_var,
1278                                             &compare_code,
1279                                             &compare_step_var,
1280                                             &compare_base))
1281     return;
1282
1283   /* Find the taken edge.  */
1284   FOR_EACH_EDGE (then_edge, ei, bb->succs)
1285     if (then_edge->flags & EDGE_TRUE_VALUE)
1286       break;
1287
1288   /* When comparing an IV to a loop invariant, NE is more likely to be
1289      taken while EQ is more likely to be not-taken.  */
1290   if (compare_code == NE_EXPR)
1291     {
1292       predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, TAKEN);
1293       return;
1294     }
1295   else if (compare_code == EQ_EXPR)
1296     {
1297       predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, NOT_TAKEN);
1298       return;
1299     }
1300
1301   if (!expr_coherent_p (loop_iv_base_var, compare_base))
1302     return;
1303
1304   /* If loop bound, base and compare bound are all constants, we can
1305      calculate the probability directly.  */
1306   if (tree_fits_shwi_p (loop_bound_var)
1307       && tree_fits_shwi_p (compare_var)
1308       && tree_fits_shwi_p (compare_base))
1309     {
1310       int probability;
1311       bool of, overflow = false;
1312       double_int mod, compare_count, tem, loop_count;
1313
1314       double_int loop_bound = tree_to_double_int (loop_bound_var);
1315       double_int compare_bound = tree_to_double_int (compare_var);
1316       double_int base = tree_to_double_int (compare_base);
1317       double_int compare_step = tree_to_double_int (compare_step_var);
1318
1319       /* (loop_bound - base) / compare_step */
1320       tem = loop_bound.sub_with_overflow (base, &of);
1321       overflow |= of;
1322       loop_count = tem.divmod_with_overflow (compare_step,
1323                                               0, TRUNC_DIV_EXPR,
1324                                               &mod, &of);
1325       overflow |= of;
1326
1327       if ((!compare_step.is_negative ())
1328           ^ (compare_code == LT_EXPR || compare_code == LE_EXPR))
1329         {
1330           /* (loop_bound - compare_bound) / compare_step */
1331           tem = loop_bound.sub_with_overflow (compare_bound, &of);
1332           overflow |= of;
1333           compare_count = tem.divmod_with_overflow (compare_step,
1334                                                      0, TRUNC_DIV_EXPR,
1335                                                      &mod, &of);
1336           overflow |= of;
1337         }
1338       else
1339         {
1340           /* (compare_bound - base) / compare_step */
1341           tem = compare_bound.sub_with_overflow (base, &of);
1342           overflow |= of;
1343           compare_count = tem.divmod_with_overflow (compare_step,
1344                                                      0, TRUNC_DIV_EXPR,
1345                                                      &mod, &of);
1346           overflow |= of;
1347         }
1348       if (compare_code == LE_EXPR || compare_code == GE_EXPR)
1349         ++compare_count;
1350       if (loop_bound_code == LE_EXPR || loop_bound_code == GE_EXPR)
1351         ++loop_count;
1352       if (compare_count.is_negative ())
1353         compare_count = double_int_zero;
1354       if (loop_count.is_negative ())
1355         loop_count = double_int_zero;
1356       if (loop_count.is_zero ())
1357         probability = 0;
1358       else if (compare_count.scmp (loop_count) == 1)
1359         probability = REG_BR_PROB_BASE;
1360       else
1361         {
1362           /* If loop_count is too big, such that REG_BR_PROB_BASE * loop_count
1363              could overflow, shift both loop_count and compare_count right
1364              a bit so that it doesn't overflow.  Note both counts are known not
1365              to be negative at this point.  */
1366           int clz_bits = clz_hwi (loop_count.high);
1367           gcc_assert (REG_BR_PROB_BASE < 32768);
1368           if (clz_bits < 16)
1369             {
1370               loop_count.arshift (16 - clz_bits, HOST_BITS_PER_DOUBLE_INT);
1371               compare_count.arshift (16 - clz_bits, HOST_BITS_PER_DOUBLE_INT);
1372             }
1373           tem = compare_count.mul_with_sign (double_int::from_shwi
1374                                             (REG_BR_PROB_BASE), true, &of);
1375           gcc_assert (!of);
1376           tem = tem.divmod (loop_count, true, TRUNC_DIV_EXPR, &mod);
1377           probability = tem.to_uhwi ();
1378         }
1379
1380       if (!overflow)
1381         predict_edge (then_edge, PRED_LOOP_IV_COMPARE, probability);
1382
1383       return;
1384     }
1385
1386   if (expr_coherent_p (loop_bound_var, compare_var))
1387     {
1388       if ((loop_bound_code == LT_EXPR || loop_bound_code == LE_EXPR)
1389           && (compare_code == LT_EXPR || compare_code == LE_EXPR))
1390         predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, TAKEN);
1391       else if ((loop_bound_code == GT_EXPR || loop_bound_code == GE_EXPR)
1392                && (compare_code == GT_EXPR || compare_code == GE_EXPR))
1393         predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, TAKEN);
1394       else if (loop_bound_code == NE_EXPR)
1395         {
1396           /* If the loop backedge condition is "(i != bound)", we do
1397              the comparison based on the step of IV:
1398              * step < 0 : backedge condition is like (i > bound)
1399              * step > 0 : backedge condition is like (i < bound)  */
1400           gcc_assert (loop_bound_step != 0);
1401           if (loop_bound_step > 0
1402               && (compare_code == LT_EXPR
1403                   || compare_code == LE_EXPR))
1404             predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, TAKEN);
1405           else if (loop_bound_step < 0
1406                    && (compare_code == GT_EXPR
1407                        || compare_code == GE_EXPR))
1408             predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, TAKEN);
1409           else
1410             predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, NOT_TAKEN);
1411         }
1412       else
1413         /* The branch is predicted not-taken if loop_bound_code is
1414            opposite with compare_code.  */
1415         predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, NOT_TAKEN);
1416     }
1417   else if (expr_coherent_p (loop_iv_base_var, compare_var))
1418     {
1419       /* For cases like:
1420            for (i = s; i < h; i++)
1421              if (i > s + 2) ....
1422          The branch should be predicted taken.  */
1423       if (loop_bound_step > 0
1424           && (compare_code == GT_EXPR || compare_code == GE_EXPR))
1425         predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, TAKEN);
1426       else if (loop_bound_step < 0
1427                && (compare_code == LT_EXPR || compare_code == LE_EXPR))
1428         predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, TAKEN);
1429       else
1430         predict_edge_def (then_edge, PRED_LOOP_IV_COMPARE_GUESS, NOT_TAKEN);
1431     }
1432 }
1433
1434 /* Predict for extra loop exits that will lead to EXIT_EDGE. The extra loop
1435    exits are resulted from short-circuit conditions that will generate an
1436    if_tmp. E.g.:
1437
1438    if (foo() || global > 10)
1439      break;
1440
1441    This will be translated into:
1442
1443    BB3:
1444      loop header...
1445    BB4:
1446      if foo() goto BB6 else goto BB5
1447    BB5:
1448      if global > 10 goto BB6 else goto BB7
1449    BB6:
1450      goto BB7
1451    BB7:
1452      iftmp = (PHI 0(BB5), 1(BB6))
1453      if iftmp == 1 goto BB8 else goto BB3
1454    BB8:
1455      outside of the loop...
1456
1457    The edge BB7->BB8 is loop exit because BB8 is outside of the loop.
1458    From the dataflow, we can infer that BB4->BB6 and BB5->BB6 are also loop
1459    exits. This function takes BB7->BB8 as input, and finds out the extra loop
1460    exits to predict them using PRED_LOOP_EXIT.  */
1461
1462 static void
1463 predict_extra_loop_exits (edge exit_edge)
1464 {
1465   unsigned i;
1466   bool check_value_one;
1467   gimple phi_stmt;
1468   tree cmp_rhs, cmp_lhs;
1469   gimple cmp_stmt = last_stmt (exit_edge->src);
1470
1471   if (!cmp_stmt || gimple_code (cmp_stmt) != GIMPLE_COND)
1472     return;
1473   cmp_rhs = gimple_cond_rhs (cmp_stmt);
1474   cmp_lhs = gimple_cond_lhs (cmp_stmt);
1475   if (!TREE_CONSTANT (cmp_rhs)
1476       || !(integer_zerop (cmp_rhs) || integer_onep (cmp_rhs)))
1477     return;
1478   if (TREE_CODE (cmp_lhs) != SSA_NAME)
1479     return;
1480
1481   /* If check_value_one is true, only the phi_args with value '1' will lead
1482      to loop exit. Otherwise, only the phi_args with value '0' will lead to
1483      loop exit.  */
1484   check_value_one = (((integer_onep (cmp_rhs))
1485                     ^ (gimple_cond_code (cmp_stmt) == EQ_EXPR))
1486                     ^ ((exit_edge->flags & EDGE_TRUE_VALUE) != 0));
1487
1488   phi_stmt = SSA_NAME_DEF_STMT (cmp_lhs);
1489   if (!phi_stmt || gimple_code (phi_stmt) != GIMPLE_PHI)
1490     return;
1491
1492   for (i = 0; i < gimple_phi_num_args (phi_stmt); i++)
1493     {
1494       edge e1;
1495       edge_iterator ei;
1496       tree val = gimple_phi_arg_def (phi_stmt, i);
1497       edge e = gimple_phi_arg_edge (phi_stmt, i);
1498
1499       if (!TREE_CONSTANT (val) || !(integer_zerop (val) || integer_onep (val)))
1500         continue;
1501       if ((check_value_one ^ integer_onep (val)) == 1)
1502         continue;
1503       if (EDGE_COUNT (e->src->succs) != 1)
1504         {
1505           predict_paths_leading_to_edge (e, PRED_LOOP_EXIT, NOT_TAKEN);
1506           continue;
1507         }
1508
1509       FOR_EACH_EDGE (e1, ei, e->src->preds)
1510         predict_paths_leading_to_edge (e1, PRED_LOOP_EXIT, NOT_TAKEN);
1511     }
1512 }
1513
1514 /* Predict edge probabilities by exploiting loop structure.  */
1515
1516 static void
1517 predict_loops (void)
1518 {
1519   struct loop *loop;
1520
1521   /* Try to predict out blocks in a loop that are not part of a
1522      natural loop.  */
1523   FOR_EACH_LOOP (loop, 0)
1524     {
1525       basic_block bb, *bbs;
1526       unsigned j, n_exits;
1527       vec<edge> exits;
1528       struct tree_niter_desc niter_desc;
1529       edge ex;
1530       struct nb_iter_bound *nb_iter;
1531       enum tree_code loop_bound_code = ERROR_MARK;
1532       tree loop_bound_step = NULL;
1533       tree loop_bound_var = NULL;
1534       tree loop_iv_base = NULL;
1535       gimple stmt = NULL;
1536
1537       exits = get_loop_exit_edges (loop);
1538       n_exits = exits.length ();
1539       if (!n_exits)
1540         {
1541           exits.release ();
1542           continue;
1543         }
1544
1545       FOR_EACH_VEC_ELT (exits, j, ex)
1546         {
1547           tree niter = NULL;
1548           HOST_WIDE_INT nitercst;
1549           int max = PARAM_VALUE (PARAM_MAX_PREDICTED_ITERATIONS);
1550           int probability;
1551           enum br_predictor predictor;
1552
1553           predict_extra_loop_exits (ex);
1554
1555           if (number_of_iterations_exit (loop, ex, &niter_desc, false, false))
1556             niter = niter_desc.niter;
1557           if (!niter || TREE_CODE (niter_desc.niter) != INTEGER_CST)
1558             niter = loop_niter_by_eval (loop, ex);
1559
1560           if (TREE_CODE (niter) == INTEGER_CST)
1561             {
1562               if (tree_fits_uhwi_p (niter)
1563                   && max
1564                   && compare_tree_int (niter, max - 1) == -1)
1565                 nitercst = tree_to_uhwi (niter) + 1;
1566               else
1567                 nitercst = max;
1568               predictor = PRED_LOOP_ITERATIONS;
1569             }
1570           /* If we have just one exit and we can derive some information about
1571              the number of iterations of the loop from the statements inside
1572              the loop, use it to predict this exit.  */
1573           else if (n_exits == 1)
1574             {
1575               nitercst = estimated_stmt_executions_int (loop);
1576               if (nitercst < 0)
1577                 continue;
1578               if (nitercst > max)
1579                 nitercst = max;
1580
1581               predictor = PRED_LOOP_ITERATIONS_GUESSED;
1582             }
1583           else
1584             continue;
1585
1586           /* If the prediction for number of iterations is zero, do not
1587              predict the exit edges.  */
1588           if (nitercst == 0)
1589             continue;
1590
1591           probability = ((REG_BR_PROB_BASE + nitercst / 2) / nitercst);
1592           predict_edge (ex, predictor, probability);
1593         }
1594       exits.release ();
1595
1596       /* Find information about loop bound variables.  */
1597       for (nb_iter = loop->bounds; nb_iter;
1598            nb_iter = nb_iter->next)
1599         if (nb_iter->stmt
1600             && gimple_code (nb_iter->stmt) == GIMPLE_COND)
1601           {
1602             stmt = nb_iter->stmt;
1603             break;
1604           }
1605       if (!stmt && last_stmt (loop->header)
1606           && gimple_code (last_stmt (loop->header)) == GIMPLE_COND)
1607         stmt = last_stmt (loop->header);
1608       if (stmt)
1609         is_comparison_with_loop_invariant_p (stmt, loop,
1610                                              &loop_bound_var,
1611                                              &loop_bound_code,
1612                                              &loop_bound_step,
1613                                              &loop_iv_base);
1614
1615       bbs = get_loop_body (loop);
1616
1617       for (j = 0; j < loop->num_nodes; j++)
1618         {
1619           int header_found = 0;
1620           edge e;
1621           edge_iterator ei;
1622
1623           bb = bbs[j];
1624
1625           /* Bypass loop heuristics on continue statement.  These
1626              statements construct loops via "non-loop" constructs
1627              in the source language and are better to be handled
1628              separately.  */
1629           if (predicted_by_p (bb, PRED_CONTINUE))
1630             continue;
1631
1632           /* Loop branch heuristics - predict an edge back to a
1633              loop's head as taken.  */
1634           if (bb == loop->latch)
1635             {
1636               e = find_edge (loop->latch, loop->header);
1637               if (e)
1638                 {
1639                   header_found = 1;
1640                   predict_edge_def (e, PRED_LOOP_BRANCH, TAKEN);
1641                 }
1642             }
1643
1644           /* Loop exit heuristics - predict an edge exiting the loop if the
1645              conditional has no loop header successors as not taken.  */
1646           if (!header_found
1647               /* If we already used more reliable loop exit predictors, do not
1648                  bother with PRED_LOOP_EXIT.  */
1649               && !predicted_by_p (bb, PRED_LOOP_ITERATIONS_GUESSED)
1650               && !predicted_by_p (bb, PRED_LOOP_ITERATIONS))
1651             {
1652               /* For loop with many exits we don't want to predict all exits
1653                  with the pretty large probability, because if all exits are
1654                  considered in row, the loop would be predicted to iterate
1655                  almost never.  The code to divide probability by number of
1656                  exits is very rough.  It should compute the number of exits
1657                  taken in each patch through function (not the overall number
1658                  of exits that might be a lot higher for loops with wide switch
1659                  statements in them) and compute n-th square root.
1660
1661                  We limit the minimal probability by 2% to avoid
1662                  EDGE_PROBABILITY_RELIABLE from trusting the branch prediction
1663                  as this was causing regression in perl benchmark containing such
1664                  a wide loop.  */
1665
1666               int probability = ((REG_BR_PROB_BASE
1667                                   - predictor_info [(int) PRED_LOOP_EXIT].hitrate)
1668                                  / n_exits);
1669               if (probability < HITRATE (2))
1670                 probability = HITRATE (2);
1671               FOR_EACH_EDGE (e, ei, bb->succs)
1672                 if (e->dest->index < NUM_FIXED_BLOCKS
1673                     || !flow_bb_inside_loop_p (loop, e->dest))
1674                   predict_edge (e, PRED_LOOP_EXIT, probability);
1675             }
1676           if (loop_bound_var)
1677             predict_iv_comparison (loop, bb, loop_bound_var, loop_iv_base,
1678                                    loop_bound_code,
1679                                    tree_to_shwi (loop_bound_step));
1680         }
1681
1682       /* Free basic blocks from get_loop_body.  */
1683       free (bbs);
1684     }
1685 }
1686
1687 /* Attempt to predict probabilities of BB outgoing edges using local
1688    properties.  */
1689 static void
1690 bb_estimate_probability_locally (basic_block bb)
1691 {
1692   rtx last_insn = BB_END (bb);
1693   rtx cond;
1694
1695   if (! can_predict_insn_p (last_insn))
1696     return;
1697   cond = get_condition (last_insn, NULL, false, false);
1698   if (! cond)
1699     return;
1700
1701   /* Try "pointer heuristic."
1702      A comparison ptr == 0 is predicted as false.
1703      Similarly, a comparison ptr1 == ptr2 is predicted as false.  */
1704   if (COMPARISON_P (cond)
1705       && ((REG_P (XEXP (cond, 0)) && REG_POINTER (XEXP (cond, 0)))
1706           || (REG_P (XEXP (cond, 1)) && REG_POINTER (XEXP (cond, 1)))))
1707     {
1708       if (GET_CODE (cond) == EQ)
1709         predict_insn_def (last_insn, PRED_POINTER, NOT_TAKEN);
1710       else if (GET_CODE (cond) == NE)
1711         predict_insn_def (last_insn, PRED_POINTER, TAKEN);
1712     }
1713   else
1714
1715   /* Try "opcode heuristic."
1716      EQ tests are usually false and NE tests are usually true. Also,
1717      most quantities are positive, so we can make the appropriate guesses
1718      about signed comparisons against zero.  */
1719     switch (GET_CODE (cond))
1720       {
1721       case CONST_INT:
1722         /* Unconditional branch.  */
1723         predict_insn_def (last_insn, PRED_UNCONDITIONAL,
1724                           cond == const0_rtx ? NOT_TAKEN : TAKEN);
1725         break;
1726
1727       case EQ:
1728       case UNEQ:
1729         /* Floating point comparisons appears to behave in a very
1730            unpredictable way because of special role of = tests in
1731            FP code.  */
1732         if (FLOAT_MODE_P (GET_MODE (XEXP (cond, 0))))
1733           ;
1734         /* Comparisons with 0 are often used for booleans and there is
1735            nothing useful to predict about them.  */
1736         else if (XEXP (cond, 1) == const0_rtx
1737                  || XEXP (cond, 0) == const0_rtx)
1738           ;
1739         else
1740           predict_insn_def (last_insn, PRED_OPCODE_NONEQUAL, NOT_TAKEN);
1741         break;
1742
1743       case NE:
1744       case LTGT:
1745         /* Floating point comparisons appears to behave in a very
1746            unpredictable way because of special role of = tests in
1747            FP code.  */
1748         if (FLOAT_MODE_P (GET_MODE (XEXP (cond, 0))))
1749           ;
1750         /* Comparisons with 0 are often used for booleans and there is
1751            nothing useful to predict about them.  */
1752         else if (XEXP (cond, 1) == const0_rtx
1753                  || XEXP (cond, 0) == const0_rtx)
1754           ;
1755         else
1756           predict_insn_def (last_insn, PRED_OPCODE_NONEQUAL, TAKEN);
1757         break;
1758
1759       case ORDERED:
1760         predict_insn_def (last_insn, PRED_FPOPCODE, TAKEN);
1761         break;
1762
1763       case UNORDERED:
1764         predict_insn_def (last_insn, PRED_FPOPCODE, NOT_TAKEN);
1765         break;
1766
1767       case LE:
1768       case LT:
1769         if (XEXP (cond, 1) == const0_rtx || XEXP (cond, 1) == const1_rtx
1770             || XEXP (cond, 1) == constm1_rtx)
1771           predict_insn_def (last_insn, PRED_OPCODE_POSITIVE, NOT_TAKEN);
1772         break;
1773
1774       case GE:
1775       case GT:
1776         if (XEXP (cond, 1) == const0_rtx || XEXP (cond, 1) == const1_rtx
1777             || XEXP (cond, 1) == constm1_rtx)
1778           predict_insn_def (last_insn, PRED_OPCODE_POSITIVE, TAKEN);
1779         break;
1780
1781       default:
1782         break;
1783       }
1784 }
1785
1786 /* Set edge->probability for each successor edge of BB.  */
1787 void
1788 guess_outgoing_edge_probabilities (basic_block bb)
1789 {
1790   bb_estimate_probability_locally (bb);
1791   combine_predictions_for_insn (BB_END (bb), bb);
1792 }
1793 \f
1794 static tree expr_expected_value (tree, bitmap, enum br_predictor *predictor);
1795
1796 /* Helper function for expr_expected_value.  */
1797
1798 static tree
1799 expr_expected_value_1 (tree type, tree op0, enum tree_code code,
1800                        tree op1, bitmap visited, enum br_predictor *predictor)
1801 {
1802   gimple def;
1803
1804   if (predictor)
1805     *predictor = PRED_UNCONDITIONAL;
1806
1807   if (get_gimple_rhs_class (code) == GIMPLE_SINGLE_RHS)
1808     {
1809       if (TREE_CONSTANT (op0))
1810         return op0;
1811
1812       if (code != SSA_NAME)
1813         return NULL_TREE;
1814
1815       def = SSA_NAME_DEF_STMT (op0);
1816
1817       /* If we were already here, break the infinite cycle.  */
1818       if (!bitmap_set_bit (visited, SSA_NAME_VERSION (op0)))
1819         return NULL;
1820
1821       if (gimple_code (def) == GIMPLE_PHI)
1822         {
1823           /* All the arguments of the PHI node must have the same constant
1824              length.  */
1825           int i, n = gimple_phi_num_args (def);
1826           tree val = NULL, new_val;
1827
1828           for (i = 0; i < n; i++)
1829             {
1830               tree arg = PHI_ARG_DEF (def, i);
1831               enum br_predictor predictor2;
1832
1833               /* If this PHI has itself as an argument, we cannot
1834                  determine the string length of this argument.  However,
1835                  if we can find an expected constant value for the other
1836                  PHI args then we can still be sure that this is
1837                  likely a constant.  So be optimistic and just
1838                  continue with the next argument.  */
1839               if (arg == PHI_RESULT (def))
1840                 continue;
1841
1842               new_val = expr_expected_value (arg, visited, &predictor2);
1843
1844               /* It is difficult to combine value predictors.  Simply assume
1845                  that later predictor is weaker and take its prediction.  */
1846               if (predictor && *predictor < predictor2)
1847                 *predictor = predictor2;
1848               if (!new_val)
1849                 return NULL;
1850               if (!val)
1851                 val = new_val;
1852               else if (!operand_equal_p (val, new_val, false))
1853                 return NULL;
1854             }
1855           return val;
1856         }
1857       if (is_gimple_assign (def))
1858         {
1859           if (gimple_assign_lhs (def) != op0)
1860             return NULL;
1861
1862           return expr_expected_value_1 (TREE_TYPE (gimple_assign_lhs (def)),
1863                                         gimple_assign_rhs1 (def),
1864                                         gimple_assign_rhs_code (def),
1865                                         gimple_assign_rhs2 (def),
1866                                         visited, predictor);
1867         }
1868
1869       if (is_gimple_call (def))
1870         {
1871           tree decl = gimple_call_fndecl (def);
1872           if (!decl)
1873             {
1874               if (gimple_call_internal_p (def)
1875                   && gimple_call_internal_fn (def) == IFN_BUILTIN_EXPECT)
1876                 {
1877                   gcc_assert (gimple_call_num_args (def) == 3);
1878                   tree val = gimple_call_arg (def, 0);
1879                   if (TREE_CONSTANT (val))
1880                     return val;
1881                   if (predictor)
1882                     {
1883                       *predictor = PRED_BUILTIN_EXPECT;
1884                       tree val2 = gimple_call_arg (def, 2);
1885                       gcc_assert (TREE_CODE (val2) == INTEGER_CST
1886                                   && tree_fits_uhwi_p (val2)
1887                                   && tree_to_uhwi (val2) < END_PREDICTORS);
1888                       *predictor = (enum br_predictor) tree_to_uhwi (val2);
1889                     }
1890                   return gimple_call_arg (def, 1);
1891                 }
1892               return NULL;
1893             }
1894           if (DECL_BUILT_IN_CLASS (decl) == BUILT_IN_NORMAL)
1895             switch (DECL_FUNCTION_CODE (decl))
1896               {
1897               case BUILT_IN_EXPECT:
1898                 {
1899                   tree val;
1900                   if (gimple_call_num_args (def) != 2)
1901                     return NULL;
1902                   val = gimple_call_arg (def, 0);
1903                   if (TREE_CONSTANT (val))
1904                     return val;
1905                   if (predictor)
1906                     *predictor = PRED_BUILTIN_EXPECT;
1907                   return gimple_call_arg (def, 1);
1908                 }
1909
1910               case BUILT_IN_SYNC_BOOL_COMPARE_AND_SWAP_N:
1911               case BUILT_IN_SYNC_BOOL_COMPARE_AND_SWAP_1:
1912               case BUILT_IN_SYNC_BOOL_COMPARE_AND_SWAP_2:
1913               case BUILT_IN_SYNC_BOOL_COMPARE_AND_SWAP_4:
1914               case BUILT_IN_SYNC_BOOL_COMPARE_AND_SWAP_8:
1915               case BUILT_IN_SYNC_BOOL_COMPARE_AND_SWAP_16:
1916               case BUILT_IN_ATOMIC_COMPARE_EXCHANGE:
1917               case BUILT_IN_ATOMIC_COMPARE_EXCHANGE_N:
1918               case BUILT_IN_ATOMIC_COMPARE_EXCHANGE_1:
1919               case BUILT_IN_ATOMIC_COMPARE_EXCHANGE_2:
1920               case BUILT_IN_ATOMIC_COMPARE_EXCHANGE_4:
1921               case BUILT_IN_ATOMIC_COMPARE_EXCHANGE_8:
1922               case BUILT_IN_ATOMIC_COMPARE_EXCHANGE_16:
1923                 /* Assume that any given atomic operation has low contention,
1924                    and thus the compare-and-swap operation succeeds.  */
1925                 if (predictor)
1926                   *predictor = PRED_COMPARE_AND_SWAP;
1927                 return boolean_true_node;
1928             }
1929         }
1930
1931       return NULL;
1932     }
1933
1934   if (get_gimple_rhs_class (code) == GIMPLE_BINARY_RHS)
1935     {
1936       tree res;
1937       enum br_predictor predictor2;
1938       op0 = expr_expected_value (op0, visited, predictor);
1939       if (!op0)
1940         return NULL;
1941       op1 = expr_expected_value (op1, visited, &predictor2);
1942       if (predictor && *predictor < predictor2)
1943         *predictor = predictor2;
1944       if (!op1)
1945         return NULL;
1946       res = fold_build2 (code, type, op0, op1);
1947       if (TREE_CONSTANT (res))
1948         return res;
1949       return NULL;
1950     }
1951   if (get_gimple_rhs_class (code) == GIMPLE_UNARY_RHS)
1952     {
1953       tree res;
1954       op0 = expr_expected_value (op0, visited, predictor);
1955       if (!op0)
1956         return NULL;
1957       res = fold_build1 (code, type, op0);
1958       if (TREE_CONSTANT (res))
1959         return res;
1960       return NULL;
1961     }
1962   return NULL;
1963 }
1964
1965 /* Return constant EXPR will likely have at execution time, NULL if unknown.
1966    The function is used by builtin_expect branch predictor so the evidence
1967    must come from this construct and additional possible constant folding.
1968
1969    We may want to implement more involved value guess (such as value range
1970    propagation based prediction), but such tricks shall go to new
1971    implementation.  */
1972
1973 static tree
1974 expr_expected_value (tree expr, bitmap visited,
1975                      enum br_predictor *predictor)
1976 {
1977   enum tree_code code;
1978   tree op0, op1;
1979
1980   if (TREE_CONSTANT (expr))
1981     {
1982       if (predictor)
1983         *predictor = PRED_UNCONDITIONAL;
1984       return expr;
1985     }
1986
1987   extract_ops_from_tree (expr, &code, &op0, &op1);
1988   return expr_expected_value_1 (TREE_TYPE (expr),
1989                                 op0, code, op1, visited, predictor);
1990 }
1991
1992 \f
1993 /* Get rid of all builtin_expect calls and GIMPLE_PREDICT statements
1994    we no longer need.  */
1995 static unsigned int
1996 strip_predict_hints (void)
1997 {
1998   basic_block bb;
1999   gimple ass_stmt;
2000   tree var;
2001
2002   FOR_EACH_BB_FN (bb, cfun)
2003     {
2004       gimple_stmt_iterator bi;
2005       for (bi = gsi_start_bb (bb); !gsi_end_p (bi);)
2006         {
2007           gimple stmt = gsi_stmt (bi);
2008
2009           if (gimple_code (stmt) == GIMPLE_PREDICT)
2010             {
2011               gsi_remove (&bi, true);
2012               continue;
2013             }
2014           else if (is_gimple_call (stmt))
2015             {
2016               tree fndecl = gimple_call_fndecl (stmt);
2017
2018               if ((fndecl
2019                    && DECL_BUILT_IN_CLASS (fndecl) == BUILT_IN_NORMAL
2020                    && DECL_FUNCTION_CODE (fndecl) == BUILT_IN_EXPECT
2021                    && gimple_call_num_args (stmt) == 2)
2022                   || (gimple_call_internal_p (stmt)
2023                       && gimple_call_internal_fn (stmt) == IFN_BUILTIN_EXPECT))
2024                 {
2025                   var = gimple_call_lhs (stmt);
2026                   if (var)
2027                     {
2028                       ass_stmt
2029                         = gimple_build_assign (var, gimple_call_arg (stmt, 0));
2030                       gsi_replace (&bi, ass_stmt, true);
2031                     }
2032                   else
2033                     {
2034                       gsi_remove (&bi, true);
2035                       continue;
2036                     }
2037                 }
2038             }
2039           gsi_next (&bi);
2040         }
2041     }
2042   return 0;
2043 }
2044 \f
2045 /* Predict using opcode of the last statement in basic block.  */
2046 static void
2047 tree_predict_by_opcode (basic_block bb)
2048 {
2049   gimple stmt = last_stmt (bb);
2050   edge then_edge;
2051   tree op0, op1;
2052   tree type;
2053   tree val;
2054   enum tree_code cmp;
2055   bitmap visited;
2056   edge_iterator ei;
2057   enum br_predictor predictor;
2058
2059   if (!stmt || gimple_code (stmt) != GIMPLE_COND)
2060     return;
2061   FOR_EACH_EDGE (then_edge, ei, bb->succs)
2062     if (then_edge->flags & EDGE_TRUE_VALUE)
2063       break;
2064   op0 = gimple_cond_lhs (stmt);
2065   op1 = gimple_cond_rhs (stmt);
2066   cmp = gimple_cond_code (stmt);
2067   type = TREE_TYPE (op0);
2068   visited = BITMAP_ALLOC (NULL);
2069   val = expr_expected_value_1 (boolean_type_node, op0, cmp, op1, visited,
2070                                &predictor);
2071   BITMAP_FREE (visited);
2072   if (val && TREE_CODE (val) == INTEGER_CST)
2073     {
2074       if (predictor == PRED_BUILTIN_EXPECT)
2075         {
2076           int percent = PARAM_VALUE (BUILTIN_EXPECT_PROBABILITY);
2077
2078           gcc_assert (percent >= 0 && percent <= 100);
2079           if (integer_zerop (val))
2080             percent = 100 - percent;
2081           predict_edge (then_edge, PRED_BUILTIN_EXPECT, HITRATE (percent));
2082         }
2083       else
2084         predict_edge (then_edge, predictor,
2085                       integer_zerop (val) ? NOT_TAKEN : TAKEN);
2086     }
2087   /* Try "pointer heuristic."
2088      A comparison ptr == 0 is predicted as false.
2089      Similarly, a comparison ptr1 == ptr2 is predicted as false.  */
2090   if (POINTER_TYPE_P (type))
2091     {
2092       if (cmp == EQ_EXPR)
2093         predict_edge_def (then_edge, PRED_TREE_POINTER, NOT_TAKEN);
2094       else if (cmp == NE_EXPR)
2095         predict_edge_def (then_edge, PRED_TREE_POINTER, TAKEN);
2096     }
2097   else
2098
2099   /* Try "opcode heuristic."
2100      EQ tests are usually false and NE tests are usually true. Also,
2101      most quantities are positive, so we can make the appropriate guesses
2102      about signed comparisons against zero.  */
2103     switch (cmp)
2104       {
2105       case EQ_EXPR:
2106       case UNEQ_EXPR:
2107         /* Floating point comparisons appears to behave in a very
2108            unpredictable way because of special role of = tests in
2109            FP code.  */
2110         if (FLOAT_TYPE_P (type))
2111           ;
2112         /* Comparisons with 0 are often used for booleans and there is
2113            nothing useful to predict about them.  */
2114         else if (integer_zerop (op0) || integer_zerop (op1))
2115           ;
2116         else
2117           predict_edge_def (then_edge, PRED_TREE_OPCODE_NONEQUAL, NOT_TAKEN);
2118         break;
2119
2120       case NE_EXPR:
2121       case LTGT_EXPR:
2122         /* Floating point comparisons appears to behave in a very
2123            unpredictable way because of special role of = tests in
2124            FP code.  */
2125         if (FLOAT_TYPE_P (type))
2126           ;
2127         /* Comparisons with 0 are often used for booleans and there is
2128            nothing useful to predict about them.  */
2129         else if (integer_zerop (op0)
2130                  || integer_zerop (op1))
2131           ;
2132         else
2133           predict_edge_def (then_edge, PRED_TREE_OPCODE_NONEQUAL, TAKEN);
2134         break;
2135
2136       case ORDERED_EXPR:
2137         predict_edge_def (then_edge, PRED_TREE_FPOPCODE, TAKEN);
2138         break;
2139
2140       case UNORDERED_EXPR:
2141         predict_edge_def (then_edge, PRED_TREE_FPOPCODE, NOT_TAKEN);
2142         break;
2143
2144       case LE_EXPR:
2145       case LT_EXPR:
2146         if (integer_zerop (op1)
2147             || integer_onep (op1)
2148             || integer_all_onesp (op1)
2149             || real_zerop (op1)
2150             || real_onep (op1)
2151             || real_minus_onep (op1))
2152           predict_edge_def (then_edge, PRED_TREE_OPCODE_POSITIVE, NOT_TAKEN);
2153         break;
2154
2155       case GE_EXPR:
2156       case GT_EXPR:
2157         if (integer_zerop (op1)
2158             || integer_onep (op1)
2159             || integer_all_onesp (op1)
2160             || real_zerop (op1)
2161             || real_onep (op1)
2162             || real_minus_onep (op1))
2163           predict_edge_def (then_edge, PRED_TREE_OPCODE_POSITIVE, TAKEN);
2164         break;
2165
2166       default:
2167         break;
2168       }
2169 }
2170
2171 /* Try to guess whether the value of return means error code.  */
2172
2173 static enum br_predictor
2174 return_prediction (tree val, enum prediction *prediction)
2175 {
2176   /* VOID.  */
2177   if (!val)
2178     return PRED_NO_PREDICTION;
2179   /* Different heuristics for pointers and scalars.  */
2180   if (POINTER_TYPE_P (TREE_TYPE (val)))
2181     {
2182       /* NULL is usually not returned.  */
2183       if (integer_zerop (val))
2184         {
2185           *prediction = NOT_TAKEN;
2186           return PRED_NULL_RETURN;
2187         }
2188     }
2189   else if (INTEGRAL_TYPE_P (TREE_TYPE (val)))
2190     {
2191       /* Negative return values are often used to indicate
2192          errors.  */
2193       if (TREE_CODE (val) == INTEGER_CST
2194           && tree_int_cst_sgn (val) < 0)
2195         {
2196           *prediction = NOT_TAKEN;
2197           return PRED_NEGATIVE_RETURN;
2198         }
2199       /* Constant return values seems to be commonly taken.
2200          Zero/one often represent booleans so exclude them from the
2201          heuristics.  */
2202       if (TREE_CONSTANT (val)
2203           && (!integer_zerop (val) && !integer_onep (val)))
2204         {
2205           *prediction = TAKEN;
2206           return PRED_CONST_RETURN;
2207         }
2208     }
2209   return PRED_NO_PREDICTION;
2210 }
2211
2212 /* Find the basic block with return expression and look up for possible
2213    return value trying to apply RETURN_PREDICTION heuristics.  */
2214 static void
2215 apply_return_prediction (void)
2216 {
2217   gimple return_stmt = NULL;
2218   tree return_val;
2219   edge e;
2220   gimple phi;
2221   int phi_num_args, i;
2222   enum br_predictor pred;
2223   enum prediction direction;
2224   edge_iterator ei;
2225
2226   FOR_EACH_EDGE (e, ei, EXIT_BLOCK_PTR_FOR_FN (cfun)->preds)
2227     {
2228       return_stmt = last_stmt (e->src);
2229       if (return_stmt
2230           && gimple_code (return_stmt) == GIMPLE_RETURN)
2231         break;
2232     }
2233   if (!e)
2234     return;
2235   return_val = gimple_return_retval (return_stmt);
2236   if (!return_val)
2237     return;
2238   if (TREE_CODE (return_val) != SSA_NAME
2239       || !SSA_NAME_DEF_STMT (return_val)
2240       || gimple_code (SSA_NAME_DEF_STMT (return_val)) != GIMPLE_PHI)
2241     return;
2242   phi = SSA_NAME_DEF_STMT (return_val);
2243   phi_num_args = gimple_phi_num_args (phi);
2244   pred = return_prediction (PHI_ARG_DEF (phi, 0), &direction);
2245
2246   /* Avoid the degenerate case where all return values form the function
2247      belongs to same category (ie they are all positive constants)
2248      so we can hardly say something about them.  */
2249   for (i = 1; i < phi_num_args; i++)
2250     if (pred != return_prediction (PHI_ARG_DEF (phi, i), &direction))
2251       break;
2252   if (i != phi_num_args)
2253     for (i = 0; i < phi_num_args; i++)
2254       {
2255         pred = return_prediction (PHI_ARG_DEF (phi, i), &direction);
2256         if (pred != PRED_NO_PREDICTION)
2257           predict_paths_leading_to_edge (gimple_phi_arg_edge (phi, i), pred,
2258                                          direction);
2259       }
2260 }
2261
2262 /* Look for basic block that contains unlikely to happen events
2263    (such as noreturn calls) and mark all paths leading to execution
2264    of this basic blocks as unlikely.  */
2265
2266 static void
2267 tree_bb_level_predictions (void)
2268 {
2269   basic_block bb;
2270   bool has_return_edges = false;
2271   edge e;
2272   edge_iterator ei;
2273
2274   FOR_EACH_EDGE (e, ei, EXIT_BLOCK_PTR_FOR_FN (cfun)->preds)
2275     if (!(e->flags & (EDGE_ABNORMAL | EDGE_FAKE | EDGE_EH)))
2276       {
2277         has_return_edges = true;
2278         break;
2279       }
2280
2281   apply_return_prediction ();
2282
2283   FOR_EACH_BB_FN (bb, cfun)
2284     {
2285       gimple_stmt_iterator gsi;
2286
2287       for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
2288         {
2289           gimple stmt = gsi_stmt (gsi);
2290           tree decl;
2291
2292           if (is_gimple_call (stmt))
2293             {
2294               if ((gimple_call_flags (stmt) & ECF_NORETURN)
2295                   && has_return_edges)
2296                 predict_paths_leading_to (bb, PRED_NORETURN,
2297                                           NOT_TAKEN);
2298               decl = gimple_call_fndecl (stmt);
2299               if (decl
2300                   && lookup_attribute ("cold",
2301                                        DECL_ATTRIBUTES (decl)))
2302                 predict_paths_leading_to (bb, PRED_COLD_FUNCTION,
2303                                           NOT_TAKEN);
2304             }
2305           else if (gimple_code (stmt) == GIMPLE_PREDICT)
2306             {
2307               predict_paths_leading_to (bb, gimple_predict_predictor (stmt),
2308                                         gimple_predict_outcome (stmt));
2309               /* Keep GIMPLE_PREDICT around so early inlining will propagate
2310                  hints to callers.  */
2311             }
2312         }
2313     }
2314 }
2315
2316 #ifdef ENABLE_CHECKING
2317
2318 /* Callback for pointer_map_traverse, asserts that the pointer map is
2319    empty.  */
2320
2321 static bool
2322 assert_is_empty (const void *key ATTRIBUTE_UNUSED, void **value,
2323                  void *data ATTRIBUTE_UNUSED)
2324 {
2325   gcc_assert (!*value);
2326   return false;
2327 }
2328 #endif
2329
2330 /* Predict branch probabilities and estimate profile for basic block BB.  */
2331
2332 static void
2333 tree_estimate_probability_bb (basic_block bb)
2334 {
2335   edge e;
2336   edge_iterator ei;
2337   gimple last;
2338
2339   FOR_EACH_EDGE (e, ei, bb->succs)
2340     {
2341       /* Predict edges to user labels with attributes.  */
2342       if (e->dest != EXIT_BLOCK_PTR_FOR_FN (cfun))
2343         {
2344           gimple_stmt_iterator gi;
2345           for (gi = gsi_start_bb (e->dest); !gsi_end_p (gi); gsi_next (&gi))
2346             {
2347               gimple stmt = gsi_stmt (gi);
2348               tree decl;
2349
2350               if (gimple_code (stmt) != GIMPLE_LABEL)
2351                 break;
2352               decl = gimple_label_label (stmt);
2353               if (DECL_ARTIFICIAL (decl))
2354                 continue;
2355
2356               /* Finally, we have a user-defined label.  */
2357               if (lookup_attribute ("cold", DECL_ATTRIBUTES (decl)))
2358                 predict_edge_def (e, PRED_COLD_LABEL, NOT_TAKEN);
2359               else if (lookup_attribute ("hot", DECL_ATTRIBUTES (decl)))
2360                 predict_edge_def (e, PRED_HOT_LABEL, TAKEN);
2361             }
2362         }
2363
2364       /* Predict early returns to be probable, as we've already taken
2365          care for error returns and other cases are often used for
2366          fast paths through function.
2367
2368          Since we've already removed the return statements, we are
2369          looking for CFG like:
2370
2371          if (conditional)
2372          {
2373          ..
2374          goto return_block
2375          }
2376          some other blocks
2377          return_block:
2378          return_stmt.  */
2379       if (e->dest != bb->next_bb
2380           && e->dest != EXIT_BLOCK_PTR_FOR_FN (cfun)
2381           && single_succ_p (e->dest)
2382           && single_succ_edge (e->dest)->dest == EXIT_BLOCK_PTR_FOR_FN (cfun)
2383           && (last = last_stmt (e->dest)) != NULL
2384           && gimple_code (last) == GIMPLE_RETURN)
2385         {
2386           edge e1;
2387           edge_iterator ei1;
2388
2389           if (single_succ_p (bb))
2390             {
2391               FOR_EACH_EDGE (e1, ei1, bb->preds)
2392                 if (!predicted_by_p (e1->src, PRED_NULL_RETURN)
2393                     && !predicted_by_p (e1->src, PRED_CONST_RETURN)
2394                     && !predicted_by_p (e1->src, PRED_NEGATIVE_RETURN))
2395                   predict_edge_def (e1, PRED_TREE_EARLY_RETURN, NOT_TAKEN);
2396             }
2397           else
2398             if (!predicted_by_p (e->src, PRED_NULL_RETURN)
2399                 && !predicted_by_p (e->src, PRED_CONST_RETURN)
2400                 && !predicted_by_p (e->src, PRED_NEGATIVE_RETURN))
2401               predict_edge_def (e, PRED_TREE_EARLY_RETURN, NOT_TAKEN);
2402         }
2403
2404       /* Look for block we are guarding (ie we dominate it,
2405          but it doesn't postdominate us).  */
2406       if (e->dest != EXIT_BLOCK_PTR_FOR_FN (cfun) && e->dest != bb
2407           && dominated_by_p (CDI_DOMINATORS, e->dest, e->src)
2408           && !dominated_by_p (CDI_POST_DOMINATORS, e->src, e->dest))
2409         {
2410           gimple_stmt_iterator bi;
2411
2412           /* The call heuristic claims that a guarded function call
2413              is improbable.  This is because such calls are often used
2414              to signal exceptional situations such as printing error
2415              messages.  */
2416           for (bi = gsi_start_bb (e->dest); !gsi_end_p (bi);
2417                gsi_next (&bi))
2418             {
2419               gimple stmt = gsi_stmt (bi);
2420               if (is_gimple_call (stmt)
2421                   /* Constant and pure calls are hardly used to signalize
2422                      something exceptional.  */
2423                   && gimple_has_side_effects (stmt))
2424                 {
2425                   predict_edge_def (e, PRED_CALL, NOT_TAKEN);
2426                   break;
2427                 }
2428             }
2429         }
2430     }
2431   tree_predict_by_opcode (bb);
2432 }
2433
2434 /* Predict branch probabilities and estimate profile of the tree CFG.
2435    This function can be called from the loop optimizers to recompute
2436    the profile information.  */
2437
2438 void
2439 tree_estimate_probability (void)
2440 {
2441   basic_block bb;
2442
2443   add_noreturn_fake_exit_edges ();
2444   connect_infinite_loops_to_exit ();
2445   /* We use loop_niter_by_eval, which requires that the loops have
2446      preheaders.  */
2447   create_preheaders (CP_SIMPLE_PREHEADERS);
2448   calculate_dominance_info (CDI_POST_DOMINATORS);
2449
2450   bb_predictions = pointer_map_create ();
2451   tree_bb_level_predictions ();
2452   record_loop_exits ();
2453
2454   if (number_of_loops (cfun) > 1)
2455     predict_loops ();
2456
2457   FOR_EACH_BB_FN (bb, cfun)
2458     tree_estimate_probability_bb (bb);
2459
2460   FOR_EACH_BB_FN (bb, cfun)
2461     combine_predictions_for_bb (bb);
2462
2463 #ifdef ENABLE_CHECKING
2464   pointer_map_traverse (bb_predictions, assert_is_empty, NULL);
2465 #endif
2466   pointer_map_destroy (bb_predictions);
2467   bb_predictions = NULL;
2468
2469   estimate_bb_frequencies (false);
2470   free_dominance_info (CDI_POST_DOMINATORS);
2471   remove_fake_exit_edges ();
2472 }
2473
2474 /* Predict branch probabilities and estimate profile of the tree CFG.
2475    This is the driver function for PASS_PROFILE.  */
2476
2477 static unsigned int
2478 tree_estimate_probability_driver (void)
2479 {
2480   unsigned nb_loops;
2481
2482   loop_optimizer_init (LOOPS_NORMAL);
2483   if (dump_file && (dump_flags & TDF_DETAILS))
2484     flow_loops_dump (dump_file, NULL, 0);
2485
2486   mark_irreducible_loops ();
2487
2488   nb_loops = number_of_loops (cfun);
2489   if (nb_loops > 1)
2490     scev_initialize ();
2491
2492   tree_estimate_probability ();
2493
2494   if (nb_loops > 1)
2495     scev_finalize ();
2496
2497   loop_optimizer_finalize ();
2498   if (dump_file && (dump_flags & TDF_DETAILS))
2499     gimple_dump_cfg (dump_file, dump_flags);
2500   if (profile_status_for_fn (cfun) == PROFILE_ABSENT)
2501     profile_status_for_fn (cfun) = PROFILE_GUESSED;
2502   return 0;
2503 }
2504 \f
2505 /* Predict edges to successors of CUR whose sources are not postdominated by
2506    BB by PRED and recurse to all postdominators.  */
2507
2508 static void
2509 predict_paths_for_bb (basic_block cur, basic_block bb,
2510                       enum br_predictor pred,
2511                       enum prediction taken,
2512                       bitmap visited)
2513 {
2514   edge e;
2515   edge_iterator ei;
2516   basic_block son;
2517
2518   /* We are looking for all edges forming edge cut induced by
2519      set of all blocks postdominated by BB.  */
2520   FOR_EACH_EDGE (e, ei, cur->preds)
2521     if (e->src->index >= NUM_FIXED_BLOCKS
2522         && !dominated_by_p (CDI_POST_DOMINATORS, e->src, bb))
2523     {
2524       edge e2;
2525       edge_iterator ei2;
2526       bool found = false;
2527
2528       /* Ignore fake edges and eh, we predict them as not taken anyway.  */
2529       if (e->flags & (EDGE_EH | EDGE_FAKE))
2530         continue;
2531       gcc_assert (bb == cur || dominated_by_p (CDI_POST_DOMINATORS, cur, bb));
2532
2533       /* See if there is an edge from e->src that is not abnormal
2534          and does not lead to BB.  */
2535       FOR_EACH_EDGE (e2, ei2, e->src->succs)
2536         if (e2 != e
2537             && !(e2->flags & (EDGE_EH | EDGE_FAKE))
2538             && !dominated_by_p (CDI_POST_DOMINATORS, e2->dest, bb))
2539           {
2540             found = true;
2541             break;
2542           }
2543
2544       /* If there is non-abnormal path leaving e->src, predict edge
2545          using predictor.  Otherwise we need to look for paths
2546          leading to e->src.
2547
2548          The second may lead to infinite loop in the case we are predicitng
2549          regions that are only reachable by abnormal edges.  We simply
2550          prevent visiting given BB twice.  */
2551       if (found)
2552         predict_edge_def (e, pred, taken);
2553       else if (bitmap_set_bit (visited, e->src->index))
2554         predict_paths_for_bb (e->src, e->src, pred, taken, visited);
2555     }
2556   for (son = first_dom_son (CDI_POST_DOMINATORS, cur);
2557        son;
2558        son = next_dom_son (CDI_POST_DOMINATORS, son))
2559     predict_paths_for_bb (son, bb, pred, taken, visited);
2560 }
2561
2562 /* Sets branch probabilities according to PREDiction and
2563    FLAGS.  */
2564
2565 static void
2566 predict_paths_leading_to (basic_block bb, enum br_predictor pred,
2567                           enum prediction taken)
2568 {
2569   bitmap visited = BITMAP_ALLOC (NULL);
2570   predict_paths_for_bb (bb, bb, pred, taken, visited);
2571   BITMAP_FREE (visited);
2572 }
2573
2574 /* Like predict_paths_leading_to but take edge instead of basic block.  */
2575
2576 static void
2577 predict_paths_leading_to_edge (edge e, enum br_predictor pred,
2578                                enum prediction taken)
2579 {
2580   bool has_nonloop_edge = false;
2581   edge_iterator ei;
2582   edge e2;
2583
2584   basic_block bb = e->src;
2585   FOR_EACH_EDGE (e2, ei, bb->succs)
2586     if (e2->dest != e->src && e2->dest != e->dest
2587         && !(e->flags & (EDGE_EH | EDGE_FAKE))
2588         && !dominated_by_p (CDI_POST_DOMINATORS, e->src, e2->dest))
2589       {
2590         has_nonloop_edge = true;
2591         break;
2592       }
2593   if (!has_nonloop_edge)
2594     {
2595       bitmap visited = BITMAP_ALLOC (NULL);
2596       predict_paths_for_bb (bb, bb, pred, taken, visited);
2597       BITMAP_FREE (visited);
2598     }
2599   else
2600     predict_edge_def (e, pred, taken);
2601 }
2602 \f
2603 /* This is used to carry information about basic blocks.  It is
2604    attached to the AUX field of the standard CFG block.  */
2605
2606 typedef struct block_info_def
2607 {
2608   /* Estimated frequency of execution of basic_block.  */
2609   sreal frequency;
2610
2611   /* To keep queue of basic blocks to process.  */
2612   basic_block next;
2613
2614   /* Number of predecessors we need to visit first.  */
2615   int npredecessors;
2616 } *block_info;
2617
2618 /* Similar information for edges.  */
2619 typedef struct edge_info_def
2620 {
2621   /* In case edge is a loopback edge, the probability edge will be reached
2622      in case header is.  Estimated number of iterations of the loop can be
2623      then computed as 1 / (1 - back_edge_prob).  */
2624   sreal back_edge_prob;
2625   /* True if the edge is a loopback edge in the natural loop.  */
2626   unsigned int back_edge:1;
2627 } *edge_info;
2628
2629 #define BLOCK_INFO(B)   ((block_info) (B)->aux)
2630 #define EDGE_INFO(E)    ((edge_info) (E)->aux)
2631
2632 /* Helper function for estimate_bb_frequencies.
2633    Propagate the frequencies in blocks marked in
2634    TOVISIT, starting in HEAD.  */
2635
2636 static void
2637 propagate_freq (basic_block head, bitmap tovisit)
2638 {
2639   basic_block bb;
2640   basic_block last;
2641   unsigned i;
2642   edge e;
2643   basic_block nextbb;
2644   bitmap_iterator bi;
2645
2646   /* For each basic block we need to visit count number of his predecessors
2647      we need to visit first.  */
2648   EXECUTE_IF_SET_IN_BITMAP (tovisit, 0, i, bi)
2649     {
2650       edge_iterator ei;
2651       int count = 0;
2652
2653       bb = BASIC_BLOCK_FOR_FN (cfun, i);
2654
2655       FOR_EACH_EDGE (e, ei, bb->preds)
2656         {
2657           bool visit = bitmap_bit_p (tovisit, e->src->index);
2658
2659           if (visit && !(e->flags & EDGE_DFS_BACK))
2660             count++;
2661           else if (visit && dump_file && !EDGE_INFO (e)->back_edge)
2662             fprintf (dump_file,
2663                      "Irreducible region hit, ignoring edge to %i->%i\n",
2664                      e->src->index, bb->index);
2665         }
2666       BLOCK_INFO (bb)->npredecessors = count;
2667       /* When function never returns, we will never process exit block.  */
2668       if (!count && bb == EXIT_BLOCK_PTR_FOR_FN (cfun))
2669         bb->count = bb->frequency = 0;
2670     }
2671
2672   memcpy (&BLOCK_INFO (head)->frequency, &real_one, sizeof (real_one));
2673   last = head;
2674   for (bb = head; bb; bb = nextbb)
2675     {
2676       edge_iterator ei;
2677       sreal cyclic_probability, frequency;
2678
2679       memcpy (&cyclic_probability, &real_zero, sizeof (real_zero));
2680       memcpy (&frequency, &real_zero, sizeof (real_zero));
2681
2682       nextbb = BLOCK_INFO (bb)->next;
2683       BLOCK_INFO (bb)->next = NULL;
2684
2685       /* Compute frequency of basic block.  */
2686       if (bb != head)
2687         {
2688 #ifdef ENABLE_CHECKING
2689           FOR_EACH_EDGE (e, ei, bb->preds)
2690             gcc_assert (!bitmap_bit_p (tovisit, e->src->index)
2691                         || (e->flags & EDGE_DFS_BACK));
2692 #endif
2693
2694           FOR_EACH_EDGE (e, ei, bb->preds)
2695             if (EDGE_INFO (e)->back_edge)
2696               {
2697                 sreal_add (&cyclic_probability, &cyclic_probability,
2698                            &EDGE_INFO (e)->back_edge_prob);
2699               }
2700             else if (!(e->flags & EDGE_DFS_BACK))
2701               {
2702                 sreal tmp;
2703
2704                 /*  frequency += (e->probability
2705                                   * BLOCK_INFO (e->src)->frequency /
2706                                   REG_BR_PROB_BASE);  */
2707
2708                 sreal_init (&tmp, e->probability, 0);
2709                 sreal_mul (&tmp, &tmp, &BLOCK_INFO (e->src)->frequency);
2710                 sreal_mul (&tmp, &tmp, &real_inv_br_prob_base);
2711                 sreal_add (&frequency, &frequency, &tmp);
2712               }
2713
2714           if (sreal_compare (&cyclic_probability, &real_zero) == 0)
2715             {
2716               memcpy (&BLOCK_INFO (bb)->frequency, &frequency,
2717                       sizeof (frequency));
2718             }
2719           else
2720             {
2721               if (sreal_compare (&cyclic_probability, &real_almost_one) > 0)
2722                 {
2723                   memcpy (&cyclic_probability, &real_almost_one,
2724                           sizeof (real_almost_one));
2725                 }
2726
2727               /* BLOCK_INFO (bb)->frequency = frequency
2728                                               / (1 - cyclic_probability) */
2729
2730               sreal_sub (&cyclic_probability, &real_one, &cyclic_probability);
2731               sreal_div (&BLOCK_INFO (bb)->frequency,
2732                          &frequency, &cyclic_probability);
2733             }
2734         }
2735
2736       bitmap_clear_bit (tovisit, bb->index);
2737
2738       e = find_edge (bb, head);
2739       if (e)
2740         {
2741           sreal tmp;
2742
2743           /* EDGE_INFO (e)->back_edge_prob
2744              = ((e->probability * BLOCK_INFO (bb)->frequency)
2745              / REG_BR_PROB_BASE); */
2746
2747           sreal_init (&tmp, e->probability, 0);
2748           sreal_mul (&tmp, &tmp, &BLOCK_INFO (bb)->frequency);
2749           sreal_mul (&EDGE_INFO (e)->back_edge_prob,
2750                      &tmp, &real_inv_br_prob_base);
2751         }
2752
2753       /* Propagate to successor blocks.  */
2754       FOR_EACH_EDGE (e, ei, bb->succs)
2755         if (!(e->flags & EDGE_DFS_BACK)
2756             && BLOCK_INFO (e->dest)->npredecessors)
2757           {
2758             BLOCK_INFO (e->dest)->npredecessors--;
2759             if (!BLOCK_INFO (e->dest)->npredecessors)
2760               {
2761                 if (!nextbb)
2762                   nextbb = e->dest;
2763                 else
2764                   BLOCK_INFO (last)->next = e->dest;
2765
2766                 last = e->dest;
2767               }
2768           }
2769     }
2770 }
2771
2772 /* Estimate frequencies in loops at same nest level.  */
2773
2774 static void
2775 estimate_loops_at_level (struct loop *first_loop)
2776 {
2777   struct loop *loop;
2778
2779   for (loop = first_loop; loop; loop = loop->next)
2780     {
2781       edge e;
2782       basic_block *bbs;
2783       unsigned i;
2784       bitmap tovisit = BITMAP_ALLOC (NULL);
2785
2786       estimate_loops_at_level (loop->inner);
2787
2788       /* Find current loop back edge and mark it.  */
2789       e = loop_latch_edge (loop);
2790       EDGE_INFO (e)->back_edge = 1;
2791
2792       bbs = get_loop_body (loop);
2793       for (i = 0; i < loop->num_nodes; i++)
2794         bitmap_set_bit (tovisit, bbs[i]->index);
2795       free (bbs);
2796       propagate_freq (loop->header, tovisit);
2797       BITMAP_FREE (tovisit);
2798     }
2799 }
2800
2801 /* Propagates frequencies through structure of loops.  */
2802
2803 static void
2804 estimate_loops (void)
2805 {
2806   bitmap tovisit = BITMAP_ALLOC (NULL);
2807   basic_block bb;
2808
2809   /* Start by estimating the frequencies in the loops.  */
2810   if (number_of_loops (cfun) > 1)
2811     estimate_loops_at_level (current_loops->tree_root->inner);
2812
2813   /* Now propagate the frequencies through all the blocks.  */
2814   FOR_ALL_BB_FN (bb, cfun)
2815     {
2816       bitmap_set_bit (tovisit, bb->index);
2817     }
2818   propagate_freq (ENTRY_BLOCK_PTR_FOR_FN (cfun), tovisit);
2819   BITMAP_FREE (tovisit);
2820 }
2821
2822 /* Drop the profile for NODE to guessed, and update its frequency based on
2823    whether it is expected to be hot given the CALL_COUNT.  */
2824
2825 static void
2826 drop_profile (struct cgraph_node *node, gcov_type call_count)
2827 {
2828   struct function *fn = DECL_STRUCT_FUNCTION (node->decl);
2829   /* In the case where this was called by another function with a
2830      dropped profile, call_count will be 0. Since there are no
2831      non-zero call counts to this function, we don't know for sure
2832      whether it is hot, and therefore it will be marked normal below.  */
2833   bool hot = maybe_hot_count_p (NULL, call_count);
2834
2835   if (dump_file)
2836     fprintf (dump_file,
2837              "Dropping 0 profile for %s/%i. %s based on calls.\n",
2838              node->name (), node->order,
2839              hot ? "Function is hot" : "Function is normal");
2840   /* We only expect to miss profiles for functions that are reached
2841      via non-zero call edges in cases where the function may have
2842      been linked from another module or library (COMDATs and extern
2843      templates). See the comments below for handle_missing_profiles.
2844      Also, only warn in cases where the missing counts exceed the
2845      number of training runs. In certain cases with an execv followed
2846      by a no-return call the profile for the no-return call is not
2847      dumped and there can be a mismatch.  */
2848   if (!DECL_COMDAT (node->decl) && !DECL_EXTERNAL (node->decl)
2849       && call_count > profile_info->runs)
2850     {
2851       if (flag_profile_correction)
2852         {
2853           if (dump_file)
2854             fprintf (dump_file,
2855                      "Missing counts for called function %s/%i\n",
2856                      node->name (), node->order);
2857         }
2858       else
2859         warning (0, "Missing counts for called function %s/%i",
2860                  node->name (), node->order);
2861     }
2862
2863   profile_status_for_fn (fn)
2864       = (flag_guess_branch_prob ? PROFILE_GUESSED : PROFILE_ABSENT);
2865   node->frequency
2866       = hot ? NODE_FREQUENCY_HOT : NODE_FREQUENCY_NORMAL;
2867 }
2868
2869 /* In the case of COMDAT routines, multiple object files will contain the same
2870    function and the linker will select one for the binary. In that case
2871    all the other copies from the profile instrument binary will be missing
2872    profile counts. Look for cases where this happened, due to non-zero
2873    call counts going to 0-count functions, and drop the profile to guessed
2874    so that we can use the estimated probabilities and avoid optimizing only
2875    for size.
2876
2877    The other case where the profile may be missing is when the routine
2878    is not going to be emitted to the object file, e.g. for "extern template"
2879    class methods. Those will be marked DECL_EXTERNAL. Emit a warning in
2880    all other cases of non-zero calls to 0-count functions.  */
2881
2882 void
2883 handle_missing_profiles (void)
2884 {
2885   struct cgraph_node *node;
2886   int unlikely_count_fraction = PARAM_VALUE (UNLIKELY_BB_COUNT_FRACTION);
2887   vec<struct cgraph_node *> worklist;
2888   worklist.create (64);
2889
2890   /* See if 0 count function has non-0 count callers.  In this case we
2891      lost some profile.  Drop its function profile to PROFILE_GUESSED.  */
2892   FOR_EACH_DEFINED_FUNCTION (node)
2893     {
2894       struct cgraph_edge *e;
2895       gcov_type call_count = 0;
2896       gcov_type max_tp_first_run = 0;
2897       struct function *fn = DECL_STRUCT_FUNCTION (node->decl);
2898
2899       if (node->count)
2900         continue;
2901       for (e = node->callers; e; e = e->next_caller)
2902       {
2903         call_count += e->count;
2904
2905         if (e->caller->tp_first_run > max_tp_first_run)
2906           max_tp_first_run = e->caller->tp_first_run;
2907       }
2908
2909       /* If time profile is missing, let assign the maximum that comes from
2910          caller functions.  */
2911       if (!node->tp_first_run && max_tp_first_run)
2912         node->tp_first_run = max_tp_first_run + 1;
2913
2914       if (call_count
2915           && fn && fn->cfg
2916           && (call_count * unlikely_count_fraction >= profile_info->runs))
2917         {
2918           drop_profile (node, call_count);
2919           worklist.safe_push (node);
2920         }
2921     }
2922
2923   /* Propagate the profile dropping to other 0-count COMDATs that are
2924      potentially called by COMDATs we already dropped the profile on.  */
2925   while (worklist.length () > 0)
2926     {
2927       struct cgraph_edge *e;
2928
2929       node = worklist.pop ();
2930       for (e = node->callees; e; e = e->next_caller)
2931         {
2932           struct cgraph_node *callee = e->callee;
2933           struct function *fn = DECL_STRUCT_FUNCTION (callee->decl);
2934
2935           if (callee->count > 0)
2936             continue;
2937           if (DECL_COMDAT (callee->decl) && fn && fn->cfg
2938               && profile_status_for_fn (fn) == PROFILE_READ)
2939             {
2940               drop_profile (node, 0);
2941               worklist.safe_push (callee);
2942             }
2943         }
2944     }
2945   worklist.release ();
2946 }
2947
2948 /* Convert counts measured by profile driven feedback to frequencies.
2949    Return nonzero iff there was any nonzero execution count.  */
2950
2951 int
2952 counts_to_freqs (void)
2953 {
2954   gcov_type count_max, true_count_max = 0;
2955   basic_block bb;
2956
2957   /* Don't overwrite the estimated frequencies when the profile for
2958      the function is missing.  We may drop this function PROFILE_GUESSED
2959      later in drop_profile ().  */
2960   if (!ENTRY_BLOCK_PTR_FOR_FN (cfun)->count)
2961     return 0;
2962
2963   FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (cfun), NULL, next_bb)
2964     true_count_max = MAX (bb->count, true_count_max);
2965
2966   count_max = MAX (true_count_max, 1);
2967   FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (cfun), NULL, next_bb)
2968     bb->frequency = (bb->count * BB_FREQ_MAX + count_max / 2) / count_max;
2969
2970   return true_count_max;
2971 }
2972
2973 /* Return true if function is likely to be expensive, so there is no point to
2974    optimize performance of prologue, epilogue or do inlining at the expense
2975    of code size growth.  THRESHOLD is the limit of number of instructions
2976    function can execute at average to be still considered not expensive.  */
2977
2978 bool
2979 expensive_function_p (int threshold)
2980 {
2981   unsigned int sum = 0;
2982   basic_block bb;
2983   unsigned int limit;
2984
2985   /* We can not compute accurately for large thresholds due to scaled
2986      frequencies.  */
2987   gcc_assert (threshold <= BB_FREQ_MAX);
2988
2989   /* Frequencies are out of range.  This either means that function contains
2990      internal loop executing more than BB_FREQ_MAX times or profile feedback
2991      is available and function has not been executed at all.  */
2992   if (ENTRY_BLOCK_PTR_FOR_FN (cfun)->frequency == 0)
2993     return true;
2994
2995   /* Maximally BB_FREQ_MAX^2 so overflow won't happen.  */
2996   limit = ENTRY_BLOCK_PTR_FOR_FN (cfun)->frequency * threshold;
2997   FOR_EACH_BB_FN (bb, cfun)
2998     {
2999       rtx insn;
3000
3001       FOR_BB_INSNS (bb, insn)
3002         if (active_insn_p (insn))
3003           {
3004             sum += bb->frequency;
3005             if (sum > limit)
3006               return true;
3007         }
3008     }
3009
3010   return false;
3011 }
3012
3013 /* Estimate and propagate basic block frequencies using the given branch
3014    probabilities.  If FORCE is true, the frequencies are used to estimate
3015    the counts even when there are already non-zero profile counts.  */
3016
3017 void
3018 estimate_bb_frequencies (bool force)
3019 {
3020   basic_block bb;
3021   sreal freq_max;
3022
3023   if (force || profile_status_for_fn (cfun) != PROFILE_READ || !counts_to_freqs ())
3024     {
3025       static int real_values_initialized = 0;
3026
3027       if (!real_values_initialized)
3028         {
3029           real_values_initialized = 1;
3030           sreal_init (&real_zero, 0, 0);
3031           sreal_init (&real_one, 1, 0);
3032           sreal_init (&real_br_prob_base, REG_BR_PROB_BASE, 0);
3033           sreal_init (&real_bb_freq_max, BB_FREQ_MAX, 0);
3034           sreal_init (&real_one_half, 1, -1);
3035           sreal_div (&real_inv_br_prob_base, &real_one, &real_br_prob_base);
3036           sreal_sub (&real_almost_one, &real_one, &real_inv_br_prob_base);
3037         }
3038
3039       mark_dfs_back_edges ();
3040
3041       single_succ_edge (ENTRY_BLOCK_PTR_FOR_FN (cfun))->probability =
3042          REG_BR_PROB_BASE;
3043
3044       /* Set up block info for each basic block.  */
3045       alloc_aux_for_blocks (sizeof (struct block_info_def));
3046       alloc_aux_for_edges (sizeof (struct edge_info_def));
3047       FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (cfun), NULL, next_bb)
3048         {
3049           edge e;
3050           edge_iterator ei;
3051
3052           FOR_EACH_EDGE (e, ei, bb->succs)
3053             {
3054               sreal_init (&EDGE_INFO (e)->back_edge_prob, e->probability, 0);
3055               sreal_mul (&EDGE_INFO (e)->back_edge_prob,
3056                          &EDGE_INFO (e)->back_edge_prob,
3057                          &real_inv_br_prob_base);
3058             }
3059         }
3060
3061       /* First compute frequencies locally for each loop from innermost
3062          to outermost to examine frequencies for back edges.  */
3063       estimate_loops ();
3064
3065       memcpy (&freq_max, &real_zero, sizeof (real_zero));
3066       FOR_EACH_BB_FN (bb, cfun)
3067         if (sreal_compare (&freq_max, &BLOCK_INFO (bb)->frequency) < 0)
3068           memcpy (&freq_max, &BLOCK_INFO (bb)->frequency, sizeof (freq_max));
3069
3070       sreal_div (&freq_max, &real_bb_freq_max, &freq_max);
3071       FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (cfun), NULL, next_bb)
3072         {
3073           sreal tmp;
3074
3075           sreal_mul (&tmp, &BLOCK_INFO (bb)->frequency, &freq_max);
3076           sreal_add (&tmp, &tmp, &real_one_half);
3077           bb->frequency = sreal_to_int (&tmp);
3078         }
3079
3080       free_aux_for_blocks ();
3081       free_aux_for_edges ();
3082     }
3083   compute_function_frequency ();
3084 }
3085
3086 /* Decide whether function is hot, cold or unlikely executed.  */
3087 void
3088 compute_function_frequency (void)
3089 {
3090   basic_block bb;
3091   struct cgraph_node *node = cgraph_get_node (current_function_decl);
3092
3093   if (DECL_STATIC_CONSTRUCTOR (current_function_decl)
3094       || MAIN_NAME_P (DECL_NAME (current_function_decl)))
3095     node->only_called_at_startup = true;
3096   if (DECL_STATIC_DESTRUCTOR (current_function_decl))
3097     node->only_called_at_exit = true;
3098
3099   if (profile_status_for_fn (cfun) != PROFILE_READ)
3100     {
3101       int flags = flags_from_decl_or_type (current_function_decl);
3102       if (lookup_attribute ("cold", DECL_ATTRIBUTES (current_function_decl))
3103           != NULL)
3104         node->frequency = NODE_FREQUENCY_UNLIKELY_EXECUTED;
3105       else if (lookup_attribute ("hot", DECL_ATTRIBUTES (current_function_decl))
3106                != NULL)
3107         node->frequency = NODE_FREQUENCY_HOT;
3108       else if (flags & ECF_NORETURN)
3109         node->frequency = NODE_FREQUENCY_EXECUTED_ONCE;
3110       else if (MAIN_NAME_P (DECL_NAME (current_function_decl)))
3111         node->frequency = NODE_FREQUENCY_EXECUTED_ONCE;
3112       else if (DECL_STATIC_CONSTRUCTOR (current_function_decl)
3113                || DECL_STATIC_DESTRUCTOR (current_function_decl))
3114         node->frequency = NODE_FREQUENCY_EXECUTED_ONCE;
3115       return;
3116     }
3117
3118   /* Only first time try to drop function into unlikely executed.
3119      After inlining the roundoff errors may confuse us.
3120      Ipa-profile pass will drop functions only called from unlikely
3121      functions to unlikely and that is most of what we care about.  */
3122   if (!cfun->after_inlining)
3123     node->frequency = NODE_FREQUENCY_UNLIKELY_EXECUTED;
3124   FOR_EACH_BB_FN (bb, cfun)
3125     {
3126       if (maybe_hot_bb_p (cfun, bb))
3127         {
3128           node->frequency = NODE_FREQUENCY_HOT;
3129           return;
3130         }
3131       if (!probably_never_executed_bb_p (cfun, bb))
3132         node->frequency = NODE_FREQUENCY_NORMAL;
3133     }
3134 }
3135
3136 static bool
3137 gate_estimate_probability (void)
3138 {
3139   return flag_guess_branch_prob;
3140 }
3141
3142 /* Build PREDICT_EXPR.  */
3143 tree
3144 build_predict_expr (enum br_predictor predictor, enum prediction taken)
3145 {
3146   tree t = build1 (PREDICT_EXPR, void_type_node,
3147                    build_int_cst (integer_type_node, predictor));
3148   SET_PREDICT_EXPR_OUTCOME (t, taken);
3149   return t;
3150 }
3151
3152 const char *
3153 predictor_name (enum br_predictor predictor)
3154 {
3155   return predictor_info[predictor].name;
3156 }
3157
3158 namespace {
3159
3160 const pass_data pass_data_profile =
3161 {
3162   GIMPLE_PASS, /* type */
3163   "profile_estimate", /* name */
3164   OPTGROUP_NONE, /* optinfo_flags */
3165   true, /* has_gate */
3166   true, /* has_execute */
3167   TV_BRANCH_PROB, /* tv_id */
3168   PROP_cfg, /* properties_required */
3169   0, /* properties_provided */
3170   0, /* properties_destroyed */
3171   0, /* todo_flags_start */
3172   TODO_verify_ssa, /* todo_flags_finish */
3173 };
3174
3175 class pass_profile : public gimple_opt_pass
3176 {
3177 public:
3178   pass_profile (gcc::context *ctxt)
3179     : gimple_opt_pass (pass_data_profile, ctxt)
3180   {}
3181
3182   /* opt_pass methods: */
3183   bool gate () { return gate_estimate_probability (); }
3184   unsigned int execute () { return tree_estimate_probability_driver (); }
3185
3186 }; // class pass_profile
3187
3188 } // anon namespace
3189
3190 gimple_opt_pass *
3191 make_pass_profile (gcc::context *ctxt)
3192 {
3193   return new pass_profile (ctxt);
3194 }
3195
3196 namespace {
3197
3198 const pass_data pass_data_strip_predict_hints =
3199 {
3200   GIMPLE_PASS, /* type */
3201   "*strip_predict_hints", /* name */
3202   OPTGROUP_NONE, /* optinfo_flags */
3203   false, /* has_gate */
3204   true, /* has_execute */
3205   TV_BRANCH_PROB, /* tv_id */
3206   PROP_cfg, /* properties_required */
3207   0, /* properties_provided */
3208   0, /* properties_destroyed */
3209   0, /* todo_flags_start */
3210   TODO_verify_ssa, /* todo_flags_finish */
3211 };
3212
3213 class pass_strip_predict_hints : public gimple_opt_pass
3214 {
3215 public:
3216   pass_strip_predict_hints (gcc::context *ctxt)
3217     : gimple_opt_pass (pass_data_strip_predict_hints, ctxt)
3218   {}
3219
3220   /* opt_pass methods: */
3221   opt_pass * clone () { return new pass_strip_predict_hints (m_ctxt); }
3222   unsigned int execute () { return strip_predict_hints (); }
3223
3224 }; // class pass_strip_predict_hints
3225
3226 } // anon namespace
3227
3228 gimple_opt_pass *
3229 make_pass_strip_predict_hints (gcc::context *ctxt)
3230 {
3231   return new pass_strip_predict_hints (ctxt);
3232 }
3233
3234 /* Rebuild function frequencies.  Passes are in general expected to
3235    maintain profile by hand, however in some cases this is not possible:
3236    for example when inlining several functions with loops freuqencies might run
3237    out of scale and thus needs to be recomputed.  */
3238
3239 void
3240 rebuild_frequencies (void)
3241 {
3242   timevar_push (TV_REBUILD_FREQUENCIES);
3243
3244   /* When the max bb count in the function is small, there is a higher
3245      chance that there were truncation errors in the integer scaling
3246      of counts by inlining and other optimizations. This could lead
3247      to incorrect classification of code as being cold when it isn't.
3248      In that case, force the estimation of bb counts/frequencies from the
3249      branch probabilities, rather than computing frequencies from counts,
3250      which may also lead to frequencies incorrectly reduced to 0. There
3251      is less precision in the probabilities, so we only do this for small
3252      max counts.  */
3253   gcov_type count_max = 0;
3254   basic_block bb;
3255   FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (cfun), NULL, next_bb)
3256     count_max = MAX (bb->count, count_max);
3257
3258   if (profile_status_for_fn (cfun) == PROFILE_GUESSED
3259       || (profile_status_for_fn (cfun) == PROFILE_READ && count_max < REG_BR_PROB_BASE/10))
3260     {
3261       loop_optimizer_init (0);
3262       add_noreturn_fake_exit_edges ();
3263       mark_irreducible_loops ();
3264       connect_infinite_loops_to_exit ();
3265       estimate_bb_frequencies (true);
3266       remove_fake_exit_edges ();
3267       loop_optimizer_finalize ();
3268     }
3269   else if (profile_status_for_fn (cfun) == PROFILE_READ)
3270     counts_to_freqs ();
3271   else
3272     gcc_unreachable ();
3273   timevar_pop (TV_REBUILD_FREQUENCIES);
3274 }