PR tree-optimization/17468
[official-gcc.git] / gcc / predict.c
blob3da32986238c2b2873320211fde81e2598dd38b6
1 /* Branch prediction routines for the GNU compiler.
2 Copyright (C) 2000, 2001, 2002, 2003, 2004 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify it under
7 the terms of the GNU General Public License as published by the Free
8 Software Foundation; either version 2, or (at your option) any later
9 version.
11 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
13 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
14 for more details.
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING. If not, write to the Free
18 Software Foundation, 59 Temple Place - Suite 330, Boston, MA
19 02111-1307, USA. */
21 /* References:
23 [1] "Branch Prediction for Free"
24 Ball and Larus; PLDI '93.
25 [2] "Static Branch Frequency and Program Profile Analysis"
26 Wu and Larus; MICRO-27.
27 [3] "Corpus-based Static Branch Prediction"
28 Calder, Grunwald, Lindsay, Martin, Mozer, and Zorn; PLDI '95. */
31 #include "config.h"
32 #include "system.h"
33 #include "coretypes.h"
34 #include "tm.h"
35 #include "tree.h"
36 #include "rtl.h"
37 #include "tm_p.h"
38 #include "hard-reg-set.h"
39 #include "basic-block.h"
40 #include "insn-config.h"
41 #include "regs.h"
42 #include "flags.h"
43 #include "output.h"
44 #include "function.h"
45 #include "except.h"
46 #include "toplev.h"
47 #include "recog.h"
48 #include "expr.h"
49 #include "predict.h"
50 #include "coverage.h"
51 #include "sreal.h"
52 #include "params.h"
53 #include "target.h"
54 #include "cfgloop.h"
55 #include "tree-flow.h"
56 #include "ggc.h"
57 #include "tree-dump.h"
58 #include "tree-pass.h"
59 #include "timevar.h"
60 #include "tree-scalar-evolution.h"
61 #include "cfgloop.h"
63 /* real constants: 0, 1, 1-1/REG_BR_PROB_BASE, REG_BR_PROB_BASE,
64 1/REG_BR_PROB_BASE, 0.5, BB_FREQ_MAX. */
65 static sreal real_zero, real_one, real_almost_one, real_br_prob_base,
66 real_inv_br_prob_base, real_one_half, real_bb_freq_max;
68 /* Random guesstimation given names. */
69 #define PROB_VERY_UNLIKELY (REG_BR_PROB_BASE / 10 - 1)
70 #define PROB_EVEN (REG_BR_PROB_BASE / 2)
71 #define PROB_VERY_LIKELY (REG_BR_PROB_BASE - PROB_VERY_UNLIKELY)
72 #define PROB_ALWAYS (REG_BR_PROB_BASE)
74 static void combine_predictions_for_insn (rtx, basic_block);
75 static void dump_prediction (FILE *, enum br_predictor, int, basic_block, int);
76 static void estimate_loops_at_level (struct loop *loop);
77 static void propagate_freq (struct loop *);
78 static void estimate_bb_frequencies (struct loops *);
79 static int counts_to_freqs (void);
80 static bool last_basic_block_p (basic_block);
81 static void compute_function_frequency (void);
82 static void choose_function_section (void);
83 static bool can_predict_insn_p (rtx);
85 /* Information we hold about each branch predictor.
86 Filled using information from predict.def. */
88 struct predictor_info
90 const char *const name; /* Name used in the debugging dumps. */
91 const int hitrate; /* Expected hitrate used by
92 predict_insn_def call. */
93 const int flags;
96 /* Use given predictor without Dempster-Shaffer theory if it matches
97 using first_match heuristics. */
98 #define PRED_FLAG_FIRST_MATCH 1
100 /* Recompute hitrate in percent to our representation. */
102 #define HITRATE(VAL) ((int) ((VAL) * REG_BR_PROB_BASE + 50) / 100)
104 #define DEF_PREDICTOR(ENUM, NAME, HITRATE, FLAGS) {NAME, HITRATE, FLAGS},
105 static const struct predictor_info predictor_info[]= {
106 #include "predict.def"
108 /* Upper bound on predictors. */
109 {NULL, 0, 0}
111 #undef DEF_PREDICTOR
113 /* Return true in case BB can be CPU intensive and should be optimized
114 for maximal performance. */
116 bool
117 maybe_hot_bb_p (basic_block bb)
119 if (profile_info && flag_branch_probabilities
120 && (bb->count
121 < profile_info->sum_max / PARAM_VALUE (HOT_BB_COUNT_FRACTION)))
122 return false;
123 if (bb->frequency < BB_FREQ_MAX / PARAM_VALUE (HOT_BB_FREQUENCY_FRACTION))
124 return false;
125 return true;
128 /* Return true in case BB is cold and should be optimized for size. */
130 bool
131 probably_cold_bb_p (basic_block bb)
133 if (profile_info && flag_branch_probabilities
134 && (bb->count
135 < profile_info->sum_max / PARAM_VALUE (HOT_BB_COUNT_FRACTION)))
136 return true;
137 if (bb->frequency < BB_FREQ_MAX / PARAM_VALUE (HOT_BB_FREQUENCY_FRACTION))
138 return true;
139 return false;
142 /* Return true in case BB is probably never executed. */
143 bool
144 probably_never_executed_bb_p (basic_block bb)
146 if (profile_info && flag_branch_probabilities)
147 return ((bb->count + profile_info->runs / 2) / profile_info->runs) == 0;
148 return false;
151 /* Return true if the one of outgoing edges is already predicted by
152 PREDICTOR. */
154 bool
155 rtl_predicted_by_p (basic_block bb, enum br_predictor predictor)
157 rtx note;
158 if (!INSN_P (BB_END (bb)))
159 return false;
160 for (note = REG_NOTES (BB_END (bb)); note; note = XEXP (note, 1))
161 if (REG_NOTE_KIND (note) == REG_BR_PRED
162 && INTVAL (XEXP (XEXP (note, 0), 0)) == (int)predictor)
163 return true;
164 return false;
167 /* Return true if the one of outgoing edges is already predicted by
168 PREDICTOR. */
170 bool
171 tree_predicted_by_p (basic_block bb, enum br_predictor predictor)
173 struct edge_prediction *i = bb_ann (bb)->predictions;
174 for (i = bb_ann (bb)->predictions; i; i = i->next)
175 if (i->predictor == predictor)
176 return true;
177 return false;
180 void
181 predict_insn (rtx insn, enum br_predictor predictor, int probability)
183 if (!any_condjump_p (insn))
184 abort ();
185 if (!flag_guess_branch_prob)
186 return;
188 REG_NOTES (insn)
189 = gen_rtx_EXPR_LIST (REG_BR_PRED,
190 gen_rtx_CONCAT (VOIDmode,
191 GEN_INT ((int) predictor),
192 GEN_INT ((int) probability)),
193 REG_NOTES (insn));
196 /* Predict insn by given predictor. */
198 void
199 predict_insn_def (rtx insn, enum br_predictor predictor,
200 enum prediction taken)
202 int probability = predictor_info[(int) predictor].hitrate;
204 if (taken != TAKEN)
205 probability = REG_BR_PROB_BASE - probability;
207 predict_insn (insn, predictor, probability);
210 /* Predict edge E with given probability if possible. */
212 void
213 rtl_predict_edge (edge e, enum br_predictor predictor, int probability)
215 rtx last_insn;
216 last_insn = BB_END (e->src);
218 /* We can store the branch prediction information only about
219 conditional jumps. */
220 if (!any_condjump_p (last_insn))
221 return;
223 /* We always store probability of branching. */
224 if (e->flags & EDGE_FALLTHRU)
225 probability = REG_BR_PROB_BASE - probability;
227 predict_insn (last_insn, predictor, probability);
230 /* Predict edge E with the given PROBABILITY. */
231 void
232 tree_predict_edge (edge e, enum br_predictor predictor, int probability)
234 struct edge_prediction *i = ggc_alloc (sizeof (struct edge_prediction));
236 i->next = bb_ann (e->src)->predictions;
237 bb_ann (e->src)->predictions = i;
238 i->probability = probability;
239 i->predictor = predictor;
240 i->edge = e;
243 /* Return true when we can store prediction on insn INSN.
244 At the moment we represent predictions only on conditional
245 jumps, not at computed jump or other complicated cases. */
246 static bool
247 can_predict_insn_p (rtx insn)
249 return (JUMP_P (insn)
250 && any_condjump_p (insn)
251 && BLOCK_FOR_INSN (insn)->succ->succ_next);
254 /* Predict edge E by given predictor if possible. */
256 void
257 predict_edge_def (edge e, enum br_predictor predictor,
258 enum prediction taken)
260 int probability = predictor_info[(int) predictor].hitrate;
262 if (taken != TAKEN)
263 probability = REG_BR_PROB_BASE - probability;
265 predict_edge (e, predictor, probability);
268 /* Invert all branch predictions or probability notes in the INSN. This needs
269 to be done each time we invert the condition used by the jump. */
271 void
272 invert_br_probabilities (rtx insn)
274 rtx note;
276 for (note = REG_NOTES (insn); note; note = XEXP (note, 1))
277 if (REG_NOTE_KIND (note) == REG_BR_PROB)
278 XEXP (note, 0) = GEN_INT (REG_BR_PROB_BASE - INTVAL (XEXP (note, 0)));
279 else if (REG_NOTE_KIND (note) == REG_BR_PRED)
280 XEXP (XEXP (note, 0), 1)
281 = GEN_INT (REG_BR_PROB_BASE - INTVAL (XEXP (XEXP (note, 0), 1)));
284 /* Dump information about the branch prediction to the output file. */
286 static void
287 dump_prediction (FILE *file, enum br_predictor predictor, int probability,
288 basic_block bb, int used)
290 edge e = bb->succ;
292 if (!file)
293 return;
295 while (e && (e->flags & EDGE_FALLTHRU))
296 e = e->succ_next;
298 fprintf (file, " %s heuristics%s: %.1f%%",
299 predictor_info[predictor].name,
300 used ? "" : " (ignored)", probability * 100.0 / REG_BR_PROB_BASE);
302 if (bb->count)
304 fprintf (file, " exec ");
305 fprintf (file, HOST_WIDEST_INT_PRINT_DEC, bb->count);
306 if (e)
308 fprintf (file, " hit ");
309 fprintf (file, HOST_WIDEST_INT_PRINT_DEC, e->count);
310 fprintf (file, " (%.1f%%)", e->count * 100.0 / bb->count);
314 fprintf (file, "\n");
317 /* We can not predict the probabilities of outgoing edges of bb. Set them
318 evenly and hope for the best. */
319 static void
320 set_even_probabilities (basic_block bb)
322 int nedges = 0;
323 edge e;
325 for (e = bb->succ; e; e = e->succ_next)
326 if (!(e->flags & (EDGE_EH | EDGE_FAKE)))
327 nedges ++;
328 for (e = bb->succ; e; e = e->succ_next)
329 if (!(e->flags & (EDGE_EH | EDGE_FAKE)))
330 e->probability = (REG_BR_PROB_BASE + nedges / 2) / nedges;
331 else
332 e->probability = 0;
335 /* Combine all REG_BR_PRED notes into single probability and attach REG_BR_PROB
336 note if not already present. Remove now useless REG_BR_PRED notes. */
338 static void
339 combine_predictions_for_insn (rtx insn, basic_block bb)
341 rtx prob_note;
342 rtx *pnote;
343 rtx note;
344 int best_probability = PROB_EVEN;
345 int best_predictor = END_PREDICTORS;
346 int combined_probability = REG_BR_PROB_BASE / 2;
347 int d;
348 bool first_match = false;
349 bool found = false;
351 if (!can_predict_insn_p (insn))
353 set_even_probabilities (bb);
354 return;
357 prob_note = find_reg_note (insn, REG_BR_PROB, 0);
358 pnote = &REG_NOTES (insn);
359 if (dump_file)
360 fprintf (dump_file, "Predictions for insn %i bb %i\n", INSN_UID (insn),
361 bb->index);
363 /* We implement "first match" heuristics and use probability guessed
364 by predictor with smallest index. */
365 for (note = REG_NOTES (insn); note; note = XEXP (note, 1))
366 if (REG_NOTE_KIND (note) == REG_BR_PRED)
368 int predictor = INTVAL (XEXP (XEXP (note, 0), 0));
369 int probability = INTVAL (XEXP (XEXP (note, 0), 1));
371 found = true;
372 if (best_predictor > predictor)
373 best_probability = probability, best_predictor = predictor;
375 d = (combined_probability * probability
376 + (REG_BR_PROB_BASE - combined_probability)
377 * (REG_BR_PROB_BASE - probability));
379 /* Use FP math to avoid overflows of 32bit integers. */
380 if (d == 0)
381 /* If one probability is 0% and one 100%, avoid division by zero. */
382 combined_probability = REG_BR_PROB_BASE / 2;
383 else
384 combined_probability = (((double) combined_probability) * probability
385 * REG_BR_PROB_BASE / d + 0.5);
388 /* Decide which heuristic to use. In case we didn't match anything,
389 use no_prediction heuristic, in case we did match, use either
390 first match or Dempster-Shaffer theory depending on the flags. */
392 if (predictor_info [best_predictor].flags & PRED_FLAG_FIRST_MATCH)
393 first_match = true;
395 if (!found)
396 dump_prediction (dump_file, PRED_NO_PREDICTION,
397 combined_probability, bb, true);
398 else
400 dump_prediction (dump_file, PRED_DS_THEORY, combined_probability,
401 bb, !first_match);
402 dump_prediction (dump_file, PRED_FIRST_MATCH, best_probability,
403 bb, first_match);
406 if (first_match)
407 combined_probability = best_probability;
408 dump_prediction (dump_file, PRED_COMBINED, combined_probability, bb, true);
410 while (*pnote)
412 if (REG_NOTE_KIND (*pnote) == REG_BR_PRED)
414 int predictor = INTVAL (XEXP (XEXP (*pnote, 0), 0));
415 int probability = INTVAL (XEXP (XEXP (*pnote, 0), 1));
417 dump_prediction (dump_file, predictor, probability, bb,
418 !first_match || best_predictor == predictor);
419 *pnote = XEXP (*pnote, 1);
421 else
422 pnote = &XEXP (*pnote, 1);
425 if (!prob_note)
427 REG_NOTES (insn)
428 = gen_rtx_EXPR_LIST (REG_BR_PROB,
429 GEN_INT (combined_probability), REG_NOTES (insn));
431 /* Save the prediction into CFG in case we are seeing non-degenerated
432 conditional jump. */
433 if (bb->succ->succ_next)
435 BRANCH_EDGE (bb)->probability = combined_probability;
436 FALLTHRU_EDGE (bb)->probability
437 = REG_BR_PROB_BASE - combined_probability;
442 /* Combine predictions into single probability and store them into CFG.
443 Remove now useless prediction entries. */
445 static void
446 combine_predictions_for_bb (FILE *file, basic_block bb)
448 int best_probability = PROB_EVEN;
449 int best_predictor = END_PREDICTORS;
450 int combined_probability = REG_BR_PROB_BASE / 2;
451 int d;
452 bool first_match = false;
453 bool found = false;
454 struct edge_prediction *pred;
455 int nedges = 0;
456 edge e, first = NULL, second = NULL;
458 for (e = bb->succ; e; e = e->succ_next)
459 if (!(e->flags & (EDGE_EH | EDGE_FAKE)))
461 nedges ++;
462 if (first && !second)
463 second = e;
464 if (!first)
465 first = e;
468 /* When there is no successor or only one choice, prediction is easy.
470 We are lazy for now and predict only basic blocks with two outgoing
471 edges. It is possible to predict generic case too, but we have to
472 ignore first match heuristics and do more involved combining. Implement
473 this later. */
474 if (nedges != 2)
476 if (!bb->count)
477 set_even_probabilities (bb);
478 bb_ann (bb)->predictions = NULL;
479 if (file)
480 fprintf (file, "%i edges in bb %i predicted to even probabilities\n",
481 nedges, bb->index);
482 return;
485 if (file)
486 fprintf (file, "Predictions for bb %i\n", bb->index);
488 /* We implement "first match" heuristics and use probability guessed
489 by predictor with smallest index. */
490 for (pred = bb_ann (bb)->predictions; pred; pred = pred->next)
492 int predictor = pred->predictor;
493 int probability = pred->probability;
495 if (pred->edge != first)
496 probability = REG_BR_PROB_BASE - probability;
498 found = true;
499 if (best_predictor > predictor)
500 best_probability = probability, best_predictor = predictor;
502 d = (combined_probability * probability
503 + (REG_BR_PROB_BASE - combined_probability)
504 * (REG_BR_PROB_BASE - probability));
506 /* Use FP math to avoid overflows of 32bit integers. */
507 if (d == 0)
508 /* If one probability is 0% and one 100%, avoid division by zero. */
509 combined_probability = REG_BR_PROB_BASE / 2;
510 else
511 combined_probability = (((double) combined_probability) * probability
512 * REG_BR_PROB_BASE / d + 0.5);
515 /* Decide which heuristic to use. In case we didn't match anything,
516 use no_prediction heuristic, in case we did match, use either
517 first match or Dempster-Shaffer theory depending on the flags. */
519 if (predictor_info [best_predictor].flags & PRED_FLAG_FIRST_MATCH)
520 first_match = true;
522 if (!found)
523 dump_prediction (file, PRED_NO_PREDICTION, combined_probability, bb, true);
524 else
526 dump_prediction (file, PRED_DS_THEORY, combined_probability, bb,
527 !first_match);
528 dump_prediction (file, PRED_FIRST_MATCH, best_probability, bb,
529 first_match);
532 if (first_match)
533 combined_probability = best_probability;
534 dump_prediction (file, PRED_COMBINED, combined_probability, bb, true);
536 for (pred = bb_ann (bb)->predictions; pred; pred = pred->next)
538 int predictor = pred->predictor;
539 int probability = pred->probability;
541 if (pred->edge != bb->succ)
542 probability = REG_BR_PROB_BASE - probability;
543 dump_prediction (file, predictor, probability, bb,
544 !first_match || best_predictor == predictor);
546 bb_ann (bb)->predictions = NULL;
548 if (!bb->count)
550 first->probability = combined_probability;
551 second->probability = REG_BR_PROB_BASE - combined_probability;
555 /* Predict edge probabilities by exploiting loop structure.
556 When RTLSIMPLELOOPS is set, attempt to count number of iterations by analyzing
557 RTL otherwise use tree based approach. */
558 static void
559 predict_loops (struct loops *loops_info, bool rtlsimpleloops)
561 unsigned i;
563 if (!rtlsimpleloops)
564 scev_initialize (loops_info);
566 /* Try to predict out blocks in a loop that are not part of a
567 natural loop. */
568 for (i = 1; i < loops_info->num; i++)
570 basic_block bb, *bbs;
571 unsigned j;
572 int exits;
573 struct loop *loop = loops_info->parray[i];
574 struct niter_desc desc;
575 unsigned HOST_WIDE_INT niter;
577 flow_loop_scan (loop, LOOP_EXIT_EDGES);
578 exits = loop->num_exits;
580 if (rtlsimpleloops)
582 iv_analysis_loop_init (loop);
583 find_simple_exit (loop, &desc);
585 if (desc.simple_p && desc.const_iter)
587 int prob;
588 niter = desc.niter + 1;
589 if (niter == 0) /* We might overflow here. */
590 niter = desc.niter;
592 prob = (REG_BR_PROB_BASE
593 - (REG_BR_PROB_BASE + niter /2) / niter);
594 /* Branch prediction algorithm gives 0 frequency for everything
595 after the end of loop for loop having 0 probability to finish. */
596 if (prob == REG_BR_PROB_BASE)
597 prob = REG_BR_PROB_BASE - 1;
598 predict_edge (desc.in_edge, PRED_LOOP_ITERATIONS,
599 prob);
602 else
604 edge *exits;
605 unsigned j, n_exits;
606 struct tree_niter_desc niter_desc;
608 exits = get_loop_exit_edges (loop, &n_exits);
609 for (j = 0; j < n_exits; j++)
611 tree niter = NULL;
613 if (number_of_iterations_exit (loop, exits[j], &niter_desc))
614 niter = niter_desc.niter;
615 if (!niter || TREE_CODE (niter_desc.niter) != INTEGER_CST)
616 niter = loop_niter_by_eval (loop, exits[j]);
618 if (TREE_CODE (niter) == INTEGER_CST)
620 int probability;
621 if (host_integerp (niter, 1)
622 && tree_int_cst_lt (niter,
623 build_int_cstu (NULL_TREE,
624 REG_BR_PROB_BASE - 1)))
626 HOST_WIDE_INT nitercst = tree_low_cst (niter, 1) + 1;
627 probability = (REG_BR_PROB_BASE + nitercst / 2) / nitercst;
629 else
630 probability = 1;
632 predict_edge (exits[j], PRED_LOOP_ITERATIONS, probability);
636 free (exits);
639 bbs = get_loop_body (loop);
641 for (j = 0; j < loop->num_nodes; j++)
643 int header_found = 0;
644 edge e;
646 bb = bbs[j];
648 /* Bypass loop heuristics on continue statement. These
649 statements construct loops via "non-loop" constructs
650 in the source language and are better to be handled
651 separately. */
652 if ((rtlsimpleloops && !can_predict_insn_p (BB_END (bb)))
653 || predicted_by_p (bb, PRED_CONTINUE))
654 continue;
656 /* Loop branch heuristics - predict an edge back to a
657 loop's head as taken. */
658 for (e = bb->succ; e; e = e->succ_next)
659 if (e->dest == loop->header
660 && e->src == loop->latch)
662 header_found = 1;
663 predict_edge_def (e, PRED_LOOP_BRANCH, TAKEN);
666 /* Loop exit heuristics - predict an edge exiting the loop if the
667 conditional has no loop header successors as not taken. */
668 if (!header_found)
669 for (e = bb->succ; e; e = e->succ_next)
670 if (e->dest->index < 0
671 || !flow_bb_inside_loop_p (loop, e->dest))
672 predict_edge
673 (e, PRED_LOOP_EXIT,
674 (REG_BR_PROB_BASE
675 - predictor_info [(int) PRED_LOOP_EXIT].hitrate)
676 / exits);
679 /* Free basic blocks from get_loop_body. */
680 free (bbs);
683 if (!rtlsimpleloops)
684 scev_reset ();
687 /* Attempt to predict probabilities of BB outgoing edges using local
688 properties. */
689 static void
690 bb_estimate_probability_locally (basic_block bb)
692 rtx last_insn = BB_END (bb);
693 rtx cond;
695 if (! can_predict_insn_p (last_insn))
696 return;
697 cond = get_condition (last_insn, NULL, false, false);
698 if (! cond)
699 return;
701 /* Try "pointer heuristic."
702 A comparison ptr == 0 is predicted as false.
703 Similarly, a comparison ptr1 == ptr2 is predicted as false. */
704 if (COMPARISON_P (cond)
705 && ((REG_P (XEXP (cond, 0)) && REG_POINTER (XEXP (cond, 0)))
706 || (REG_P (XEXP (cond, 1)) && REG_POINTER (XEXP (cond, 1)))))
708 if (GET_CODE (cond) == EQ)
709 predict_insn_def (last_insn, PRED_POINTER, NOT_TAKEN);
710 else if (GET_CODE (cond) == NE)
711 predict_insn_def (last_insn, PRED_POINTER, TAKEN);
713 else
715 /* Try "opcode heuristic."
716 EQ tests are usually false and NE tests are usually true. Also,
717 most quantities are positive, so we can make the appropriate guesses
718 about signed comparisons against zero. */
719 switch (GET_CODE (cond))
721 case CONST_INT:
722 /* Unconditional branch. */
723 predict_insn_def (last_insn, PRED_UNCONDITIONAL,
724 cond == const0_rtx ? NOT_TAKEN : TAKEN);
725 break;
727 case EQ:
728 case UNEQ:
729 /* Floating point comparisons appears to behave in a very
730 unpredictable way because of special role of = tests in
731 FP code. */
732 if (FLOAT_MODE_P (GET_MODE (XEXP (cond, 0))))
734 /* Comparisons with 0 are often used for booleans and there is
735 nothing useful to predict about them. */
736 else if (XEXP (cond, 1) == const0_rtx
737 || XEXP (cond, 0) == const0_rtx)
739 else
740 predict_insn_def (last_insn, PRED_OPCODE_NONEQUAL, NOT_TAKEN);
741 break;
743 case NE:
744 case LTGT:
745 /* Floating point comparisons appears to behave in a very
746 unpredictable way because of special role of = tests in
747 FP code. */
748 if (FLOAT_MODE_P (GET_MODE (XEXP (cond, 0))))
750 /* Comparisons with 0 are often used for booleans and there is
751 nothing useful to predict about them. */
752 else if (XEXP (cond, 1) == const0_rtx
753 || XEXP (cond, 0) == const0_rtx)
755 else
756 predict_insn_def (last_insn, PRED_OPCODE_NONEQUAL, TAKEN);
757 break;
759 case ORDERED:
760 predict_insn_def (last_insn, PRED_FPOPCODE, TAKEN);
761 break;
763 case UNORDERED:
764 predict_insn_def (last_insn, PRED_FPOPCODE, NOT_TAKEN);
765 break;
767 case LE:
768 case LT:
769 if (XEXP (cond, 1) == const0_rtx || XEXP (cond, 1) == const1_rtx
770 || XEXP (cond, 1) == constm1_rtx)
771 predict_insn_def (last_insn, PRED_OPCODE_POSITIVE, NOT_TAKEN);
772 break;
774 case GE:
775 case GT:
776 if (XEXP (cond, 1) == const0_rtx || XEXP (cond, 1) == const1_rtx
777 || XEXP (cond, 1) == constm1_rtx)
778 predict_insn_def (last_insn, PRED_OPCODE_POSITIVE, TAKEN);
779 break;
781 default:
782 break;
786 /* Statically estimate the probability that a branch will be taken and produce
787 estimated profile. When profile feedback is present never executed portions
788 of function gets estimated. */
790 void
791 estimate_probability (struct loops *loops_info)
793 basic_block bb;
795 connect_infinite_loops_to_exit ();
796 calculate_dominance_info (CDI_DOMINATORS);
797 calculate_dominance_info (CDI_POST_DOMINATORS);
799 predict_loops (loops_info, true);
801 iv_analysis_done ();
803 /* Attempt to predict conditional jumps using a number of heuristics. */
804 FOR_EACH_BB (bb)
806 rtx last_insn = BB_END (bb);
807 edge e;
809 if (! can_predict_insn_p (last_insn))
810 continue;
812 for (e = bb->succ; e; e = e->succ_next)
814 /* Predict early returns to be probable, as we've already taken
815 care for error returns and other are often used for fast paths
816 trought function. */
817 if ((e->dest == EXIT_BLOCK_PTR
818 || (e->dest->succ && !e->dest->succ->succ_next
819 && e->dest->succ->dest == EXIT_BLOCK_PTR))
820 && !predicted_by_p (bb, PRED_NULL_RETURN)
821 && !predicted_by_p (bb, PRED_CONST_RETURN)
822 && !predicted_by_p (bb, PRED_NEGATIVE_RETURN)
823 && !last_basic_block_p (e->dest))
824 predict_edge_def (e, PRED_EARLY_RETURN, TAKEN);
826 /* Look for block we are guarding (ie we dominate it,
827 but it doesn't postdominate us). */
828 if (e->dest != EXIT_BLOCK_PTR && e->dest != bb
829 && dominated_by_p (CDI_DOMINATORS, e->dest, e->src)
830 && !dominated_by_p (CDI_POST_DOMINATORS, e->src, e->dest))
832 rtx insn;
834 /* The call heuristic claims that a guarded function call
835 is improbable. This is because such calls are often used
836 to signal exceptional situations such as printing error
837 messages. */
838 for (insn = BB_HEAD (e->dest); insn != NEXT_INSN (BB_END (e->dest));
839 insn = NEXT_INSN (insn))
840 if (CALL_P (insn)
841 /* Constant and pure calls are hardly used to signalize
842 something exceptional. */
843 && ! CONST_OR_PURE_CALL_P (insn))
845 predict_edge_def (e, PRED_CALL, NOT_TAKEN);
846 break;
850 bb_estimate_probability_locally (bb);
853 /* Attach the combined probability to each conditional jump. */
854 FOR_EACH_BB (bb)
855 if (JUMP_P (BB_END (bb))
856 && any_condjump_p (BB_END (bb))
857 && bb->succ->succ_next != NULL)
858 combine_predictions_for_insn (BB_END (bb), bb);
860 remove_fake_exit_edges ();
861 /* Fill in the probability values in flowgraph based on the REG_BR_PROB
862 notes. */
863 FOR_EACH_BB (bb)
865 rtx last_insn = BB_END (bb);
867 if (!can_predict_insn_p (last_insn))
869 /* We can predict only conditional jumps at the moment.
870 Expect each edge to be equally probable.
871 ?? In the future we want to make abnormal edges improbable. */
872 int nedges = 0;
873 edge e;
875 for (e = bb->succ; e; e = e->succ_next)
877 nedges++;
878 if (e->probability != 0)
879 break;
881 if (!e)
882 for (e = bb->succ; e; e = e->succ_next)
883 e->probability = (REG_BR_PROB_BASE + nedges / 2) / nedges;
886 estimate_bb_frequencies (loops_info);
887 free_dominance_info (CDI_POST_DOMINATORS);
888 if (profile_status == PROFILE_ABSENT)
889 profile_status = PROFILE_GUESSED;
892 /* Set edge->probability for each successor edge of BB. */
893 void
894 guess_outgoing_edge_probabilities (basic_block bb)
896 bb_estimate_probability_locally (bb);
897 combine_predictions_for_insn (BB_END (bb), bb);
901 /* Predict using opcode of the last statement in basic block. */
902 static void
903 tree_predict_by_opcode (basic_block bb)
905 tree stmt = last_stmt (bb);
906 edge then_edge;
907 tree cond;
908 tree op0;
909 tree type;
911 if (!stmt || TREE_CODE (stmt) != COND_EXPR)
912 return;
913 for (then_edge = bb->succ; then_edge; then_edge = then_edge->succ_next)
914 if (then_edge->flags & EDGE_TRUE_VALUE)
915 break;
916 cond = TREE_OPERAND (stmt, 0);
917 if (TREE_CODE_CLASS (TREE_CODE (cond)) != '<')
918 return;
919 op0 = TREE_OPERAND (cond, 0);
920 type = TREE_TYPE (op0);
921 /* Try "pointer heuristic."
922 A comparison ptr == 0 is predicted as false.
923 Similarly, a comparison ptr1 == ptr2 is predicted as false. */
924 if (POINTER_TYPE_P (type))
926 if (TREE_CODE (cond) == EQ_EXPR)
927 predict_edge_def (then_edge, PRED_TREE_POINTER, NOT_TAKEN);
928 else if (TREE_CODE (cond) == NE_EXPR)
929 predict_edge_def (then_edge, PRED_TREE_POINTER, TAKEN);
931 else
933 /* Try "opcode heuristic."
934 EQ tests are usually false and NE tests are usually true. Also,
935 most quantities are positive, so we can make the appropriate guesses
936 about signed comparisons against zero. */
937 switch (TREE_CODE (cond))
939 case EQ_EXPR:
940 case UNEQ_EXPR:
941 /* Floating point comparisons appears to behave in a very
942 unpredictable way because of special role of = tests in
943 FP code. */
944 if (FLOAT_TYPE_P (type))
946 /* Comparisons with 0 are often used for booleans and there is
947 nothing useful to predict about them. */
948 else if (integer_zerop (op0)
949 || integer_zerop (TREE_OPERAND (cond, 1)))
951 else
952 predict_edge_def (then_edge, PRED_TREE_OPCODE_NONEQUAL, NOT_TAKEN);
953 break;
955 case NE_EXPR:
956 case LTGT_EXPR:
957 /* Floating point comparisons appears to behave in a very
958 unpredictable way because of special role of = tests in
959 FP code. */
960 if (FLOAT_TYPE_P (type))
962 /* Comparisons with 0 are often used for booleans and there is
963 nothing useful to predict about them. */
964 else if (integer_zerop (op0)
965 || integer_zerop (TREE_OPERAND (cond, 1)))
967 else
968 predict_edge_def (then_edge, PRED_TREE_OPCODE_NONEQUAL, TAKEN);
969 break;
971 case ORDERED_EXPR:
972 predict_edge_def (then_edge, PRED_TREE_FPOPCODE, TAKEN);
973 break;
975 case UNORDERED_EXPR:
976 predict_edge_def (then_edge, PRED_TREE_FPOPCODE, NOT_TAKEN);
977 break;
979 case LE_EXPR:
980 case LT_EXPR:
981 if (integer_zerop (TREE_OPERAND (cond, 1))
982 || integer_onep (TREE_OPERAND (cond, 1))
983 || integer_all_onesp (TREE_OPERAND (cond, 1))
984 || real_zerop (TREE_OPERAND (cond, 1))
985 || real_onep (TREE_OPERAND (cond, 1))
986 || real_minus_onep (TREE_OPERAND (cond, 1)))
987 predict_edge_def (then_edge, PRED_TREE_OPCODE_POSITIVE, NOT_TAKEN);
988 break;
990 case GE_EXPR:
991 case GT_EXPR:
992 if (integer_zerop (TREE_OPERAND (cond, 1))
993 || integer_onep (TREE_OPERAND (cond, 1))
994 || integer_all_onesp (TREE_OPERAND (cond, 1))
995 || real_zerop (TREE_OPERAND (cond, 1))
996 || real_onep (TREE_OPERAND (cond, 1))
997 || real_minus_onep (TREE_OPERAND (cond, 1)))
998 predict_edge_def (then_edge, PRED_TREE_OPCODE_POSITIVE, TAKEN);
999 break;
1001 default:
1002 break;
1006 /* Predict branch probabilities and estimate profile of the tree CFG. */
1007 static void
1008 tree_estimate_probability (void)
1010 basic_block bb;
1011 struct loops loops_info;
1013 flow_loops_find (&loops_info, LOOP_TREE);
1014 if (dump_file && (dump_flags & TDF_DETAILS))
1015 flow_loops_dump (&loops_info, dump_file, NULL, 0);
1017 connect_infinite_loops_to_exit ();
1018 calculate_dominance_info (CDI_DOMINATORS);
1019 calculate_dominance_info (CDI_POST_DOMINATORS);
1021 predict_loops (&loops_info, false);
1023 FOR_EACH_BB (bb)
1025 edge e;
1027 for (e = bb->succ; e; e = e->succ_next)
1029 /* Predict early returns to be probable, as we've already taken
1030 care for error returns and other are often used for fast paths
1031 trought function. */
1032 if ((e->dest == EXIT_BLOCK_PTR
1033 || (e->dest->succ && !e->dest->succ->succ_next
1034 && e->dest->succ->dest == EXIT_BLOCK_PTR))
1035 && !predicted_by_p (bb, PRED_NULL_RETURN)
1036 && !predicted_by_p (bb, PRED_CONST_RETURN)
1037 && !predicted_by_p (bb, PRED_NEGATIVE_RETURN)
1038 && !last_basic_block_p (e->dest))
1039 predict_edge_def (e, PRED_EARLY_RETURN, TAKEN);
1041 /* Look for block we are guarding (ie we dominate it,
1042 but it doesn't postdominate us). */
1043 if (e->dest != EXIT_BLOCK_PTR && e->dest != bb
1044 && dominated_by_p (CDI_DOMINATORS, e->dest, e->src)
1045 && !dominated_by_p (CDI_POST_DOMINATORS, e->src, e->dest))
1047 block_stmt_iterator bi;
1049 /* The call heuristic claims that a guarded function call
1050 is improbable. This is because such calls are often used
1051 to signal exceptional situations such as printing error
1052 messages. */
1053 for (bi = bsi_start (e->dest); !bsi_end_p (bi);
1054 bsi_next (&bi))
1056 tree stmt = bsi_stmt (bi);
1057 if ((TREE_CODE (stmt) == CALL_EXPR
1058 || (TREE_CODE (stmt) == MODIFY_EXPR
1059 && TREE_CODE (TREE_OPERAND (stmt, 1)) == CALL_EXPR))
1060 /* Constant and pure calls are hardly used to signalize
1061 something exceptional. */
1062 && TREE_SIDE_EFFECTS (stmt))
1064 predict_edge_def (e, PRED_CALL, NOT_TAKEN);
1065 break;
1070 tree_predict_by_opcode (bb);
1072 FOR_EACH_BB (bb)
1073 combine_predictions_for_bb (dump_file, bb);
1075 estimate_bb_frequencies (&loops_info);
1076 free_dominance_info (CDI_POST_DOMINATORS);
1077 remove_fake_exit_edges ();
1078 flow_loops_free (&loops_info);
1079 if (dump_file && (dump_flags & TDF_DETAILS))
1080 dump_tree_cfg (dump_file, dump_flags);
1081 if (profile_status == PROFILE_ABSENT)
1082 profile_status = PROFILE_GUESSED;
1085 /* __builtin_expect dropped tokens into the insn stream describing expected
1086 values of registers. Generate branch probabilities based off these
1087 values. */
1089 void
1090 expected_value_to_br_prob (void)
1092 rtx insn, cond, ev = NULL_RTX, ev_reg = NULL_RTX;
1094 for (insn = get_insns (); insn ; insn = NEXT_INSN (insn))
1096 switch (GET_CODE (insn))
1098 case NOTE:
1099 /* Look for expected value notes. */
1100 if (NOTE_LINE_NUMBER (insn) == NOTE_INSN_EXPECTED_VALUE)
1102 ev = NOTE_EXPECTED_VALUE (insn);
1103 ev_reg = XEXP (ev, 0);
1104 delete_insn (insn);
1106 continue;
1108 case CODE_LABEL:
1109 /* Never propagate across labels. */
1110 ev = NULL_RTX;
1111 continue;
1113 case JUMP_INSN:
1114 /* Look for simple conditional branches. If we haven't got an
1115 expected value yet, no point going further. */
1116 if (!JUMP_P (insn) || ev == NULL_RTX
1117 || ! any_condjump_p (insn))
1118 continue;
1119 break;
1121 default:
1122 /* Look for insns that clobber the EV register. */
1123 if (ev && reg_set_p (ev_reg, insn))
1124 ev = NULL_RTX;
1125 continue;
1128 /* Collect the branch condition, hopefully relative to EV_REG. */
1129 /* ??? At present we'll miss things like
1130 (expected_value (eq r70 0))
1131 (set r71 -1)
1132 (set r80 (lt r70 r71))
1133 (set pc (if_then_else (ne r80 0) ...))
1134 as canonicalize_condition will render this to us as
1135 (lt r70, r71)
1136 Could use cselib to try and reduce this further. */
1137 cond = XEXP (SET_SRC (pc_set (insn)), 0);
1138 cond = canonicalize_condition (insn, cond, 0, NULL, ev_reg,
1139 false, false);
1140 if (! cond || XEXP (cond, 0) != ev_reg
1141 || GET_CODE (XEXP (cond, 1)) != CONST_INT)
1142 continue;
1144 /* Substitute and simplify. Given that the expression we're
1145 building involves two constants, we should wind up with either
1146 true or false. */
1147 cond = gen_rtx_fmt_ee (GET_CODE (cond), VOIDmode,
1148 XEXP (ev, 1), XEXP (cond, 1));
1149 cond = simplify_rtx (cond);
1151 /* Turn the condition into a scaled branch probability. */
1152 if (cond != const_true_rtx && cond != const0_rtx)
1153 abort ();
1154 predict_insn_def (insn, PRED_BUILTIN_EXPECT,
1155 cond == const_true_rtx ? TAKEN : NOT_TAKEN);
1159 /* Check whether this is the last basic block of function. Commonly
1160 there is one extra common cleanup block. */
1161 static bool
1162 last_basic_block_p (basic_block bb)
1164 if (bb == EXIT_BLOCK_PTR)
1165 return false;
1167 return (bb->next_bb == EXIT_BLOCK_PTR
1168 || (bb->next_bb->next_bb == EXIT_BLOCK_PTR
1169 && bb->succ && !bb->succ->succ_next
1170 && bb->succ->dest->next_bb == EXIT_BLOCK_PTR));
1173 /* This is used to carry information about basic blocks. It is
1174 attached to the AUX field of the standard CFG block. */
1176 typedef struct block_info_def
1178 /* Estimated frequency of execution of basic_block. */
1179 sreal frequency;
1181 /* To keep queue of basic blocks to process. */
1182 basic_block next;
1184 /* True if block needs to be visited in propagate_freq. */
1185 unsigned int tovisit:1;
1187 /* Number of predecessors we need to visit first. */
1188 int npredecessors;
1189 } *block_info;
1191 /* Similar information for edges. */
1192 typedef struct edge_info_def
1194 /* In case edge is an loopback edge, the probability edge will be reached
1195 in case header is. Estimated number of iterations of the loop can be
1196 then computed as 1 / (1 - back_edge_prob). */
1197 sreal back_edge_prob;
1198 /* True if the edge is an loopback edge in the natural loop. */
1199 unsigned int back_edge:1;
1200 } *edge_info;
1202 #define BLOCK_INFO(B) ((block_info) (B)->aux)
1203 #define EDGE_INFO(E) ((edge_info) (E)->aux)
1205 /* Helper function for estimate_bb_frequencies.
1206 Propagate the frequencies for LOOP. */
1208 static void
1209 propagate_freq (struct loop *loop)
1211 basic_block head = loop->header;
1212 basic_block bb;
1213 basic_block last;
1214 edge e;
1215 basic_block nextbb;
1217 /* For each basic block we need to visit count number of his predecessors
1218 we need to visit first. */
1219 FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR, NULL, next_bb)
1221 if (BLOCK_INFO (bb)->tovisit)
1223 int count = 0;
1225 for (e = bb->pred; e; e = e->pred_next)
1226 if (BLOCK_INFO (e->src)->tovisit && !(e->flags & EDGE_DFS_BACK))
1227 count++;
1228 else if (BLOCK_INFO (e->src)->tovisit
1229 && dump_file && !EDGE_INFO (e)->back_edge)
1230 fprintf (dump_file,
1231 "Irreducible region hit, ignoring edge to %i->%i\n",
1232 e->src->index, bb->index);
1233 BLOCK_INFO (bb)->npredecessors = count;
1237 memcpy (&BLOCK_INFO (head)->frequency, &real_one, sizeof (real_one));
1238 last = head;
1239 for (bb = head; bb; bb = nextbb)
1241 sreal cyclic_probability, frequency;
1243 memcpy (&cyclic_probability, &real_zero, sizeof (real_zero));
1244 memcpy (&frequency, &real_zero, sizeof (real_zero));
1246 nextbb = BLOCK_INFO (bb)->next;
1247 BLOCK_INFO (bb)->next = NULL;
1249 /* Compute frequency of basic block. */
1250 if (bb != head)
1252 #ifdef ENABLE_CHECKING
1253 for (e = bb->pred; e; e = e->pred_next)
1254 if (BLOCK_INFO (e->src)->tovisit && !(e->flags & EDGE_DFS_BACK))
1255 abort ();
1256 #endif
1258 for (e = bb->pred; e; e = e->pred_next)
1259 if (EDGE_INFO (e)->back_edge)
1261 sreal_add (&cyclic_probability, &cyclic_probability,
1262 &EDGE_INFO (e)->back_edge_prob);
1264 else if (!(e->flags & EDGE_DFS_BACK))
1266 sreal tmp;
1268 /* frequency += (e->probability
1269 * BLOCK_INFO (e->src)->frequency /
1270 REG_BR_PROB_BASE); */
1272 sreal_init (&tmp, e->probability, 0);
1273 sreal_mul (&tmp, &tmp, &BLOCK_INFO (e->src)->frequency);
1274 sreal_mul (&tmp, &tmp, &real_inv_br_prob_base);
1275 sreal_add (&frequency, &frequency, &tmp);
1278 if (sreal_compare (&cyclic_probability, &real_zero) == 0)
1280 memcpy (&BLOCK_INFO (bb)->frequency, &frequency,
1281 sizeof (frequency));
1283 else
1285 if (sreal_compare (&cyclic_probability, &real_almost_one) > 0)
1287 memcpy (&cyclic_probability, &real_almost_one,
1288 sizeof (real_almost_one));
1291 /* BLOCK_INFO (bb)->frequency = frequency
1292 / (1 - cyclic_probability) */
1294 sreal_sub (&cyclic_probability, &real_one, &cyclic_probability);
1295 sreal_div (&BLOCK_INFO (bb)->frequency,
1296 &frequency, &cyclic_probability);
1300 BLOCK_INFO (bb)->tovisit = 0;
1302 /* Compute back edge frequencies. */
1303 for (e = bb->succ; e; e = e->succ_next)
1304 if (e->dest == head)
1306 sreal tmp;
1308 /* EDGE_INFO (e)->back_edge_prob
1309 = ((e->probability * BLOCK_INFO (bb)->frequency)
1310 / REG_BR_PROB_BASE); */
1312 sreal_init (&tmp, e->probability, 0);
1313 sreal_mul (&tmp, &tmp, &BLOCK_INFO (bb)->frequency);
1314 sreal_mul (&EDGE_INFO (e)->back_edge_prob,
1315 &tmp, &real_inv_br_prob_base);
1318 /* Propagate to successor blocks. */
1319 for (e = bb->succ; e; e = e->succ_next)
1320 if (!(e->flags & EDGE_DFS_BACK)
1321 && BLOCK_INFO (e->dest)->npredecessors)
1323 BLOCK_INFO (e->dest)->npredecessors--;
1324 if (!BLOCK_INFO (e->dest)->npredecessors)
1326 if (!nextbb)
1327 nextbb = e->dest;
1328 else
1329 BLOCK_INFO (last)->next = e->dest;
1331 last = e->dest;
1337 /* Estimate probabilities of loopback edges in loops at same nest level. */
1339 static void
1340 estimate_loops_at_level (struct loop *first_loop)
1342 struct loop *loop;
1344 for (loop = first_loop; loop; loop = loop->next)
1346 edge e;
1347 basic_block *bbs;
1348 unsigned i;
1350 estimate_loops_at_level (loop->inner);
1352 if (loop->latch->succ) /* Do not do this for dummy function loop. */
1354 /* Find current loop back edge and mark it. */
1355 e = loop_latch_edge (loop);
1356 EDGE_INFO (e)->back_edge = 1;
1359 bbs = get_loop_body (loop);
1360 for (i = 0; i < loop->num_nodes; i++)
1361 BLOCK_INFO (bbs[i])->tovisit = 1;
1362 free (bbs);
1363 propagate_freq (loop);
1367 /* Convert counts measured by profile driven feedback to frequencies.
1368 Return nonzero iff there was any nonzero execution count. */
1370 static int
1371 counts_to_freqs (void)
1373 gcov_type count_max, true_count_max = 0;
1374 basic_block bb;
1376 FOR_EACH_BB (bb)
1377 true_count_max = MAX (bb->count, true_count_max);
1379 count_max = MAX (true_count_max, 1);
1380 FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR, NULL, next_bb)
1381 bb->frequency = (bb->count * BB_FREQ_MAX + count_max / 2) / count_max;
1382 return true_count_max;
1385 /* Return true if function is likely to be expensive, so there is no point to
1386 optimize performance of prologue, epilogue or do inlining at the expense
1387 of code size growth. THRESHOLD is the limit of number of instructions
1388 function can execute at average to be still considered not expensive. */
1390 bool
1391 expensive_function_p (int threshold)
1393 unsigned int sum = 0;
1394 basic_block bb;
1395 unsigned int limit;
1397 /* We can not compute accurately for large thresholds due to scaled
1398 frequencies. */
1399 if (threshold > BB_FREQ_MAX)
1400 abort ();
1402 /* Frequencies are out of range. This either means that function contains
1403 internal loop executing more than BB_FREQ_MAX times or profile feedback
1404 is available and function has not been executed at all. */
1405 if (ENTRY_BLOCK_PTR->frequency == 0)
1406 return true;
1408 /* Maximally BB_FREQ_MAX^2 so overflow won't happen. */
1409 limit = ENTRY_BLOCK_PTR->frequency * threshold;
1410 FOR_EACH_BB (bb)
1412 rtx insn;
1414 for (insn = BB_HEAD (bb); insn != NEXT_INSN (BB_END (bb));
1415 insn = NEXT_INSN (insn))
1416 if (active_insn_p (insn))
1418 sum += bb->frequency;
1419 if (sum > limit)
1420 return true;
1424 return false;
1427 /* Estimate basic blocks frequency by given branch probabilities. */
1429 static void
1430 estimate_bb_frequencies (struct loops *loops)
1432 basic_block bb;
1433 sreal freq_max;
1435 if (!flag_branch_probabilities || !counts_to_freqs ())
1437 static int real_values_initialized = 0;
1439 if (!real_values_initialized)
1441 real_values_initialized = 1;
1442 sreal_init (&real_zero, 0, 0);
1443 sreal_init (&real_one, 1, 0);
1444 sreal_init (&real_br_prob_base, REG_BR_PROB_BASE, 0);
1445 sreal_init (&real_bb_freq_max, BB_FREQ_MAX, 0);
1446 sreal_init (&real_one_half, 1, -1);
1447 sreal_div (&real_inv_br_prob_base, &real_one, &real_br_prob_base);
1448 sreal_sub (&real_almost_one, &real_one, &real_inv_br_prob_base);
1451 mark_dfs_back_edges ();
1453 ENTRY_BLOCK_PTR->succ->probability = REG_BR_PROB_BASE;
1455 /* Set up block info for each basic block. */
1456 alloc_aux_for_blocks (sizeof (struct block_info_def));
1457 alloc_aux_for_edges (sizeof (struct edge_info_def));
1458 FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR, NULL, next_bb)
1460 edge e;
1462 BLOCK_INFO (bb)->tovisit = 0;
1463 for (e = bb->succ; e; e = e->succ_next)
1465 sreal_init (&EDGE_INFO (e)->back_edge_prob, e->probability, 0);
1466 sreal_mul (&EDGE_INFO (e)->back_edge_prob,
1467 &EDGE_INFO (e)->back_edge_prob,
1468 &real_inv_br_prob_base);
1472 /* First compute probabilities locally for each loop from innermost
1473 to outermost to examine probabilities for back edges. */
1474 estimate_loops_at_level (loops->tree_root);
1476 memcpy (&freq_max, &real_zero, sizeof (real_zero));
1477 FOR_EACH_BB (bb)
1478 if (sreal_compare (&freq_max, &BLOCK_INFO (bb)->frequency) < 0)
1479 memcpy (&freq_max, &BLOCK_INFO (bb)->frequency, sizeof (freq_max));
1481 sreal_div (&freq_max, &real_bb_freq_max, &freq_max);
1482 FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR, NULL, next_bb)
1484 sreal tmp;
1486 sreal_mul (&tmp, &BLOCK_INFO (bb)->frequency, &freq_max);
1487 sreal_add (&tmp, &tmp, &real_one_half);
1488 bb->frequency = sreal_to_int (&tmp);
1491 free_aux_for_blocks ();
1492 free_aux_for_edges ();
1494 compute_function_frequency ();
1495 if (flag_reorder_functions)
1496 choose_function_section ();
1499 /* Decide whether function is hot, cold or unlikely executed. */
1500 static void
1501 compute_function_frequency (void)
1503 basic_block bb;
1505 if (!profile_info || !flag_branch_probabilities)
1506 return;
1507 cfun->function_frequency = FUNCTION_FREQUENCY_UNLIKELY_EXECUTED;
1508 FOR_EACH_BB (bb)
1510 if (maybe_hot_bb_p (bb))
1512 cfun->function_frequency = FUNCTION_FREQUENCY_HOT;
1513 return;
1515 if (!probably_never_executed_bb_p (bb))
1516 cfun->function_frequency = FUNCTION_FREQUENCY_NORMAL;
1520 /* Choose appropriate section for the function. */
1521 static void
1522 choose_function_section (void)
1524 if (DECL_SECTION_NAME (current_function_decl)
1525 || !targetm.have_named_sections
1526 /* Theoretically we can split the gnu.linkonce text section too,
1527 but this requires more work as the frequency needs to match
1528 for all generated objects so we need to merge the frequency
1529 of all instances. For now just never set frequency for these. */
1530 || DECL_ONE_ONLY (current_function_decl))
1531 return;
1533 /* If we are doing the partitioning optimization, let the optimization
1534 choose the correct section into which to put things. */
1536 if (flag_reorder_blocks_and_partition)
1537 return;
1539 if (cfun->function_frequency == FUNCTION_FREQUENCY_HOT)
1540 DECL_SECTION_NAME (current_function_decl) =
1541 build_string (strlen (HOT_TEXT_SECTION_NAME), HOT_TEXT_SECTION_NAME);
1542 if (cfun->function_frequency == FUNCTION_FREQUENCY_UNLIKELY_EXECUTED)
1543 DECL_SECTION_NAME (current_function_decl) =
1544 build_string (strlen (UNLIKELY_EXECUTED_TEXT_SECTION_NAME),
1545 UNLIKELY_EXECUTED_TEXT_SECTION_NAME);
1549 struct tree_opt_pass pass_profile =
1551 "profile", /* name */
1552 NULL, /* gate */
1553 tree_estimate_probability, /* execute */
1554 NULL, /* sub */
1555 NULL, /* next */
1556 0, /* static_pass_number */
1557 TV_BRANCH_PROB, /* tv_id */
1558 PROP_cfg, /* properties_required */
1559 0, /* properties_provided */
1560 0, /* properties_destroyed */
1561 0, /* todo_flags_start */
1562 TODO_ggc_collect | TODO_verify_ssa, /* todo_flags_finish */
1563 0 /* letter */