arm.c (arm_init_libfuncs): Add __sync_synchronize.
[official-gcc.git] / gcc / value-prof.c
blob9774ca224f5b6aa515a9fa26f7b0007950cef643
1 /* Transformations based on profile information for values.
2 Copyright (C) 2003, 2004, 2005, 2006, 2007, 2008, 2009 Free Software
3 Foundation, Inc.
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 3, or (at your option) any later
10 version.
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
15 for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
21 #include "config.h"
22 #include "system.h"
23 #include "coretypes.h"
24 #include "tm.h"
25 #include "rtl.h"
26 #include "expr.h"
27 #include "hard-reg-set.h"
28 #include "basic-block.h"
29 #include "value-prof.h"
30 #include "output.h"
31 #include "flags.h"
32 #include "insn-config.h"
33 #include "recog.h"
34 #include "optabs.h"
35 #include "regs.h"
36 #include "ggc.h"
37 #include "tree-flow.h"
38 #include "tree-flow-inline.h"
39 #include "diagnostic.h"
40 #include "coverage.h"
41 #include "tree.h"
42 #include "gcov-io.h"
43 #include "cgraph.h"
44 #include "timevar.h"
45 #include "tree-pass.h"
46 #include "toplev.h"
47 #include "pointer-set.h"
49 static struct value_prof_hooks *value_prof_hooks;
51 /* In this file value profile based optimizations are placed. Currently the
52 following optimizations are implemented (for more detailed descriptions
53 see comments at value_profile_transformations):
55 1) Division/modulo specialization. Provided that we can determine that the
56 operands of the division have some special properties, we may use it to
57 produce more effective code.
58 2) Speculative prefetching. If we are able to determine that the difference
59 between addresses accessed by a memory reference is usually constant, we
60 may add the prefetch instructions.
61 FIXME: This transformation was removed together with RTL based value
62 profiling.
64 3) Indirect/virtual call specialization. If we can determine most
65 common function callee in indirect/virtual call. We can use this
66 information to improve code effectiveness (especially info for
67 inliner).
69 Every such optimization should add its requirements for profiled values to
70 insn_values_to_profile function. This function is called from branch_prob
71 in profile.c and the requested values are instrumented by it in the first
72 compilation with -fprofile-arcs. The optimization may then read the
73 gathered data in the second compilation with -fbranch-probabilities.
75 The measured data is pointed to from the histograms
76 field of the statement annotation of the instrumented insns. It is
77 kept as a linked list of struct histogram_value_t's, which contain the
78 same information as above. */
81 static tree gimple_divmod_fixed_value (gimple, tree, int, gcov_type, gcov_type);
82 static tree gimple_mod_pow2 (gimple, int, gcov_type, gcov_type);
83 static tree gimple_mod_subtract (gimple, int, int, int, gcov_type, gcov_type,
84 gcov_type);
85 static bool gimple_divmod_fixed_value_transform (gimple_stmt_iterator *);
86 static bool gimple_mod_pow2_value_transform (gimple_stmt_iterator *);
87 static bool gimple_mod_subtract_transform (gimple_stmt_iterator *);
88 static bool gimple_stringops_transform (gimple_stmt_iterator *);
89 static bool gimple_ic_transform (gimple);
91 /* Allocate histogram value. */
93 static histogram_value
94 gimple_alloc_histogram_value (struct function *fun ATTRIBUTE_UNUSED,
95 enum hist_type type, gimple stmt, tree value)
97 histogram_value hist = (histogram_value) xcalloc (1, sizeof (*hist));
98 hist->hvalue.value = value;
99 hist->hvalue.stmt = stmt;
100 hist->type = type;
101 return hist;
104 /* Hash value for histogram. */
106 static hashval_t
107 histogram_hash (const void *x)
109 return htab_hash_pointer (((const_histogram_value)x)->hvalue.stmt);
112 /* Return nonzero if decl_id of die_struct X is the same as UID of decl *Y. */
114 static int
115 histogram_eq (const void *x, const void *y)
117 return ((const_histogram_value) x)->hvalue.stmt == (const_gimple) y;
120 /* Set histogram for STMT. */
122 static void
123 set_histogram_value (struct function *fun, gimple stmt, histogram_value hist)
125 void **loc;
126 if (!hist && !VALUE_HISTOGRAMS (fun))
127 return;
128 if (!VALUE_HISTOGRAMS (fun))
129 VALUE_HISTOGRAMS (fun) = htab_create (1, histogram_hash,
130 histogram_eq, NULL);
131 loc = htab_find_slot_with_hash (VALUE_HISTOGRAMS (fun), stmt,
132 htab_hash_pointer (stmt),
133 hist ? INSERT : NO_INSERT);
134 if (!hist)
136 if (loc)
137 htab_clear_slot (VALUE_HISTOGRAMS (fun), loc);
138 return;
140 *loc = hist;
143 /* Get histogram list for STMT. */
145 histogram_value
146 gimple_histogram_value (struct function *fun, gimple stmt)
148 if (!VALUE_HISTOGRAMS (fun))
149 return NULL;
150 return (histogram_value) htab_find_with_hash (VALUE_HISTOGRAMS (fun), stmt,
151 htab_hash_pointer (stmt));
154 /* Add histogram for STMT. */
156 void
157 gimple_add_histogram_value (struct function *fun, gimple stmt,
158 histogram_value hist)
160 hist->hvalue.next = gimple_histogram_value (fun, stmt);
161 set_histogram_value (fun, stmt, hist);
165 /* Remove histogram HIST from STMT's histogram list. */
167 void
168 gimple_remove_histogram_value (struct function *fun, gimple stmt,
169 histogram_value hist)
171 histogram_value hist2 = gimple_histogram_value (fun, stmt);
172 if (hist == hist2)
174 set_histogram_value (fun, stmt, hist->hvalue.next);
176 else
178 while (hist2->hvalue.next != hist)
179 hist2 = hist2->hvalue.next;
180 hist2->hvalue.next = hist->hvalue.next;
182 free (hist->hvalue.counters);
183 #ifdef ENABLE_CHECKING
184 memset (hist, 0xab, sizeof (*hist));
185 #endif
186 free (hist);
190 /* Lookup histogram of type TYPE in the STMT. */
192 histogram_value
193 gimple_histogram_value_of_type (struct function *fun, gimple stmt,
194 enum hist_type type)
196 histogram_value hist;
197 for (hist = gimple_histogram_value (fun, stmt); hist;
198 hist = hist->hvalue.next)
199 if (hist->type == type)
200 return hist;
201 return NULL;
204 /* Dump information about HIST to DUMP_FILE. */
206 static void
207 dump_histogram_value (FILE *dump_file, histogram_value hist)
209 switch (hist->type)
211 case HIST_TYPE_INTERVAL:
212 fprintf (dump_file, "Interval counter range %d -- %d",
213 hist->hdata.intvl.int_start,
214 (hist->hdata.intvl.int_start
215 + hist->hdata.intvl.steps - 1));
216 if (hist->hvalue.counters)
218 unsigned int i;
219 fprintf(dump_file, " [");
220 for (i = 0; i < hist->hdata.intvl.steps; i++)
221 fprintf (dump_file, " %d:"HOST_WIDEST_INT_PRINT_DEC,
222 hist->hdata.intvl.int_start + i,
223 (HOST_WIDEST_INT) hist->hvalue.counters[i]);
224 fprintf (dump_file, " ] outside range:"HOST_WIDEST_INT_PRINT_DEC,
225 (HOST_WIDEST_INT) hist->hvalue.counters[i]);
227 fprintf (dump_file, ".\n");
228 break;
230 case HIST_TYPE_POW2:
231 fprintf (dump_file, "Pow2 counter ");
232 if (hist->hvalue.counters)
234 fprintf (dump_file, "pow2:"HOST_WIDEST_INT_PRINT_DEC
235 " nonpow2:"HOST_WIDEST_INT_PRINT_DEC,
236 (HOST_WIDEST_INT) hist->hvalue.counters[0],
237 (HOST_WIDEST_INT) hist->hvalue.counters[1]);
239 fprintf (dump_file, ".\n");
240 break;
242 case HIST_TYPE_SINGLE_VALUE:
243 fprintf (dump_file, "Single value ");
244 if (hist->hvalue.counters)
246 fprintf (dump_file, "value:"HOST_WIDEST_INT_PRINT_DEC
247 " match:"HOST_WIDEST_INT_PRINT_DEC
248 " wrong:"HOST_WIDEST_INT_PRINT_DEC,
249 (HOST_WIDEST_INT) hist->hvalue.counters[0],
250 (HOST_WIDEST_INT) hist->hvalue.counters[1],
251 (HOST_WIDEST_INT) hist->hvalue.counters[2]);
253 fprintf (dump_file, ".\n");
254 break;
256 case HIST_TYPE_AVERAGE:
257 fprintf (dump_file, "Average value ");
258 if (hist->hvalue.counters)
260 fprintf (dump_file, "sum:"HOST_WIDEST_INT_PRINT_DEC
261 " times:"HOST_WIDEST_INT_PRINT_DEC,
262 (HOST_WIDEST_INT) hist->hvalue.counters[0],
263 (HOST_WIDEST_INT) hist->hvalue.counters[1]);
265 fprintf (dump_file, ".\n");
266 break;
268 case HIST_TYPE_IOR:
269 fprintf (dump_file, "IOR value ");
270 if (hist->hvalue.counters)
272 fprintf (dump_file, "ior:"HOST_WIDEST_INT_PRINT_DEC,
273 (HOST_WIDEST_INT) hist->hvalue.counters[0]);
275 fprintf (dump_file, ".\n");
276 break;
278 case HIST_TYPE_CONST_DELTA:
279 fprintf (dump_file, "Constant delta ");
280 if (hist->hvalue.counters)
282 fprintf (dump_file, "value:"HOST_WIDEST_INT_PRINT_DEC
283 " match:"HOST_WIDEST_INT_PRINT_DEC
284 " wrong:"HOST_WIDEST_INT_PRINT_DEC,
285 (HOST_WIDEST_INT) hist->hvalue.counters[0],
286 (HOST_WIDEST_INT) hist->hvalue.counters[1],
287 (HOST_WIDEST_INT) hist->hvalue.counters[2]);
289 fprintf (dump_file, ".\n");
290 break;
291 case HIST_TYPE_INDIR_CALL:
292 fprintf (dump_file, "Indirect call ");
293 if (hist->hvalue.counters)
295 fprintf (dump_file, "value:"HOST_WIDEST_INT_PRINT_DEC
296 " match:"HOST_WIDEST_INT_PRINT_DEC
297 " all:"HOST_WIDEST_INT_PRINT_DEC,
298 (HOST_WIDEST_INT) hist->hvalue.counters[0],
299 (HOST_WIDEST_INT) hist->hvalue.counters[1],
300 (HOST_WIDEST_INT) hist->hvalue.counters[2]);
302 fprintf (dump_file, ".\n");
303 break;
307 /* Dump all histograms attached to STMT to DUMP_FILE. */
309 void
310 dump_histograms_for_stmt (struct function *fun, FILE *dump_file, gimple stmt)
312 histogram_value hist;
313 for (hist = gimple_histogram_value (fun, stmt); hist; hist = hist->hvalue.next)
314 dump_histogram_value (dump_file, hist);
317 /* Remove all histograms associated with STMT. */
319 void
320 gimple_remove_stmt_histograms (struct function *fun, gimple stmt)
322 histogram_value val;
323 while ((val = gimple_histogram_value (fun, stmt)) != NULL)
324 gimple_remove_histogram_value (fun, stmt, val);
327 /* Duplicate all histograms associates with OSTMT to STMT. */
329 void
330 gimple_duplicate_stmt_histograms (struct function *fun, gimple stmt,
331 struct function *ofun, gimple ostmt)
333 histogram_value val;
334 for (val = gimple_histogram_value (ofun, ostmt); val != NULL; val = val->hvalue.next)
336 histogram_value new_val = gimple_alloc_histogram_value (fun, val->type, NULL, NULL);
337 memcpy (new_val, val, sizeof (*val));
338 new_val->hvalue.stmt = stmt;
339 new_val->hvalue.counters = XNEWVAR (gcov_type, sizeof (*new_val->hvalue.counters) * new_val->n_counters);
340 memcpy (new_val->hvalue.counters, val->hvalue.counters, sizeof (*new_val->hvalue.counters) * new_val->n_counters);
341 gimple_add_histogram_value (fun, stmt, new_val);
346 /* Move all histograms associated with OSTMT to STMT. */
348 void
349 gimple_move_stmt_histograms (struct function *fun, gimple stmt, gimple ostmt)
351 histogram_value val = gimple_histogram_value (fun, ostmt);
352 if (val)
354 /* The following three statements can't be reordered,
355 because histogram hashtab relies on stmt field value
356 for finding the exact slot. */
357 set_histogram_value (fun, ostmt, NULL);
358 for (; val != NULL; val = val->hvalue.next)
359 val->hvalue.stmt = stmt;
360 set_histogram_value (fun, stmt, val);
364 static bool error_found = false;
366 /* Helper function for verify_histograms. For each histogram reachable via htab
367 walk verify that it was reached via statement walk. */
369 static int
370 visit_hist (void **slot, void *data)
372 struct pointer_set_t *visited = (struct pointer_set_t *) data;
373 histogram_value hist = *(histogram_value *) slot;
374 if (!pointer_set_contains (visited, hist))
376 error ("Dead histogram");
377 dump_histogram_value (stderr, hist);
378 debug_gimple_stmt (hist->hvalue.stmt);
379 error_found = true;
381 return 1;
385 /* Verify sanity of the histograms. */
387 void
388 verify_histograms (void)
390 basic_block bb;
391 gimple_stmt_iterator gsi;
392 histogram_value hist;
393 struct pointer_set_t *visited_hists;
395 error_found = false;
396 visited_hists = pointer_set_create ();
397 FOR_EACH_BB (bb)
398 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
400 gimple stmt = gsi_stmt (gsi);
402 for (hist = gimple_histogram_value (cfun, stmt); hist;
403 hist = hist->hvalue.next)
405 if (hist->hvalue.stmt != stmt)
407 error ("Histogram value statement does not correspond to "
408 "the statement it is associated with");
409 debug_gimple_stmt (stmt);
410 dump_histogram_value (stderr, hist);
411 error_found = true;
413 pointer_set_insert (visited_hists, hist);
416 if (VALUE_HISTOGRAMS (cfun))
417 htab_traverse (VALUE_HISTOGRAMS (cfun), visit_hist, visited_hists);
418 pointer_set_destroy (visited_hists);
419 if (error_found)
420 internal_error ("verify_histograms failed");
423 /* Helper function for verify_histograms. For each histogram reachable via htab
424 walk verify that it was reached via statement walk. */
426 static int
427 free_hist (void **slot, void *data ATTRIBUTE_UNUSED)
429 histogram_value hist = *(histogram_value *) slot;
430 free (hist->hvalue.counters);
431 #ifdef ENABLE_CHECKING
432 memset (hist, 0xab, sizeof (*hist));
433 #endif
434 free (hist);
435 return 1;
438 void
439 free_histograms (void)
441 if (VALUE_HISTOGRAMS (cfun))
443 htab_traverse (VALUE_HISTOGRAMS (cfun), free_hist, NULL);
444 htab_delete (VALUE_HISTOGRAMS (cfun));
445 VALUE_HISTOGRAMS (cfun) = NULL;
450 /* The overall number of invocations of the counter should match
451 execution count of basic block. Report it as error rather than
452 internal error as it might mean that user has misused the profile
453 somehow. */
455 static bool
456 check_counter (gimple stmt, const char * name,
457 gcov_type *count, gcov_type *all, gcov_type bb_count)
459 if (*all != bb_count || *count > *all)
461 location_t locus;
462 locus = (stmt != NULL)
463 ? gimple_location (stmt)
464 : DECL_SOURCE_LOCATION (current_function_decl);
465 if (flag_profile_correction)
467 inform (locus, "Correcting inconsistent value profile: "
468 "%s profiler overall count (%d) does not match BB count "
469 "(%d)", name, (int)*all, (int)bb_count);
470 *all = bb_count;
471 if (*count > *all)
472 *count = *all;
473 return false;
475 else
477 error_at (locus, "Corrupted value profile: %s "
478 "profiler overall count (%d) does not match BB count (%d)",
479 name, (int)*all, (int)bb_count);
480 return true;
484 return false;
488 /* GIMPLE based transformations. */
490 static bool
491 gimple_value_profile_transformations (void)
493 basic_block bb;
494 gimple_stmt_iterator gsi;
495 bool changed = false;
497 FOR_EACH_BB (bb)
499 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
501 gimple stmt = gsi_stmt (gsi);
502 histogram_value th = gimple_histogram_value (cfun, stmt);
503 if (!th)
504 continue;
506 if (dump_file)
508 fprintf (dump_file, "Trying transformations on stmt ");
509 print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
510 dump_histograms_for_stmt (cfun, dump_file, stmt);
513 /* Transformations: */
514 /* The order of things in this conditional controls which
515 transformation is used when more than one is applicable. */
516 /* It is expected that any code added by the transformations
517 will be added before the current statement, and that the
518 current statement remain valid (although possibly
519 modified) upon return. */
520 if (flag_value_profile_transformations
521 && (gimple_mod_subtract_transform (&gsi)
522 || gimple_divmod_fixed_value_transform (&gsi)
523 || gimple_mod_pow2_value_transform (&gsi)
524 || gimple_stringops_transform (&gsi)
525 || gimple_ic_transform (stmt)))
527 stmt = gsi_stmt (gsi);
528 changed = true;
529 /* Original statement may no longer be in the same block. */
530 if (bb != gimple_bb (stmt))
532 bb = gimple_bb (stmt);
533 gsi = gsi_for_stmt (stmt);
539 if (changed)
541 counts_to_freqs ();
544 return changed;
548 /* Generate code for transformation 1 (with parent gimple assignment
549 STMT and probability of taking the optimal path PROB, which is
550 equivalent to COUNT/ALL within roundoff error). This generates the
551 result into a temp and returns the temp; it does not replace or
552 alter the original STMT. */
554 static tree
555 gimple_divmod_fixed_value (gimple stmt, tree value, int prob, gcov_type count,
556 gcov_type all)
558 gimple stmt1, stmt2, stmt3;
559 tree tmp1, tmp2, tmpv;
560 gimple bb1end, bb2end, bb3end;
561 basic_block bb, bb2, bb3, bb4;
562 tree optype, op1, op2;
563 edge e12, e13, e23, e24, e34;
564 gimple_stmt_iterator gsi;
566 gcc_assert (is_gimple_assign (stmt)
567 && (gimple_assign_rhs_code (stmt) == TRUNC_DIV_EXPR
568 || gimple_assign_rhs_code (stmt) == TRUNC_MOD_EXPR));
570 optype = TREE_TYPE (gimple_assign_lhs (stmt));
571 op1 = gimple_assign_rhs1 (stmt);
572 op2 = gimple_assign_rhs2 (stmt);
574 bb = gimple_bb (stmt);
575 gsi = gsi_for_stmt (stmt);
577 tmpv = create_tmp_var (optype, "PROF");
578 tmp1 = create_tmp_var (optype, "PROF");
579 stmt1 = gimple_build_assign (tmpv, fold_convert (optype, value));
580 stmt2 = gimple_build_assign (tmp1, op2);
581 stmt3 = gimple_build_cond (NE_EXPR, tmp1, tmpv, NULL_TREE, NULL_TREE);
582 gsi_insert_before (&gsi, stmt1, GSI_SAME_STMT);
583 gsi_insert_before (&gsi, stmt2, GSI_SAME_STMT);
584 gsi_insert_before (&gsi, stmt3, GSI_SAME_STMT);
585 bb1end = stmt3;
587 tmp2 = create_tmp_var (optype, "PROF");
588 stmt1 = gimple_build_assign_with_ops (gimple_assign_rhs_code (stmt), tmp2,
589 op1, tmpv);
590 gsi_insert_before (&gsi, stmt1, GSI_SAME_STMT);
591 bb2end = stmt1;
593 stmt1 = gimple_build_assign_with_ops (gimple_assign_rhs_code (stmt), tmp2,
594 op1, op2);
595 gsi_insert_before (&gsi, stmt1, GSI_SAME_STMT);
596 bb3end = stmt1;
598 /* Fix CFG. */
599 /* Edge e23 connects bb2 to bb3, etc. */
600 e12 = split_block (bb, bb1end);
601 bb2 = e12->dest;
602 bb2->count = count;
603 e23 = split_block (bb2, bb2end);
604 bb3 = e23->dest;
605 bb3->count = all - count;
606 e34 = split_block (bb3, bb3end);
607 bb4 = e34->dest;
608 bb4->count = all;
610 e12->flags &= ~EDGE_FALLTHRU;
611 e12->flags |= EDGE_FALSE_VALUE;
612 e12->probability = prob;
613 e12->count = count;
615 e13 = make_edge (bb, bb3, EDGE_TRUE_VALUE);
616 e13->probability = REG_BR_PROB_BASE - prob;
617 e13->count = all - count;
619 remove_edge (e23);
621 e24 = make_edge (bb2, bb4, EDGE_FALLTHRU);
622 e24->probability = REG_BR_PROB_BASE;
623 e24->count = count;
625 e34->probability = REG_BR_PROB_BASE;
626 e34->count = all - count;
628 return tmp2;
632 /* Do transform 1) on INSN if applicable. */
634 static bool
635 gimple_divmod_fixed_value_transform (gimple_stmt_iterator *si)
637 histogram_value histogram;
638 enum tree_code code;
639 gcov_type val, count, all;
640 tree result, value, tree_val;
641 gcov_type prob;
642 gimple stmt;
644 stmt = gsi_stmt (*si);
645 if (gimple_code (stmt) != GIMPLE_ASSIGN)
646 return false;
648 if (!INTEGRAL_TYPE_P (TREE_TYPE (gimple_assign_lhs (stmt))))
649 return false;
651 code = gimple_assign_rhs_code (stmt);
653 if (code != TRUNC_DIV_EXPR && code != TRUNC_MOD_EXPR)
654 return false;
656 histogram = gimple_histogram_value_of_type (cfun, stmt,
657 HIST_TYPE_SINGLE_VALUE);
658 if (!histogram)
659 return false;
661 value = histogram->hvalue.value;
662 val = histogram->hvalue.counters[0];
663 count = histogram->hvalue.counters[1];
664 all = histogram->hvalue.counters[2];
665 gimple_remove_histogram_value (cfun, stmt, histogram);
667 /* We require that count is at least half of all; this means
668 that for the transformation to fire the value must be constant
669 at least 50% of time (and 75% gives the guarantee of usage). */
670 if (simple_cst_equal (gimple_assign_rhs2 (stmt), value) != 1
671 || 2 * count < all
672 || optimize_bb_for_size_p (gimple_bb (stmt)))
673 return false;
675 if (check_counter (stmt, "value", &count, &all, gimple_bb (stmt)->count))
676 return false;
678 /* Compute probability of taking the optimal path. */
679 if (all > 0)
680 prob = (count * REG_BR_PROB_BASE + all / 2) / all;
681 else
682 prob = 0;
684 tree_val = build_int_cst_wide (get_gcov_type (),
685 (unsigned HOST_WIDE_INT) val,
686 val >> (HOST_BITS_PER_WIDE_INT - 1) >> 1);
687 result = gimple_divmod_fixed_value (stmt, tree_val, prob, count, all);
689 if (dump_file)
691 fprintf (dump_file, "Div/mod by constant ");
692 print_generic_expr (dump_file, value, TDF_SLIM);
693 fprintf (dump_file, "=");
694 print_generic_expr (dump_file, tree_val, TDF_SLIM);
695 fprintf (dump_file, " transformation on insn ");
696 print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
699 gimple_assign_set_rhs_from_tree (si, result);
701 return true;
704 /* Generate code for transformation 2 (with parent gimple assign STMT and
705 probability of taking the optimal path PROB, which is equivalent to COUNT/ALL
706 within roundoff error). This generates the result into a temp and returns
707 the temp; it does not replace or alter the original STMT. */
708 static tree
709 gimple_mod_pow2 (gimple stmt, int prob, gcov_type count, gcov_type all)
711 gimple stmt1, stmt2, stmt3, stmt4;
712 tree tmp2, tmp3;
713 gimple bb1end, bb2end, bb3end;
714 basic_block bb, bb2, bb3, bb4;
715 tree optype, op1, op2;
716 edge e12, e13, e23, e24, e34;
717 gimple_stmt_iterator gsi;
718 tree result;
720 gcc_assert (is_gimple_assign (stmt)
721 && gimple_assign_rhs_code (stmt) == TRUNC_MOD_EXPR);
723 optype = TREE_TYPE (gimple_assign_lhs (stmt));
724 op1 = gimple_assign_rhs1 (stmt);
725 op2 = gimple_assign_rhs2 (stmt);
727 bb = gimple_bb (stmt);
728 gsi = gsi_for_stmt (stmt);
730 result = create_tmp_var (optype, "PROF");
731 tmp2 = create_tmp_var (optype, "PROF");
732 tmp3 = create_tmp_var (optype, "PROF");
733 stmt2 = gimple_build_assign_with_ops (PLUS_EXPR, tmp2, op2,
734 build_int_cst (optype, -1));
735 stmt3 = gimple_build_assign_with_ops (BIT_AND_EXPR, tmp3, tmp2, op2);
736 stmt4 = gimple_build_cond (NE_EXPR, tmp3, build_int_cst (optype, 0),
737 NULL_TREE, NULL_TREE);
738 gsi_insert_before (&gsi, stmt2, GSI_SAME_STMT);
739 gsi_insert_before (&gsi, stmt3, GSI_SAME_STMT);
740 gsi_insert_before (&gsi, stmt4, GSI_SAME_STMT);
741 bb1end = stmt4;
743 /* tmp2 == op2-1 inherited from previous block. */
744 stmt1 = gimple_build_assign_with_ops (BIT_AND_EXPR, result, op1, tmp2);
745 gsi_insert_before (&gsi, stmt1, GSI_SAME_STMT);
746 bb2end = stmt1;
748 stmt1 = gimple_build_assign_with_ops (gimple_assign_rhs_code (stmt), result,
749 op1, op2);
750 gsi_insert_before (&gsi, stmt1, GSI_SAME_STMT);
751 bb3end = stmt1;
753 /* Fix CFG. */
754 /* Edge e23 connects bb2 to bb3, etc. */
755 e12 = split_block (bb, bb1end);
756 bb2 = e12->dest;
757 bb2->count = count;
758 e23 = split_block (bb2, bb2end);
759 bb3 = e23->dest;
760 bb3->count = all - count;
761 e34 = split_block (bb3, bb3end);
762 bb4 = e34->dest;
763 bb4->count = all;
765 e12->flags &= ~EDGE_FALLTHRU;
766 e12->flags |= EDGE_FALSE_VALUE;
767 e12->probability = prob;
768 e12->count = count;
770 e13 = make_edge (bb, bb3, EDGE_TRUE_VALUE);
771 e13->probability = REG_BR_PROB_BASE - prob;
772 e13->count = all - count;
774 remove_edge (e23);
776 e24 = make_edge (bb2, bb4, EDGE_FALLTHRU);
777 e24->probability = REG_BR_PROB_BASE;
778 e24->count = count;
780 e34->probability = REG_BR_PROB_BASE;
781 e34->count = all - count;
783 return result;
786 /* Do transform 2) on INSN if applicable. */
787 static bool
788 gimple_mod_pow2_value_transform (gimple_stmt_iterator *si)
790 histogram_value histogram;
791 enum tree_code code;
792 gcov_type count, wrong_values, all;
793 tree lhs_type, result, value;
794 gcov_type prob;
795 gimple stmt;
797 stmt = gsi_stmt (*si);
798 if (gimple_code (stmt) != GIMPLE_ASSIGN)
799 return false;
801 lhs_type = TREE_TYPE (gimple_assign_lhs (stmt));
802 if (!INTEGRAL_TYPE_P (lhs_type))
803 return false;
805 code = gimple_assign_rhs_code (stmt);
807 if (code != TRUNC_MOD_EXPR || !TYPE_UNSIGNED (lhs_type))
808 return false;
810 histogram = gimple_histogram_value_of_type (cfun, stmt, HIST_TYPE_POW2);
811 if (!histogram)
812 return false;
814 value = histogram->hvalue.value;
815 wrong_values = histogram->hvalue.counters[0];
816 count = histogram->hvalue.counters[1];
818 gimple_remove_histogram_value (cfun, stmt, histogram);
820 /* We require that we hit a power of 2 at least half of all evaluations. */
821 if (simple_cst_equal (gimple_assign_rhs2 (stmt), value) != 1
822 || count < wrong_values
823 || optimize_bb_for_size_p (gimple_bb (stmt)))
824 return false;
826 if (dump_file)
828 fprintf (dump_file, "Mod power of 2 transformation on insn ");
829 print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
832 /* Compute probability of taking the optimal path. */
833 all = count + wrong_values;
835 if (check_counter (stmt, "pow2", &count, &all, gimple_bb (stmt)->count))
836 return false;
838 if (all > 0)
839 prob = (count * REG_BR_PROB_BASE + all / 2) / all;
840 else
841 prob = 0;
843 result = gimple_mod_pow2 (stmt, prob, count, all);
845 gimple_assign_set_rhs_from_tree (si, result);
847 return true;
850 /* Generate code for transformations 3 and 4 (with parent gimple assign STMT, and
851 NCOUNTS the number of cases to support. Currently only NCOUNTS==0 or 1 is
852 supported and this is built into this interface. The probabilities of taking
853 the optimal paths are PROB1 and PROB2, which are equivalent to COUNT1/ALL and
854 COUNT2/ALL respectively within roundoff error). This generates the
855 result into a temp and returns the temp; it does not replace or alter
856 the original STMT. */
857 /* FIXME: Generalize the interface to handle NCOUNTS > 1. */
859 static tree
860 gimple_mod_subtract (gimple stmt, int prob1, int prob2, int ncounts,
861 gcov_type count1, gcov_type count2, gcov_type all)
863 gimple stmt1, stmt2, stmt3;
864 tree tmp1;
865 gimple bb1end, bb2end = NULL, bb3end;
866 basic_block bb, bb2, bb3, bb4;
867 tree optype, op1, op2;
868 edge e12, e23 = 0, e24, e34, e14;
869 gimple_stmt_iterator gsi;
870 tree result;
872 gcc_assert (is_gimple_assign (stmt)
873 && gimple_assign_rhs_code (stmt) == TRUNC_MOD_EXPR);
875 optype = TREE_TYPE (gimple_assign_lhs (stmt));
876 op1 = gimple_assign_rhs1 (stmt);
877 op2 = gimple_assign_rhs2 (stmt);
879 bb = gimple_bb (stmt);
880 gsi = gsi_for_stmt (stmt);
882 result = create_tmp_var (optype, "PROF");
883 tmp1 = create_tmp_var (optype, "PROF");
884 stmt1 = gimple_build_assign (result, op1);
885 stmt2 = gimple_build_assign (tmp1, op2);
886 stmt3 = gimple_build_cond (LT_EXPR, result, tmp1, NULL_TREE, NULL_TREE);
887 gsi_insert_before (&gsi, stmt1, GSI_SAME_STMT);
888 gsi_insert_before (&gsi, stmt2, GSI_SAME_STMT);
889 gsi_insert_before (&gsi, stmt3, GSI_SAME_STMT);
890 bb1end = stmt3;
892 if (ncounts) /* Assumed to be 0 or 1 */
894 stmt1 = gimple_build_assign_with_ops (MINUS_EXPR, result, result, tmp1);
895 stmt2 = gimple_build_cond (LT_EXPR, result, tmp1, NULL_TREE, NULL_TREE);
896 gsi_insert_before (&gsi, stmt1, GSI_SAME_STMT);
897 gsi_insert_before (&gsi, stmt2, GSI_SAME_STMT);
898 bb2end = stmt2;
901 /* Fallback case. */
902 stmt1 = gimple_build_assign_with_ops (gimple_assign_rhs_code (stmt), result,
903 result, tmp1);
904 gsi_insert_before (&gsi, stmt1, GSI_SAME_STMT);
905 bb3end = stmt1;
907 /* Fix CFG. */
908 /* Edge e23 connects bb2 to bb3, etc. */
909 /* However block 3 is optional; if it is not there, references
910 to 3 really refer to block 2. */
911 e12 = split_block (bb, bb1end);
912 bb2 = e12->dest;
913 bb2->count = all - count1;
915 if (ncounts) /* Assumed to be 0 or 1. */
917 e23 = split_block (bb2, bb2end);
918 bb3 = e23->dest;
919 bb3->count = all - count1 - count2;
922 e34 = split_block (ncounts ? bb3 : bb2, bb3end);
923 bb4 = e34->dest;
924 bb4->count = all;
926 e12->flags &= ~EDGE_FALLTHRU;
927 e12->flags |= EDGE_FALSE_VALUE;
928 e12->probability = REG_BR_PROB_BASE - prob1;
929 e12->count = all - count1;
931 e14 = make_edge (bb, bb4, EDGE_TRUE_VALUE);
932 e14->probability = prob1;
933 e14->count = count1;
935 if (ncounts) /* Assumed to be 0 or 1. */
937 e23->flags &= ~EDGE_FALLTHRU;
938 e23->flags |= EDGE_FALSE_VALUE;
939 e23->count = all - count1 - count2;
940 e23->probability = REG_BR_PROB_BASE - prob2;
942 e24 = make_edge (bb2, bb4, EDGE_TRUE_VALUE);
943 e24->probability = prob2;
944 e24->count = count2;
947 e34->probability = REG_BR_PROB_BASE;
948 e34->count = all - count1 - count2;
950 return result;
954 /* Do transforms 3) and 4) on the statement pointed-to by SI if applicable. */
956 static bool
957 gimple_mod_subtract_transform (gimple_stmt_iterator *si)
959 histogram_value histogram;
960 enum tree_code code;
961 gcov_type count, wrong_values, all;
962 tree lhs_type, result, value;
963 gcov_type prob1, prob2;
964 unsigned int i, steps;
965 gcov_type count1, count2;
966 gimple stmt;
968 stmt = gsi_stmt (*si);
969 if (gimple_code (stmt) != GIMPLE_ASSIGN)
970 return false;
972 lhs_type = TREE_TYPE (gimple_assign_lhs (stmt));
973 if (!INTEGRAL_TYPE_P (lhs_type))
974 return false;
976 code = gimple_assign_rhs_code (stmt);
978 if (code != TRUNC_MOD_EXPR || !TYPE_UNSIGNED (lhs_type))
979 return false;
981 histogram = gimple_histogram_value_of_type (cfun, stmt, HIST_TYPE_INTERVAL);
982 if (!histogram)
983 return false;
985 value = histogram->hvalue.value;
986 all = 0;
987 wrong_values = 0;
988 for (i = 0; i < histogram->hdata.intvl.steps; i++)
989 all += histogram->hvalue.counters[i];
991 wrong_values += histogram->hvalue.counters[i];
992 wrong_values += histogram->hvalue.counters[i+1];
993 steps = histogram->hdata.intvl.steps;
994 all += wrong_values;
995 count1 = histogram->hvalue.counters[0];
996 count2 = histogram->hvalue.counters[1];
998 /* Compute probability of taking the optimal path. */
999 if (check_counter (stmt, "interval", &count1, &all, gimple_bb (stmt)->count))
1001 gimple_remove_histogram_value (cfun, stmt, histogram);
1002 return false;
1005 if (flag_profile_correction && count1 + count2 > all)
1006 all = count1 + count2;
1008 gcc_assert (count1 + count2 <= all);
1010 /* We require that we use just subtractions in at least 50% of all
1011 evaluations. */
1012 count = 0;
1013 for (i = 0; i < histogram->hdata.intvl.steps; i++)
1015 count += histogram->hvalue.counters[i];
1016 if (count * 2 >= all)
1017 break;
1019 if (i == steps
1020 || optimize_bb_for_size_p (gimple_bb (stmt)))
1021 return false;
1023 gimple_remove_histogram_value (cfun, stmt, histogram);
1024 if (dump_file)
1026 fprintf (dump_file, "Mod subtract transformation on insn ");
1027 print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
1030 /* Compute probability of taking the optimal path(s). */
1031 if (all > 0)
1033 prob1 = (count1 * REG_BR_PROB_BASE + all / 2) / all;
1034 prob2 = (count2 * REG_BR_PROB_BASE + all / 2) / all;
1036 else
1038 prob1 = prob2 = 0;
1041 /* In practice, "steps" is always 2. This interface reflects this,
1042 and will need to be changed if "steps" can change. */
1043 result = gimple_mod_subtract (stmt, prob1, prob2, i, count1, count2, all);
1045 gimple_assign_set_rhs_from_tree (si, result);
1047 return true;
1050 static struct cgraph_node** pid_map = NULL;
1052 /* Initialize map of pids (pid -> cgraph node) */
1054 static void
1055 init_pid_map (void)
1057 struct cgraph_node *n;
1059 if (pid_map != NULL)
1060 return;
1062 pid_map = XCNEWVEC (struct cgraph_node*, cgraph_max_pid);
1064 for (n = cgraph_nodes; n; n = n->next)
1066 if (n->pid != -1)
1067 pid_map [n->pid] = n;
1071 /* Return cgraph node for function with pid */
1073 static inline struct cgraph_node*
1074 find_func_by_pid (int pid)
1076 init_pid_map ();
1078 return pid_map [pid];
1081 /* Do transformation
1083 if (actual_callee_address == address_of_most_common_function/method)
1084 do direct call
1085 else
1086 old call
1089 static gimple
1090 gimple_ic (gimple stmt, gimple call, struct cgraph_node *direct_call,
1091 int prob, gcov_type count, gcov_type all)
1093 gimple stmt1, stmt2, stmt3;
1094 tree tmp1, tmpv, tmp;
1095 gimple bb1end, bb2end, bb3end;
1096 basic_block bb, bb2, bb3, bb4;
1097 tree optype = build_pointer_type (void_type_node);
1098 edge e12, e13, e23, e24, e34;
1099 gimple_stmt_iterator gsi;
1100 int region;
1102 bb = gimple_bb (stmt);
1103 gsi = gsi_for_stmt (stmt);
1105 tmpv = create_tmp_var (optype, "PROF");
1106 tmp1 = create_tmp_var (optype, "PROF");
1107 stmt1 = gimple_build_assign (tmpv, unshare_expr (gimple_call_fn (call)));
1109 tmp = fold_convert (optype, build_addr (direct_call->decl,
1110 current_function_decl));
1111 stmt2 = gimple_build_assign (tmp1, tmp);
1112 stmt3 = gimple_build_cond (NE_EXPR, tmp1, tmpv, NULL_TREE, NULL_TREE);
1113 gsi_insert_before (&gsi, stmt1, GSI_SAME_STMT);
1114 gsi_insert_before (&gsi, stmt2, GSI_SAME_STMT);
1115 gsi_insert_before (&gsi, stmt3, GSI_SAME_STMT);
1116 bb1end = stmt3;
1118 stmt1 = gimple_copy (stmt);
1119 gimple_call_set_fndecl (stmt1, direct_call->decl);
1120 gsi_insert_before (&gsi, stmt1, GSI_SAME_STMT);
1121 bb2end = stmt1;
1122 bb3end = stmt;
1124 /* Fix CFG. */
1125 /* Edge e23 connects bb2 to bb3, etc. */
1126 e12 = split_block (bb, bb1end);
1127 bb2 = e12->dest;
1128 bb2->count = count;
1129 e23 = split_block (bb2, bb2end);
1130 bb3 = e23->dest;
1131 bb3->count = all - count;
1132 e34 = split_block (bb3, bb3end);
1133 bb4 = e34->dest;
1134 bb4->count = all;
1136 e12->flags &= ~EDGE_FALLTHRU;
1137 e12->flags |= EDGE_FALSE_VALUE;
1138 e12->probability = prob;
1139 e12->count = count;
1141 e13 = make_edge (bb, bb3, EDGE_TRUE_VALUE);
1142 e13->probability = REG_BR_PROB_BASE - prob;
1143 e13->count = all - count;
1145 remove_edge (e23);
1147 e24 = make_edge (bb2, bb4, EDGE_FALLTHRU);
1148 e24->probability = REG_BR_PROB_BASE;
1149 e24->count = count;
1150 e34->probability = REG_BR_PROB_BASE;
1151 e34->count = all - count;
1153 /* Fix eh edges */
1154 region = lookup_stmt_eh_region (stmt);
1155 if (region >= 0 && stmt_could_throw_p (stmt1))
1157 add_stmt_to_eh_region (stmt1, region);
1158 make_eh_edges (stmt1);
1161 if (region >= 0 && stmt_could_throw_p (stmt))
1163 gimple_purge_dead_eh_edges (bb4);
1164 make_eh_edges (stmt);
1167 return stmt1;
1171 For every checked indirect/virtual call determine if most common pid of
1172 function/class method has probability more than 50%. If yes modify code of
1173 this call to:
1176 static bool
1177 gimple_ic_transform (gimple stmt)
1179 histogram_value histogram;
1180 gcov_type val, count, all, bb_all;
1181 gcov_type prob;
1182 tree callee;
1183 gimple modify;
1184 struct cgraph_node *direct_call;
1186 if (gimple_code (stmt) != GIMPLE_CALL)
1187 return false;
1189 callee = gimple_call_fn (stmt);
1191 if (TREE_CODE (callee) == FUNCTION_DECL)
1192 return false;
1194 histogram = gimple_histogram_value_of_type (cfun, stmt, HIST_TYPE_INDIR_CALL);
1195 if (!histogram)
1196 return false;
1198 val = histogram->hvalue.counters [0];
1199 count = histogram->hvalue.counters [1];
1200 all = histogram->hvalue.counters [2];
1201 gimple_remove_histogram_value (cfun, stmt, histogram);
1203 if (4 * count <= 3 * all)
1204 return false;
1206 bb_all = gimple_bb (stmt)->count;
1207 /* The order of CHECK_COUNTER calls is important -
1208 since check_counter can correct the third parameter
1209 and we want to make count <= all <= bb_all. */
1210 if ( check_counter (stmt, "ic", &all, &bb_all, bb_all)
1211 || check_counter (stmt, "ic", &count, &all, all))
1212 return false;
1214 if (all > 0)
1215 prob = (count * REG_BR_PROB_BASE + all / 2) / all;
1216 else
1217 prob = 0;
1218 direct_call = find_func_by_pid ((int)val);
1220 if (direct_call == NULL)
1221 return false;
1223 modify = gimple_ic (stmt, stmt, direct_call, prob, count, all);
1225 if (dump_file)
1227 fprintf (dump_file, "Indirect call -> direct call ");
1228 print_generic_expr (dump_file, gimple_call_fn (stmt), TDF_SLIM);
1229 fprintf (dump_file, "=> ");
1230 print_generic_expr (dump_file, direct_call->decl, TDF_SLIM);
1231 fprintf (dump_file, " transformation on insn ");
1232 print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
1233 fprintf (dump_file, " to ");
1234 print_gimple_stmt (dump_file, modify, 0, TDF_SLIM);
1235 fprintf (dump_file, "hist->count "HOST_WIDEST_INT_PRINT_DEC
1236 " hist->all "HOST_WIDEST_INT_PRINT_DEC"\n", count, all);
1239 return true;
1242 /* Return true if the stringop CALL with FNDECL shall be profiled. */
1243 static bool
1244 interesting_stringop_to_profile_p (tree fndecl, gimple call)
1246 enum built_in_function fcode = DECL_FUNCTION_CODE (fndecl);
1248 if (fcode != BUILT_IN_MEMCPY && fcode != BUILT_IN_MEMPCPY
1249 && fcode != BUILT_IN_MEMSET && fcode != BUILT_IN_BZERO)
1250 return false;
1252 switch (fcode)
1254 case BUILT_IN_MEMCPY:
1255 case BUILT_IN_MEMPCPY:
1256 return validate_gimple_arglist (call, POINTER_TYPE, POINTER_TYPE,
1257 INTEGER_TYPE, VOID_TYPE);
1258 case BUILT_IN_MEMSET:
1259 return validate_gimple_arglist (call, POINTER_TYPE, INTEGER_TYPE,
1260 INTEGER_TYPE, VOID_TYPE);
1261 case BUILT_IN_BZERO:
1262 return validate_gimple_arglist (call, POINTER_TYPE, INTEGER_TYPE,
1263 VOID_TYPE);
1264 default:
1265 gcc_unreachable ();
1269 /* Convert stringop (..., size)
1270 into
1271 if (size == VALUE)
1272 stringop (...., VALUE);
1273 else
1274 stringop (...., size);
1275 assuming constant propagation of VALUE will happen later.
1277 static void
1278 gimple_stringop_fixed_value (gimple stmt, tree value, int prob, gcov_type count,
1279 gcov_type all)
1281 gimple stmt1, stmt2, stmt3;
1282 tree tmp1, tmpv;
1283 gimple bb1end, bb2end;
1284 basic_block bb, bb2, bb3, bb4;
1285 edge e12, e13, e23, e24, e34;
1286 gimple_stmt_iterator gsi;
1287 tree blck_size = gimple_call_arg (stmt, 2);
1288 tree optype = TREE_TYPE (blck_size);
1289 int region;
1291 bb = gimple_bb (stmt);
1292 gsi = gsi_for_stmt (stmt);
1294 if (gsi_end_p (gsi))
1296 edge_iterator ei;
1297 for (ei = ei_start (bb->succs); (e34 = ei_safe_edge (ei)); )
1298 if (!(e34->flags & EDGE_ABNORMAL))
1299 break;
1301 else
1303 e34 = split_block (bb, stmt);
1304 gsi = gsi_for_stmt (stmt);
1306 bb4 = e34->dest;
1308 tmpv = create_tmp_var (optype, "PROF");
1309 tmp1 = create_tmp_var (optype, "PROF");
1310 stmt1 = gimple_build_assign (tmpv, fold_convert (optype, value));
1311 stmt2 = gimple_build_assign (tmp1, blck_size);
1312 stmt3 = gimple_build_cond (NE_EXPR, tmp1, tmpv, NULL_TREE, NULL_TREE);
1313 gsi_insert_before (&gsi, stmt1, GSI_SAME_STMT);
1314 gsi_insert_before (&gsi, stmt2, GSI_SAME_STMT);
1315 gsi_insert_before (&gsi, stmt3, GSI_SAME_STMT);
1316 bb1end = stmt3;
1318 stmt1 = gimple_copy (stmt);
1319 gimple_call_set_arg (stmt1, 2, value);
1320 gsi_insert_before (&gsi, stmt1, GSI_SAME_STMT);
1321 region = lookup_stmt_eh_region (stmt);
1322 if (region >= 0)
1323 add_stmt_to_eh_region (stmt1, region);
1324 bb2end = stmt1;
1326 /* Fix CFG. */
1327 /* Edge e23 connects bb2 to bb3, etc. */
1328 e12 = split_block (bb, bb1end);
1329 bb2 = e12->dest;
1330 bb2->count = count;
1331 e23 = split_block (bb2, bb2end);
1332 bb3 = e23->dest;
1333 bb3->count = all - count;
1335 e12->flags &= ~EDGE_FALLTHRU;
1336 e12->flags |= EDGE_FALSE_VALUE;
1337 e12->probability = prob;
1338 e12->count = count;
1340 e13 = make_edge (bb, bb3, EDGE_TRUE_VALUE);
1341 e13->probability = REG_BR_PROB_BASE - prob;
1342 e13->count = all - count;
1344 remove_edge (e23);
1346 e24 = make_edge (bb2, bb4, EDGE_FALLTHRU);
1347 e24->probability = REG_BR_PROB_BASE;
1348 e24->count = count;
1350 e34->probability = REG_BR_PROB_BASE;
1351 e34->count = all - count;
1354 /* Find values inside STMT for that we want to measure histograms for
1355 division/modulo optimization. */
1356 static bool
1357 gimple_stringops_transform (gimple_stmt_iterator *gsi)
1359 gimple stmt = gsi_stmt (*gsi);
1360 tree fndecl;
1361 tree blck_size;
1362 enum built_in_function fcode;
1363 histogram_value histogram;
1364 gcov_type count, all, val;
1365 tree value;
1366 tree dest, src;
1367 unsigned int dest_align, src_align;
1368 gcov_type prob;
1369 tree tree_val;
1371 if (gimple_code (stmt) != GIMPLE_CALL)
1372 return false;
1373 fndecl = gimple_call_fndecl (stmt);
1374 if (!fndecl)
1375 return false;
1376 fcode = DECL_FUNCTION_CODE (fndecl);
1377 if (!interesting_stringop_to_profile_p (fndecl, stmt))
1378 return false;
1380 if (fcode == BUILT_IN_BZERO)
1381 blck_size = gimple_call_arg (stmt, 1);
1382 else
1383 blck_size = gimple_call_arg (stmt, 2);
1384 if (TREE_CODE (blck_size) == INTEGER_CST)
1385 return false;
1387 histogram = gimple_histogram_value_of_type (cfun, stmt, HIST_TYPE_SINGLE_VALUE);
1388 if (!histogram)
1389 return false;
1390 value = histogram->hvalue.value;
1391 val = histogram->hvalue.counters[0];
1392 count = histogram->hvalue.counters[1];
1393 all = histogram->hvalue.counters[2];
1394 gimple_remove_histogram_value (cfun, stmt, histogram);
1395 /* We require that count is at least half of all; this means
1396 that for the transformation to fire the value must be constant
1397 at least 80% of time. */
1398 if ((6 * count / 5) < all || optimize_bb_for_size_p (gimple_bb (stmt)))
1399 return false;
1400 if (check_counter (stmt, "value", &count, &all, gimple_bb (stmt)->count))
1401 return false;
1402 if (all > 0)
1403 prob = (count * REG_BR_PROB_BASE + all / 2) / all;
1404 else
1405 prob = 0;
1406 dest = gimple_call_arg (stmt, 0);
1407 dest_align = get_pointer_alignment (dest, BIGGEST_ALIGNMENT);
1408 switch (fcode)
1410 case BUILT_IN_MEMCPY:
1411 case BUILT_IN_MEMPCPY:
1412 src = gimple_call_arg (stmt, 1);
1413 src_align = get_pointer_alignment (src, BIGGEST_ALIGNMENT);
1414 if (!can_move_by_pieces (val, MIN (dest_align, src_align)))
1415 return false;
1416 break;
1417 case BUILT_IN_MEMSET:
1418 if (!can_store_by_pieces (val, builtin_memset_read_str,
1419 gimple_call_arg (stmt, 1),
1420 dest_align, true))
1421 return false;
1422 break;
1423 case BUILT_IN_BZERO:
1424 if (!can_store_by_pieces (val, builtin_memset_read_str,
1425 integer_zero_node,
1426 dest_align, true))
1427 return false;
1428 break;
1429 default:
1430 gcc_unreachable ();
1432 tree_val = build_int_cst_wide (get_gcov_type (),
1433 (unsigned HOST_WIDE_INT) val,
1434 val >> (HOST_BITS_PER_WIDE_INT - 1) >> 1);
1435 if (dump_file)
1437 fprintf (dump_file, "Single value %i stringop transformation on ",
1438 (int)val);
1439 print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
1441 gimple_stringop_fixed_value (stmt, tree_val, prob, count, all);
1443 return true;
1446 void
1447 stringop_block_profile (gimple stmt, unsigned int *expected_align,
1448 HOST_WIDE_INT *expected_size)
1450 histogram_value histogram;
1451 histogram = gimple_histogram_value_of_type (cfun, stmt, HIST_TYPE_AVERAGE);
1452 if (!histogram)
1453 *expected_size = -1;
1454 else if (!histogram->hvalue.counters[1])
1456 *expected_size = -1;
1457 gimple_remove_histogram_value (cfun, stmt, histogram);
1459 else
1461 gcov_type size;
1462 size = ((histogram->hvalue.counters[0]
1463 + histogram->hvalue.counters[1] / 2)
1464 / histogram->hvalue.counters[1]);
1465 /* Even if we can hold bigger value in SIZE, INT_MAX
1466 is safe "infinity" for code generation strategies. */
1467 if (size > INT_MAX)
1468 size = INT_MAX;
1469 *expected_size = size;
1470 gimple_remove_histogram_value (cfun, stmt, histogram);
1472 histogram = gimple_histogram_value_of_type (cfun, stmt, HIST_TYPE_IOR);
1473 if (!histogram)
1474 *expected_align = 0;
1475 else if (!histogram->hvalue.counters[0])
1477 gimple_remove_histogram_value (cfun, stmt, histogram);
1478 *expected_align = 0;
1480 else
1482 gcov_type count;
1483 int alignment;
1485 count = histogram->hvalue.counters[0];
1486 alignment = 1;
1487 while (!(count & alignment)
1488 && (alignment * 2 * BITS_PER_UNIT))
1489 alignment <<= 1;
1490 *expected_align = alignment * BITS_PER_UNIT;
1491 gimple_remove_histogram_value (cfun, stmt, histogram);
1495 struct value_prof_hooks {
1496 /* Find list of values for which we want to measure histograms. */
1497 void (*find_values_to_profile) (histogram_values *);
1499 /* Identify and exploit properties of values that are hard to analyze
1500 statically. See value-prof.c for more detail. */
1501 bool (*value_profile_transformations) (void);
1504 /* Find values inside STMT for that we want to measure histograms for
1505 division/modulo optimization. */
1506 static void
1507 gimple_divmod_values_to_profile (gimple stmt, histogram_values *values)
1509 tree lhs, divisor, op0, type;
1510 histogram_value hist;
1512 if (gimple_code (stmt) != GIMPLE_ASSIGN)
1513 return;
1515 lhs = gimple_assign_lhs (stmt);
1516 type = TREE_TYPE (lhs);
1517 if (!INTEGRAL_TYPE_P (type))
1518 return;
1520 switch (gimple_assign_rhs_code (stmt))
1522 case TRUNC_DIV_EXPR:
1523 case TRUNC_MOD_EXPR:
1524 divisor = gimple_assign_rhs2 (stmt);
1525 op0 = gimple_assign_rhs1 (stmt);
1527 VEC_reserve (histogram_value, heap, *values, 3);
1529 if (is_gimple_reg (divisor))
1530 /* Check for the case where the divisor is the same value most
1531 of the time. */
1532 VEC_quick_push (histogram_value, *values,
1533 gimple_alloc_histogram_value (cfun,
1534 HIST_TYPE_SINGLE_VALUE,
1535 stmt, divisor));
1537 /* For mod, check whether it is not often a noop (or replaceable by
1538 a few subtractions). */
1539 if (gimple_assign_rhs_code (stmt) == TRUNC_MOD_EXPR
1540 && TYPE_UNSIGNED (type))
1542 tree val;
1543 /* Check for a special case where the divisor is power of 2. */
1544 VEC_quick_push (histogram_value, *values,
1545 gimple_alloc_histogram_value (cfun, HIST_TYPE_POW2,
1546 stmt, divisor));
1548 val = build2 (TRUNC_DIV_EXPR, type, op0, divisor);
1549 hist = gimple_alloc_histogram_value (cfun, HIST_TYPE_INTERVAL,
1550 stmt, val);
1551 hist->hdata.intvl.int_start = 0;
1552 hist->hdata.intvl.steps = 2;
1553 VEC_quick_push (histogram_value, *values, hist);
1555 return;
1557 default:
1558 return;
1562 /* Find calls inside STMT for that we want to measure histograms for
1563 indirect/virtual call optimization. */
1565 static void
1566 gimple_indirect_call_to_profile (gimple stmt, histogram_values *values)
1568 tree callee;
1570 if (gimple_code (stmt) != GIMPLE_CALL
1571 || gimple_call_fndecl (stmt) != NULL_TREE)
1572 return;
1574 callee = gimple_call_fn (stmt);
1576 VEC_reserve (histogram_value, heap, *values, 3);
1578 VEC_quick_push (histogram_value, *values,
1579 gimple_alloc_histogram_value (cfun, HIST_TYPE_INDIR_CALL,
1580 stmt, callee));
1582 return;
1585 /* Find values inside STMT for that we want to measure histograms for
1586 string operations. */
1587 static void
1588 gimple_stringops_values_to_profile (gimple stmt, histogram_values *values)
1590 tree fndecl;
1591 tree blck_size;
1592 tree dest;
1593 enum built_in_function fcode;
1595 if (gimple_code (stmt) != GIMPLE_CALL)
1596 return;
1597 fndecl = gimple_call_fndecl (stmt);
1598 if (!fndecl)
1599 return;
1600 fcode = DECL_FUNCTION_CODE (fndecl);
1602 if (!interesting_stringop_to_profile_p (fndecl, stmt))
1603 return;
1605 dest = gimple_call_arg (stmt, 0);
1606 if (fcode == BUILT_IN_BZERO)
1607 blck_size = gimple_call_arg (stmt, 1);
1608 else
1609 blck_size = gimple_call_arg (stmt, 2);
1611 if (TREE_CODE (blck_size) != INTEGER_CST)
1613 VEC_safe_push (histogram_value, heap, *values,
1614 gimple_alloc_histogram_value (cfun, HIST_TYPE_SINGLE_VALUE,
1615 stmt, blck_size));
1616 VEC_safe_push (histogram_value, heap, *values,
1617 gimple_alloc_histogram_value (cfun, HIST_TYPE_AVERAGE,
1618 stmt, blck_size));
1620 if (TREE_CODE (blck_size) != INTEGER_CST)
1621 VEC_safe_push (histogram_value, heap, *values,
1622 gimple_alloc_histogram_value (cfun, HIST_TYPE_IOR,
1623 stmt, dest));
1626 /* Find values inside STMT for that we want to measure histograms and adds
1627 them to list VALUES. */
1629 static void
1630 gimple_values_to_profile (gimple stmt, histogram_values *values)
1632 if (flag_value_profile_transformations)
1634 gimple_divmod_values_to_profile (stmt, values);
1635 gimple_stringops_values_to_profile (stmt, values);
1636 gimple_indirect_call_to_profile (stmt, values);
1640 static void
1641 gimple_find_values_to_profile (histogram_values *values)
1643 basic_block bb;
1644 gimple_stmt_iterator gsi;
1645 unsigned i;
1646 histogram_value hist = NULL;
1648 *values = NULL;
1649 FOR_EACH_BB (bb)
1650 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
1651 gimple_values_to_profile (gsi_stmt (gsi), values);
1653 for (i = 0; VEC_iterate (histogram_value, *values, i, hist); i++)
1655 switch (hist->type)
1657 case HIST_TYPE_INTERVAL:
1658 hist->n_counters = hist->hdata.intvl.steps + 2;
1659 break;
1661 case HIST_TYPE_POW2:
1662 hist->n_counters = 2;
1663 break;
1665 case HIST_TYPE_SINGLE_VALUE:
1666 hist->n_counters = 3;
1667 break;
1669 case HIST_TYPE_CONST_DELTA:
1670 hist->n_counters = 4;
1671 break;
1673 case HIST_TYPE_INDIR_CALL:
1674 hist->n_counters = 3;
1675 break;
1677 case HIST_TYPE_AVERAGE:
1678 hist->n_counters = 2;
1679 break;
1681 case HIST_TYPE_IOR:
1682 hist->n_counters = 1;
1683 break;
1685 default:
1686 gcc_unreachable ();
1688 if (dump_file)
1690 fprintf (dump_file, "Stmt ");
1691 print_gimple_stmt (dump_file, hist->hvalue.stmt, 0, TDF_SLIM);
1692 dump_histogram_value (dump_file, hist);
1697 static struct value_prof_hooks gimple_value_prof_hooks = {
1698 gimple_find_values_to_profile,
1699 gimple_value_profile_transformations
1702 void
1703 gimple_register_value_prof_hooks (void)
1705 gcc_assert (current_ir_type () == IR_GIMPLE);
1706 value_prof_hooks = &gimple_value_prof_hooks;
1709 /* IR-independent entry points. */
1710 void
1711 find_values_to_profile (histogram_values *values)
1713 (value_prof_hooks->find_values_to_profile) (values);
1716 bool
1717 value_profile_transformations (void)
1719 return (value_prof_hooks->value_profile_transformations) ();