gcc/ipa-inline.c

   1 /* Inlining decision heuristics.
   2    Copyright (C) 2003-2017 Free Software Foundation, Inc.
   3    Contributed by Jan Hubicka
   4
   5 This file is part of GCC.
   6
   7 GCC is free software; you can redistribute it and/or modify it under
   8 the terms of the GNU General Public License as published by the Free
   9 Software Foundation; either version 3, or (at your option) any later
  10 version.
  11
  12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  14 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  15 for more details.
  16
  17 You should have received a copy of the GNU General Public License
  18 along with GCC; see the file COPYING3.  If not see
  19 <http://www.gnu.org/licenses/>.  */
  20
  21 /*  Inlining decision heuristics
  22
  23     The implementation of inliner is organized as follows:
  24
  25     inlining heuristics limits
  26
  27       can_inline_edge_p checks that a particular inlining is allowed by
  28       the limits specified by the user (allowed function growth, stack
  29       growth and so on).
  30
  31       Functions are inlined when it is obvious the result is profitable (such
  32       as functions called once or when inlining reduces code size).
  33       In addition to that we perform inlining of small functions and recursive
  34       inlining.
  35
  36     inlining heuristics
  37
  38        The inliner itself is split into two passes:
  39
  40        pass_early_inlining
  41
  42          Simple local inlining pass inlining callees into current function.
  43          This pass makes no use of whole unit analysis and thus it can do only
  44          very simple decisions based on local properties.
  45
  46          The strength of the pass is that it is run in topological order
  47          (reverse postorder) on the callgraph. Functions are converted into SSA
  48          form just before this pass and optimized subsequently. As a result, the
  49          callees of the function seen by the early inliner were already optimized
  50          and the results of early inlining add a lot of optimization
  51          opportunities for the local optimization.
  52
  53          The pass handles the obvious inlining decisions within the compilation
  54          unit - inlining auto inline functions, inlining for size and
  55          flattening.
  56
  57          The main strength of the pass is the ability to eliminate abstraction
  58          penalty in C++ code (via combination of inlining and early
  59          optimization) and thus improve quality of analysis done by real IPA
  60          optimizers.
  61
  62          Because of lack of whole unit knowledge, the pass can not really make
  63          good code size/performance tradeoffs.  It however does very simple
  64          speculative inlining allowing code size to grow by
  65          EARLY_INLINING_INSNS when callee is leaf function.  In this case the
  66          optimizations performed later are very likely to eliminate the cost.
  67
  68        pass_ipa_inline
  69
  70          This is the real inliner able to handle inlining with whole program
  71          knowledge. It performs the following steps:
  72
  73          1) inlining of small functions.  This is implemented by greedy
  74          algorithm ordering all inlinable cgraph edges by their badness and
  75          inlining them in this order as long as inline limits allow doing so.
  76
  77          This heuristic is not very good on inlining recursive calls. Recursive
  78          calls can be inlined with results similar to loop unrolling. To do so,
  79          special purpose recursive inliner is executed on function when
  80          recursive edge is met as viable candidate.
  81
  82          2) Unreachable functions are removed from callgraph.  Inlining leads
  83          to devirtualization and other modification of callgraph so functions
  84          may become unreachable during the process. Also functions declared as
  85          extern inline or virtual functions are removed, since after inlining
  86          we no longer need the offline bodies.
  87
  88          3) Functions called once and not exported from the unit are inlined.
  89          This should almost always lead to reduction of code size by eliminating
  90          the need for offline copy of the function.  */
  91
  92 #include "config.h"
  93 #include "system.h"
  94 #include "coretypes.h"
  95 #include "backend.h"
  96 #include "target.h"
  97 #include "rtl.h"
  98 #include "tree.h"
  99 #include "gimple.h"
 100 #include "alloc-pool.h"
 101 #include "tree-pass.h"
 102 #include "gimple-ssa.h"
 103 #include "cgraph.h"
 104 #include "lto-streamer.h"
 105 #include "trans-mem.h"
 106 #include "calls.h"
 107 #include "tree-inline.h"
 108 #include "params.h"
 109 #include "profile.h"
 110 #include "symbol-summary.h"
 111 #include "tree-vrp.h"
 112 #include "ipa-prop.h"
 113 #include "ipa-inline.h"
 114 #include "ipa-utils.h"
 115 #include "sreal.h"
 116 #include "auto-profile.h"
 117 #include "builtins.h"
 118 #include "fibonacci_heap.h"
 119
 120 typedef fibonacci_heap <sreal, cgraph_edge> edge_heap_t;
 121 typedef fibonacci_node <sreal, cgraph_edge> edge_heap_node_t;
 122
 123 /* Statistics collected while the inlining algorithm runs.  */
 124 static int overall_size;
 125 static gcov_type max_count;
 126 static gcov_type spec_rem;
 127
 128 /* Pre-computed sreal constants 1/CGRAPH_FREQ_BASE and 1/100.  */
 129 static sreal cgraph_freq_base_rec, percent_rec;
 130
 131 /* Return false when inlining edge E would violate the limits on
 132    function body growth or stack usage growth; in that case the reason
 133    is stored in E->inline_failed.
 134
 135    The relative body growth limit exists to avoid problems with
 136    non-linear behavior of the compiler.  It is based on the largest self
 137    size among the callee and the functions on the inline chain of
 138    E->caller, so a huge function can still be inlined into a tiny
 139    wrapper.
 140
 141    The stack growth limit is based on the largest self stack frame on
 142    that chain; it guards against stack overflows at run time.  */
 143
 144 static bool
 145 caller_growth_limits (struct cgraph_edge *e)
 146 {
 147   cgraph_node *node = e->caller;
 148   cgraph_node *callee = e->callee->ultimate_alias_target ();
 149   inline_summary *direct_info = inline_summaries->get (node);
 150   inline_summary *root_info;
 151   int size_limit = 0;
 152   HOST_WIDE_INT stack_limit = 0;
 153
 154   /* Climb from E->caller to the function it is ultimately inlined
 155      into, remembering the largest self size and self stack frame seen
 156      on the way.  Basing the limits on these maxima, rather than on
 157      the outermost function or on the body we immediately inline into,
 158      is the most relaxed reading of the rule "do not grow large
 159      functions too much in order to prevent compiler from exploding".
 160      When the loop ends, NODE is the outermost function and ROOT_INFO
 161      is its summary.  */
 162   for (;; node = node->callers->caller)
 163     {
 164       root_info = inline_summaries->get (node);
 165       size_limit = MAX (size_limit, root_info->self_size);
 166       stack_limit = MAX (stack_limit,
 167                          root_info->estimated_self_stack_size);
 168       if (!node->global.inlined_to)
 169         break;
 170     }
 171
 172   /* The callee's own self size counts towards the base of the limit.  */
 173   inline_summary *callee_info = inline_summaries->get (callee);
 174   size_limit = MAX (size_limit, callee_info->self_size);
 175   size_limit += size_limit * PARAM_VALUE (PARAM_LARGE_FUNCTION_GROWTH) / 100;
 176
 177   /* Compare the estimated size after inlining with the limits.  A
 178      result smaller than the current size is always accepted, so that
 179      a function pushed over the limits by forced inlining may still
 180      shrink.  */
 181   int new_size = estimate_size_after_inlining (node, e);
 182   if (new_size >= root_info->size
 183       && new_size > PARAM_VALUE (PARAM_LARGE_FUNCTION_INSNS)
 184       && new_size > size_limit)
 185     {
 186       e->inline_failed = CIF_LARGE_FUNCTION_GROWTH_LIMIT;
 187       return false;
 188     }
 189
 190   /* A callee whose estimated stack size is zero cannot violate the
 191      stack limit.  */
 192   if (callee_info->estimated_stack_size == 0)
 193     return true;
 194
 195   /* FIXME: Stack size limit often prevents inlining in Fortran programs
 196      due to large i/o datastructures used by the Fortran front-end.
 197      We ought to ignore this limit when we know that the edge is executed
 198      on every invocation of the caller (i.e. its call statement dominates
 199      exit block).  We do not track this information, yet.  */
 200   stack_limit += ((gcov_type) stack_limit
 201                   * PARAM_VALUE (PARAM_STACK_FRAME_GROWTH) / 100);
 202
 203   /* New stack consumption at the place the stack is used: E->caller's
 204      frame offset plus its self stack size plus the callee's stack size.  */
 205   HOST_WIDE_INT inlined_stack = (direct_info->stack_frame_offset
 206                                  + direct_info->estimated_self_stack_size
 207                                  + callee_info->estimated_stack_size);
 208
 209   /* Inlining is fine when the new consumption stays within the relative
 210      limit, or within PARAM_LARGE_STACK_FRAME, or does not exceed the
 211      estimated stack size the outermost function already has (e.g. from
 212      a sibling inline call; this overoptimistically assumes that we are
 213      good at stack packing).  */
 214   if (inlined_stack <= stack_limit
 215       || inlined_stack <= root_info->estimated_stack_size
 216       || inlined_stack <= PARAM_VALUE (PARAM_LARGE_STACK_FRAME))
 217     return true;
 218
 219   e->inline_failed = CIF_LARGE_STACK_FRAME_GROWTH_LIMIT;
 220   return false;
 221 }
 222
 223 /* Dump to the dump file, if there is one, why inlining E has failed.  */
 224
 225 static void
 226 report_inline_failed_reason (struct cgraph_edge *e)
 227 {
 228   if (!dump_file)
 229     return;
 230   fprintf (dump_file, "  not inlinable: %s/%i -> %s/%i, %s\n",
 231            xstrdup_for_dump (e->caller->name ()), e->caller->order,
 232            xstrdup_for_dump (e->callee->name ()), e->callee->order,
 233            cgraph_inline_failed_string (e->inline_failed));
 234
 235   /* Only option mismatches get the extra detail below.  */
 236   if (e->inline_failed != CIF_TARGET_OPTION_MISMATCH
 237       && e->inline_failed != CIF_OPTIMIZATION_MISMATCH)
 238     return;
 239   cgraph_node *callee = e->callee->ultimate_alias_target ();
 240   if (e->caller->lto_file_data && callee->lto_file_data)
 241     fprintf (dump_file, "  LTO objects: %s, %s\n",
 242              e->caller->lto_file_data->file_name,
 243              callee->lto_file_data->file_name);
 244   if (e->inline_failed == CIF_TARGET_OPTION_MISMATCH)
 245     cl_target_option_print_diff
 246       (dump_file, 2, target_opts_for_fn (e->caller->decl),
 247        target_opts_for_fn (callee->decl));
 248   else
 249     cl_optimization_print_diff
 250       (dump_file, 2, opts_for_fn (e->caller->decl),
 251        opts_for_fn (callee->decl));
 252 }
 253
 254 /* Return true if sanitizer attributes permit inlining CALLEE into CALLER.  */
 255
 256 static bool
 257 sanitize_attrs_match_for_inline_p (const_tree caller, const_tree callee)
 258 {
 259   /* Nothing to compare when the address sanitizer is off or a decl is
 260      missing.  */
 261   if (!(flag_sanitize & SANITIZE_ADDRESS) || !caller || !callee)
 262     return true;
 263
 264   /* Both must carry no_sanitize_address, or neither.  */
 265   bool caller_opts_out
 266     = lookup_attribute ("no_sanitize_address", DECL_ATTRIBUTES (caller));
 267   bool callee_opts_out
 268     = lookup_attribute ("no_sanitize_address", DECL_ATTRIBUTES (callee));
 269   return caller_opts_out == callee_opts_out;
 270 }
 271
 272 /* True if FLAG differs between the in-scope caller and callee, unless
 273    always_inline (also in scope) is set and caller's value is greater.  */
 274 #define check_maybe_up(flag) \
 275       (opts_for_fn (caller->decl)->x_##flag             \
 276        != opts_for_fn (callee->decl)->x_##flag          \
 277        && (!always_inline                               \
 278            || opts_for_fn (caller->decl)->x_##flag      \
 279               < opts_for_fn (callee->decl)->x_##flag))
 280 /* True if FLAG differs between the in-scope caller and callee, unless
 281    always_inline (also in scope) is set and caller's value is smaller.  */
 282 #define check_maybe_down(flag) \
 283       (opts_for_fn (caller->decl)->x_##flag             \
 284        != opts_for_fn (callee->decl)->x_##flag          \
 285        && (!always_inline                               \
 286            || opts_for_fn (caller->decl)->x_##flag      \
 287               > opts_for_fn (callee->decl)->x_##flag))
 288 /* True if FLAG differs at all; for flags needing an exact match.  */
 289 #define check_match(flag) \
 290       (opts_for_fn (caller->decl)->x_##flag             \
 291        != opts_for_fn (callee->decl)->x_##flag)
 292
 293 /* Decide if edge E can be inlined, possibly updating E->inline_failed
 294    with the reason when it cannot.
 295    We check whether inlining is possible at all and whether
 296    caller growth limits allow doing so.
 297
 298    If REPORT is true, output the failure reason to the dump file.
 299    If DISREGARD_LIMITS is true, ignore size limits.  If EARLY is true,
 300    some optimization-option mismatch checks are skipped (see below).  */
 301
 302 static bool
 303 can_inline_edge_p (struct cgraph_edge *e, bool report,
 304                    bool disregard_limits = false, bool early = false)
 305 {
 306   gcc_checking_assert (e->inline_failed);
 307
 308   if (cgraph_inline_failed_type (e->inline_failed) == CIF_FINAL_ERROR)
 309     {
 310       if (report)
 311         report_inline_failed_reason (e);
 312       return false;
 313     }
 314
 315   bool inlinable = true;
 316   enum availability avail;
 317   cgraph_node *caller = e->caller->global.inlined_to
 318                         ? e->caller->global.inlined_to : e->caller;
 319   cgraph_node *callee = e->callee->ultimate_alias_target (&avail, caller);
 320   tree caller_tree = DECL_FUNCTION_SPECIFIC_OPTIMIZATION (caller->decl);
 321   tree callee_tree
 322     = callee ? DECL_FUNCTION_SPECIFIC_OPTIMIZATION (callee->decl) : NULL;
 323   /* NOTE(review): CALLEE is NULL-tested above yet dereferenced below.  */
 324   if (!callee->definition)
 325     {
 326       e->inline_failed = CIF_BODY_NOT_AVAILABLE;
 327       inlinable = false;
 328     }
 329   else if (callee->calls_comdat_local)
 330     {
 331       e->inline_failed = CIF_USES_COMDAT_LOCAL;
 332       inlinable = false;
 333     }
 334   else if (avail <= AVAIL_INTERPOSABLE)
 335     {
 336       e->inline_failed = CIF_OVERWRITABLE;
 337       inlinable = false;
 338     }
 339   /* All edges with call_stmt_cannot_inline_p should have inline_failed
 340      initialized to one of FINAL_ERROR reasons.  */
 341   else if (e->call_stmt_cannot_inline_p)
 342     gcc_unreachable ();
 343   /* Don't inline if the functions have different EH personalities.  */
 344   else if (DECL_FUNCTION_PERSONALITY (caller->decl)
 345            && DECL_FUNCTION_PERSONALITY (callee->decl)
 346            && (DECL_FUNCTION_PERSONALITY (caller->decl)
 347                != DECL_FUNCTION_PERSONALITY (callee->decl)))
 348     {
 349       e->inline_failed = CIF_EH_PERSONALITY;
 350       inlinable = false;
 351     }
 352   /* TM pure functions should not be inlined into non-TM_pure
 353      functions.  */
 354   else if (is_tm_pure (callee->decl) && !is_tm_pure (caller->decl))
 355     {
 356       e->inline_failed = CIF_UNSPECIFIED;
 357       inlinable = false;
 358     }
 359   /* Check compatibility of target optimization options.  */
 360   else if (!targetm.target_option.can_inline_p (caller->decl,
 361                                                 callee->decl))
 362     {
 363       e->inline_failed = CIF_TARGET_OPTION_MISMATCH;
 364       inlinable = false;
 365     }
 366   else if (!inline_summaries->get (callee)->inlinable)
 367     {
 368       e->inline_failed = CIF_FUNCTION_NOT_INLINABLE;
 369       inlinable = false;
 370     }
 371   /* Don't inline a function with mismatched sanitization attributes.  */
 372   else if (!sanitize_attrs_match_for_inline_p (caller->decl, callee->decl))
 373     {
 374       e->inline_failed = CIF_ATTRIBUTE_MISMATCH;
 375       inlinable = false;
 376     }
 377   /* Check caller growth; caller_growth_limits records the reason.  */
 378   else if (!DECL_DISREGARD_INLINE_LIMITS (callee->decl)
 379            && !disregard_limits
 380            && !lookup_attribute ("flatten",
 381                                  DECL_ATTRIBUTES (caller->decl))
 382            && !caller_growth_limits (e))
 383     inlinable = false;
 384   /* Don't inline a function with a higher optimization level than the
 385      caller.  FIXME: this is really just the tip of the iceberg of
 386      handling the optimization attribute.  */
 387   else if (caller_tree != callee_tree)
 388     {
 389       bool always_inline =
 390              (DECL_DISREGARD_INLINE_LIMITS (callee->decl)
 391               && lookup_attribute ("always_inline",
 392                                    DECL_ATTRIBUTES (callee->decl)));
 393       inline_summary *caller_info = inline_summaries->get (caller);
 394       inline_summary *callee_info = inline_summaries->get (callee);
 395
 396       /* Until GCC 4.9 we did not check the semantics-altering flags
 397          below and inlined across optimization boundaries.
 398          Enabling the checks below breaks several packages by refusing
 399          to inline library always_inline functions.  See PR65873.
 400          Disable the check for early inlining for now until a better
 401          solution is found.  */
 402      if (always_inline && early)
 403         ;
 404       /* There are some options that change IL semantics which means
 405          we cannot inline in these cases for correctness reason.
 406          Not even for always_inline declared functions.  */
 407       /* Strictly speaking only when the callee contains signed integer
 408          math where overflow is undefined.  */
 409      else if ((check_maybe_up (flag_strict_overflow)
 410                /* This flag is set by optimize.  Allow inlining across
 411                   optimize boundary.  */
 412                && (!opt_for_fn (caller->decl, optimize)
 413                    == !opt_for_fn (callee->decl, optimize) || !always_inline))
 414               || check_match (flag_wrapv)
 415               || check_match (flag_trapv)
 416               /* When both caller and callee do FP math, be sure FP codegen
 417                  flags are compatible.  */
 418               || ((caller_info->fp_expressions && callee_info->fp_expressions)
 419                   && (check_maybe_up (flag_rounding_math)
 420                       || check_maybe_up (flag_trapping_math)
 421                       || check_maybe_down (flag_unsafe_math_optimizations)
 422                       || check_maybe_down (flag_finite_math_only)
 423                       || check_maybe_up (flag_signaling_nans)
 424                       || check_maybe_down (flag_cx_limited_range)
 425                       || check_maybe_up (flag_signed_zeros)
 426                       || check_maybe_down (flag_associative_math)
 427                       || check_maybe_down (flag_reciprocal_math)
 428                       || check_maybe_down (flag_fp_int_builtin_inexact)
 429                       /* Strictly speaking only when the callee contains function
 430                          calls that may end up setting errno.  */
 431                       || check_maybe_up (flag_errno_math)))
 432               /* We do not want to make code compiled with exceptions to be
 433                  brought into a non-EH function unless we know that the callee
 434                  does not throw.
 435                  This is tracked by DECL_FUNCTION_PERSONALITY.  */
 436               || (check_maybe_up (flag_non_call_exceptions)
 437                   && DECL_FUNCTION_PERSONALITY (callee->decl))
 438               || (check_maybe_up (flag_exceptions)
 439                   && DECL_FUNCTION_PERSONALITY (callee->decl))
 440               /* When devirtualization is disabled for callee, it is not safe
 441                  to inline it as we possibly mangled the type info.
 442                  Allow early inlining of always inlines.  */
 443               || (!early && check_maybe_down (flag_devirtualize)))
 444         {
 445           e->inline_failed = CIF_OPTIMIZATION_MISMATCH;
 446           inlinable = false;
 447         }
 448       /* gcc.dg/pr43564.c.  Apply user-forced inline even at -O0.  */
 449       else if (always_inline)
 450         ;
 451       /* When user added an attribute to the callee honor it.  */
 452       else if (lookup_attribute ("optimize", DECL_ATTRIBUTES (callee->decl))
 453                && opts_for_fn (caller->decl) != opts_for_fn (callee->decl))
 454         {
 455           e->inline_failed = CIF_OPTIMIZATION_MISMATCH;
 456           inlinable = false;
 457         }
 458       /* If explicit optimize attributes are not used, the mismatch is caused
 459          by different command line options used to build different units.
 460          Do not care about COMDAT functions - those are intended to be
 461          optimized with the optimization flags of module they are used in.
 462          Also do not care about mixing up size/speed optimization when
 463          DECL_DISREGARD_INLINE_LIMITS is set.  */
 464       else if ((callee->merged_comdat
 465                 && !lookup_attribute ("optimize",
 466                                       DECL_ATTRIBUTES (caller->decl)))
 467                || DECL_DISREGARD_INLINE_LIMITS (callee->decl))
 468         ;
 469       /* If mismatch is caused by merging two LTO units with different
 470          optimization flags we want to be a bit nicer.  However never inline
 471          if one of functions is not optimized at all.  */
 472       else if (!opt_for_fn (callee->decl, optimize)
 473                || !opt_for_fn (caller->decl, optimize))
 474         {
 475           e->inline_failed = CIF_OPTIMIZATION_MISMATCH;
 476           inlinable = false;
 477         }
 478       /* If callee is optimized for size and caller is not, allow inlining if
 479          code shrinks or we are in MAX_INLINE_INSNS_SINGLE limit and callee
 480          is inline (and thus likely a unified comdat).  This will allow caller
 481          to run faster.  */
 482       else if (opt_for_fn (callee->decl, optimize_size)
 483                > opt_for_fn (caller->decl, optimize_size))
 484         {
 485           int growth = estimate_edge_growth (e);
 486           if (growth > 0
 487               && (!DECL_DECLARED_INLINE_P (callee->decl)
 488                   && growth >= MAX (MAX_INLINE_INSNS_SINGLE,
 489                                     MAX_INLINE_INSNS_AUTO)))
 490             {
 491               e->inline_failed = CIF_OPTIMIZATION_MISMATCH;
 492               inlinable = false;
 493             }
 494         }
 495       /* If callee is more aggressively optimized for performance than caller,
 496          we generally want to inline only cheap (runtime wise) functions.  */
 497       else if (opt_for_fn (callee->decl, optimize_size)
 498                < opt_for_fn (caller->decl, optimize_size)
 499                || (opt_for_fn (callee->decl, optimize)
 500                    > opt_for_fn (caller->decl, optimize)))
 501         {
 502           if (estimate_edge_time (e)
 503               >= 20 + inline_edge_summary (e)->call_stmt_time)
 504             {
 505               e->inline_failed = CIF_OPTIMIZATION_MISMATCH;
 506               inlinable = false;
 507             }
 508         }
 509
 510     }
 511
 512   if (!inlinable && report)
 513     report_inline_failed_reason (e);
 514   return inlinable;
 515 }
 516
 517
 518 /* Return true if the early inliner is able to inline edge E.  */
 519
 520 static bool
 521 can_early_inline_edge_p (struct cgraph_edge *e)
 522 {
 523   cgraph_node *target = e->callee->ultimate_alias_target ();
 524   /* An edge that already failed with a final error stays uninlinable.  */
 525   if (cgraph_inline_failed_type (e->inline_failed) == CIF_FINAL_ERROR)
 526     return false;
 527   /* The early inliner may run at WPA stage (when an IPA pass adds a new
 528      function); bodies are missing then and nothing can be inlined.  */
 529   if (!gimple_has_body_p (target->decl))
 530     {
 531       e->inline_failed = CIF_BODY_NOT_AVAILABLE;
 532       return false;
 533     }
 534   /* Caller and callee must both be in SSA form.  With a cyclic callgraph
 535      the callee may not be processed yet; no CIF code exists for this
 536      case and the real inliner re-does the decision later.  */
 537   if (!(gimple_in_ssa_p (DECL_STRUCT_FUNCTION (e->caller->decl))
 538         && gimple_in_ssa_p (DECL_STRUCT_FUNCTION (target->decl))))
 539     {
 540       if (dump_file)
 541         fprintf (dump_file, "  edge not inlinable: not in SSA form\n");
 542       return false;
 543     }
 544
 545   /* Finally apply the generic checks in early mode: report failures,
 546      do not disregard limits.  */
 547   return can_inline_edge_p (e, true, false, true);
 548 }
 549
 550
 551 /* Count the edges on N's callees list whose callee is not an
 552    inexpensive builtin.  */
 553 static int
 554 num_calls (struct cgraph_node *n)
 555 {
 556   int count = 0;
 557
 558   for (cgraph_edge *edge = n->callees; edge; edge = edge->next_callee)
 559     if (!is_inexpensive_builtin (edge->callee->decl))
 560       count++;
 561
 562   return count;
 563 }
 564
 565
 566 /* Return true if the early inliner wants to inline the callee of E.  */
 567
 568 static bool
 569 want_early_inline_function_p (struct cgraph_edge *e)
 570 {
 571   cgraph_node *target = e->callee->ultimate_alias_target ();
 572
 573   /* Callees that disregard inline limits are always wanted.  */
 574   if (DECL_DISREGARD_INLINE_LIMITS (target->decl))
 575     return true;
 576
 577   /* For AutoFDO, we need to make sure that before profile summary, all
 578      hot paths' IR look exactly the same as in the profiled binary.  As a
 579      result, in einliner, we disregard the size limit and inline those
 580      callsites that are:
 581        * inlined in the profiled binary, and
 582        * the cloned callee has enough samples to be considered "hot".  */
 583   if (flag_auto_profile && afdo_callsite_hot_enough_for_early_inline (e))
 584     return true;
 585
 586   /* A callee not declared inline is a candidate only when the caller
 587      is compiled with flag_inline_small_functions.  */
 588   if (!DECL_DECLARED_INLINE_P (target->decl)
 589       && !opt_for_fn (e->caller->decl, flag_inline_small_functions))
 590     {
 591       e->inline_failed = CIF_FUNCTION_NOT_INLINE_CANDIDATE;
 592       report_inline_failed_reason (e);
 593       return false;
 594     }
 595
 596   /* Inlining that does not grow the code is always wanted.  */
 597   const int growth = estimate_edge_growth (e);
 598   if (growth <= 0)
 599     return true;
 600
 601   /* From here on GROWTH is positive; each refusal is only dumped.  */
 602   if (!e->maybe_hot_p ())
 603     {
 604       if (dump_file)
 605         fprintf (dump_file, "  will not early inline: %s/%i->%s/%i, "
 606                  "call is cold and code would grow by %i\n",
 607                  xstrdup_for_dump (e->caller->name ()), e->caller->order,
 608                  xstrdup_for_dump (target->name ()), target->order, growth);
 609       return false;
 610     }
 611
 612   if (growth > PARAM_VALUE (PARAM_EARLY_INLINING_INSNS))
 613     {
 614       if (dump_file)
 615         fprintf (dump_file, "  will not early inline: %s/%i->%s/%i, "
 616                  "growth %i exceeds --param early-inlining-insns\n",
 617                  xstrdup_for_dump (e->caller->name ()), e->caller->order,
 618                  xstrdup_for_dump (target->name ()), target->order, growth);
 619       return false;
 620     }
 621
 622   /* With N calls in the callee, GROWTH * (N + 1) must fit the limit.  */
 623   const int calls = num_calls (target);
 624   if (calls != 0
 625       && growth * (calls + 1) > PARAM_VALUE (PARAM_EARLY_INLINING_INSNS))
 626     {
 627       if (dump_file)
 628         fprintf (dump_file, "  will not early inline: %s/%i->%s/%i, "
 629                  "growth %i exceeds --param early-inlining-insns "
 630                  "divided by number of calls\n",
 631                  xstrdup_for_dump (e->caller->name ()), e->caller->order,
 632                  xstrdup_for_dump (target->name ()), target->order, growth);
 633       return false;
 634     }
 635   return true;
 636 }
 637
 638 /* Compute time of the EDGE->caller + EDGE->callee execution when EDGE is
 639    not inlined, scaling UNINLINED_CALL_TIME by EDGE's execution rate.  */
 640
 641 inline sreal
 642 compute_uninlined_call_time (struct cgraph_edge *edge,
 643                              sreal uninlined_call_time)
 644 {
 645   cgraph_node *caller = edge->caller;
 646   if (caller->global.inlined_to)
 647     caller = caller->global.inlined_to;
 648
 649   /* Scale by the count ratio when both counts are nonzero, then by
 650      EDGE's frequency (or shift right by 11 when the frequency is 0).  */
 651   if (edge->count && caller->count)
 652     uninlined_call_time *= (sreal)edge->count / caller->count;
 653   if (!edge->frequency)
 654     uninlined_call_time = uninlined_call_time >> 11;
 655   else
 656     uninlined_call_time *= cgraph_freq_base_rec * edge->frequency;
 657   sreal caller_time = inline_summaries->get (caller)->time;
 658   return uninlined_call_time + caller_time;
 659 }
 659
 660 /* Same as compute_uninlined_call_time but compute the time when EDGE
 661    is inlined.  TIME is the edge time estimate supplied by the caller.  */
 662
 663 inline sreal
 664 compute_inlined_call_time (struct cgraph_edge *edge,
 665                            sreal time)
 666 {
 667   cgraph_node *caller = edge->caller;
 668   if (caller->global.inlined_to)
 669     caller = caller->global.inlined_to;
 670   sreal caller_time = inline_summaries->get (caller)->time;
 671
 672   if (edge->count && caller->count)
 673     time *= (sreal)edge->count / caller->count;
 674   if (!edge->frequency)
 675     time = time >> 11;
 676   else
 677     time *= cgraph_freq_base_rec * edge->frequency;
 678   /* Subtract the call statement time; this calculation should match
 679      one in ipa-inline-analysis.c (estimate_edge_size_and_time).  */
 680   time -= ((sreal) edge->frequency
 681            * inline_edge_summary (edge)->call_stmt_time / CGRAPH_FREQ_BASE);
 682   time += caller_time;
 683   /* Never return a non-positive time; use (sreal) 1 >> 8 instead.  */
 684   if (time <= 0)
 685     time = ((sreal) 1) >> 8;
 686   gcc_checking_assert (time >= 0);
 687   return time;
 688 }
 689
 690 /* Return true if the speedup for inlining E is bigger than
 691    PARAM_INLINE_MIN_SPEEDUP percent of the uninlined time.  */
 692
 693 static bool
 694 big_speedup_p (struct cgraph_edge *e)
 695 {
 696   sreal unspec_time;
 697   sreal spec_time = estimate_edge_time (e, &unspec_time);
 698   sreal uninlined = compute_uninlined_call_time (e, unspec_time);
 699   sreal inlined = compute_inlined_call_time (e, spec_time);
 700
 701   /* Minimal saving: PARAM_INLINE_MIN_SPEEDUP percent of UNINLINED.  */
 702   sreal threshold
 703     = (sreal) (uninlined * PARAM_VALUE (PARAM_INLINE_MIN_SPEEDUP))
 704       * percent_rec;
 705   return uninlined - inlined > threshold;
 706 }
 707
 708 /* Return true if inlining the small function called by E is wanted.  If not,
 709    store the reason in E->inline_failed and report it when REPORT is true.  */
 710
 711 static bool
 712 want_inline_small_function_p (struct cgraph_edge *e, bool report)
 713 {
 714   bool want_inline = true;
 715   struct cgraph_node *callee = e->callee->ultimate_alias_target ();
 716
 717   if (DECL_DISREGARD_INLINE_LIMITS (callee->decl))
 718     ;
 719   else if (!DECL_DECLARED_INLINE_P (callee->decl)
 720            && !opt_for_fn (e->caller->decl, flag_inline_small_functions))
 721     {
 722       e->inline_failed = CIF_FUNCTION_NOT_INLINE_CANDIDATE;
 723       want_inline = false;
 724     }
 725   /* Do a fast and conservative check whether the function can be a good
 726      inline candidate.  At the moment we allow inline hints to
 727      promote non-inline functions to inline and we increase
 728      MAX_INLINE_INSNS_SINGLE 16-fold for inline functions.  */
 729   else if ((!DECL_DECLARED_INLINE_P (callee->decl)
 730            && (!e->count || !e->maybe_hot_p ()))
 731            && inline_summaries->get (callee)->min_size
 732                 - inline_edge_summary (e)->call_stmt_size
 733               > MAX (MAX_INLINE_INSNS_SINGLE, MAX_INLINE_INSNS_AUTO))
 734     {
 735       e->inline_failed = CIF_MAX_INLINE_INSNS_AUTO_LIMIT;
 736       want_inline = false;
 737     }
 738   else if ((DECL_DECLARED_INLINE_P (callee->decl) || e->count)
 739            && inline_summaries->get (callee)->min_size
 740                 - inline_edge_summary (e)->call_stmt_size
 741               > 16 * MAX_INLINE_INSNS_SINGLE)
 742     {
 743       e->inline_failed = (DECL_DECLARED_INLINE_P (callee->decl)
 744                           ? CIF_MAX_INLINE_INSNS_SINGLE_LIMIT
 745                           : CIF_MAX_INLINE_INSNS_AUTO_LIMIT);
 746       want_inline = false;
 747     }
 748   else
 749     {
 750       int growth = estimate_edge_growth (e);
 751       inline_hints hints = estimate_edge_hints (e);
 752       bool big_speedup = big_speedup_p (e);
 753
 754       if (growth <= 0)
 755         ;
 756       /* Apply MAX_INLINE_INSNS_SINGLE limit.  Big speedup or hints lift it,
 757          but never beyond 16 times MAX_INLINE_INSNS_SINGLE.  */
 758       else if (DECL_DECLARED_INLINE_P (callee->decl)
 759                && growth >= MAX_INLINE_INSNS_SINGLE
 760                && ((!big_speedup
 761                     && !(hints & (INLINE_HINT_indirect_call
 762                                   | INLINE_HINT_known_hot
 763                                   | INLINE_HINT_loop_iterations
 764                                   | INLINE_HINT_array_index
 765                                   | INLINE_HINT_loop_stride)))
 766                    || growth >= MAX_INLINE_INSNS_SINGLE * 16))
 767         {
 768           e->inline_failed = CIF_MAX_INLINE_INSNS_SINGLE_LIMIT;
 769           want_inline = false;
 770         }
 771       else if (!DECL_DECLARED_INLINE_P (callee->decl)
 772                && !opt_for_fn (e->caller->decl, flag_inline_functions))
 773         {
 774           /* growth_likely_positive is expensive, always test it last.  */
 775           if (growth >= MAX_INLINE_INSNS_SINGLE
 776               || growth_likely_positive (callee, growth))
 777             {
 778               e->inline_failed = CIF_NOT_DECLARED_INLINED;
 779               want_inline = false;
 780             }
 781         }
 782       /* Apply MAX_INLINE_INSNS_AUTO limit for functions not declared inline.
 783          Use the larger of it and MAX_INLINE_INSNS_SINGLE when hints suggest
 784          that inlining given function is very profitable.  */
 785       else if (!DECL_DECLARED_INLINE_P (callee->decl)
 786                && !big_speedup
 787                && !(hints & INLINE_HINT_known_hot)
 788                && growth >= ((hints & (INLINE_HINT_indirect_call
 789                                        | INLINE_HINT_loop_iterations
 790                                        | INLINE_HINT_array_index
 791                                        | INLINE_HINT_loop_stride))
 792                              ? MAX (MAX_INLINE_INSNS_AUTO,
 793                                     MAX_INLINE_INSNS_SINGLE)
 794                              : MAX_INLINE_INSNS_AUTO))
 795         {
 796           /* growth_likely_positive is expensive, always test it last.  */
 797           if (growth >= MAX_INLINE_INSNS_SINGLE
 798               || growth_likely_positive (callee, growth))
 799             {
 800               e->inline_failed = CIF_MAX_INLINE_INSNS_AUTO_LIMIT;
 801               want_inline = false;
 802             }
 803         }
 804       /* If call is cold, do not inline when function body would grow.  */
 805       else if (!e->maybe_hot_p ()
 806                && (growth >= MAX_INLINE_INSNS_SINGLE
 807                    || growth_likely_positive (callee, growth)))
 808         {
 809           e->inline_failed = CIF_UNLIKELY_CALL;
 810           want_inline = false;
 811         }
 812     }
 813   if (!want_inline && report)
 814     report_inline_failed_reason (e);
 815   return want_inline;
 816 }
 817
 818 /* EDGE is a self recursive edge.
 819    Two cases are handled: function A being inlined into itself, and
 820    function A being inlined into another inline copy of function A that
 821    sits within function B.
 822
 823    In the first case OUTER_NODE points to the toplevel copy of A, in the
 824    second case to the outermost copy of A in B.  PEELING selects the
 825    heuristic meant for the second case, and DEPTH is what gets checked
 826    against the --param max-inline-recursive-depth limit.
 827
 828    In both cases we want to be extra selective, since inlining the call
 829    merely makes new recursive calls appear.
 830
 831    Return true if the call should be inlined.  Otherwise return false
 832    and, if a dump file is open, print the reason to it.  */
 833
 834 static bool
 835 want_inline_self_recursive_call_p (struct cgraph_edge *edge,
 836                                    struct cgraph_node *outer_node,
 837                                    bool peeling,
 838                                    int depth)
 839 {
 840   /* REASON doubles as the verdict: while it is NULL, inlining is still
 841      wanted.  */
 842   char const *reason = NULL;
 843   int caller_freq = CGRAPH_FREQ_BASE;
 844   /* Callers declared inline have a depth limit of their own.  */
 845   int max_depth
 846     = (DECL_DECLARED_INLINE_P (edge->caller->decl)
 847        ? PARAM_VALUE (PARAM_MAX_INLINE_RECURSIVE_DEPTH)
 848        : PARAM_VALUE (PARAM_MAX_INLINE_RECURSIVE_DEPTH_AUTO));
 849
 850   /* Cheap rejections first.  */
 851   if (!edge->maybe_hot_p ())
 852     reason = "recursive call is cold";
 853   else if (max_count && !outer_node->count)
 854     reason = "not executed in profile";
 855   else if (depth > max_depth)
 856     reason = "--param max-inline-recursive-depth exceeded.";
 857
 858   /* If OUTER_NODE is an inline copy itself, use the frequency of the
 859      edge leading to it.  */
 860   if (outer_node->global.inlined_to)
 861     caller_freq = outer_node->callers->frequency;
 862
 863   /* A zero frequency replaces any reason found above.  It would also be
 864      the divisor in the computations below.  */
 865   if (!caller_freq)
 866     reason = "function is inlined and unlikely";
 867
 868   if (reason)
 869     ;
 870   /* Inlining a self recursive function into a copy of itself within
 871      another function is a transformation similar to loop peeling.
 872
 873      Peeling is profitable if we can inline enough copies to make the
 874      probability of an actual call to the self recursive function very
 875      small.  Be sure that the probability of recursion is small.
 876
 877      We ensure that the frequency of recursing is at most
 878      1 - (1/max_depth).  This way the expected number of recursions is
 879      at most max_depth.  */
 880   else if (peeling)
 881     {
 882       int max_prob = CGRAPH_FREQ_BASE - ((CGRAPH_FREQ_BASE + max_depth - 1)
 883                                          / max_depth);
 884
 885       /* Square the bound once for each level of depth beyond the first.  */
 886       for (int level = 1; level < depth; level++)
 887         max_prob = max_prob * max_prob / CGRAPH_FREQ_BASE;
 888
 889       /* Compare against execution counts if MAX_COUNT is set, and
 890          against the edge frequencies otherwise.  */
 891       if (max_count)
 892         {
 893           if (edge->count * CGRAPH_FREQ_BASE / outer_node->count
 894               >= max_prob)
 895             reason = "profile of recursive call is too large";
 896         }
 897       else if (edge->frequency * CGRAPH_FREQ_BASE / caller_freq
 898                >= max_prob)
 899         reason = "frequency of recursive call is too large";
 900     }
 901   /* Recursive inlining, i.e. the equivalent of unrolling, is profitable
 902      if the recursion depth is large.  It reduces function call overhead
 903      and increases the chances that things fit in the hardware return
 904      predictor.
 905
 906      Recursive inlining might however increase the cost of stack frame
 907      setup, actually slowing down functions whose recursion tree is wide
 908      rather than deep.
 909
 910      Deciding reliably on when to do recursive inlining without profile
 911      feedback is tricky.  For now we disable recursive inlining when the
 912      probability of self recursion is low.
 913
 914      Recursive inlining of a self recursive call within a loop also
 915      results in large loop depths that generally optimize badly.  We may
 916      want to throttle down inlining in those cases.  In particular this
 917      seems to happen in one of the libstdc++ rb tree methods.  */
 918   else
 919     {
 920       /* Again counts are used if MAX_COUNT is set and frequencies
 921          otherwise.  */
 922       if (max_count)
 923         {
 924           if (edge->count * 100 / outer_node->count
 925               <= PARAM_VALUE (PARAM_MIN_INLINE_RECURSIVE_PROBABILITY))
 926             reason = "profile of recursive call is too small";
 927         }
 928       else if (edge->frequency * 100 / caller_freq
 929                <= PARAM_VALUE (PARAM_MIN_INLINE_RECURSIVE_PROBABILITY))
 930         reason = "frequency of recursive call is too small";
 931     }
 932
 933   /* Explain a refusal in the dump file.  */
 934   if (reason && dump_file)
 935     fprintf (dump_file, "   not inlining recursively: %s\n", reason);
 936   return reason == NULL;
 937 }
 938
 939 /* Worker for call_for_symbol_and_aliases.  Return true as soon as a caller
 940    of NODE turns out not to be inlinable; return false if none does.
 941    HAS_HOT_CALL points to a bool that is set when a hot call is seen.  */
 942
 943 static bool
 944 check_callers (struct cgraph_node *node, void *has_hot_call)
 945 {
 946   bool *hot_seen = (bool *) has_hot_call;
 947
 948   for (struct cgraph_edge *cs = node->callers; cs; cs = cs->next_caller)
 949     {
 950       /* Each of these conditions rules the caller out.  */
 951       if (!opt_for_fn (cs->caller->decl, flag_inline_functions_called_once)
 952           || !can_inline_edge_p (cs, true)
 953           || cs->recursive_p ())
 954         return true;
 955       if (!*hot_seen && cs->maybe_hot_p ())
 956         *hot_seen = true;
 957     }
 958   return false;
 959 }
 960
 961 /* Return true if NODE has at least one caller.  DATA is unused.  */
 962
 963 static bool
 964 has_caller_p (struct cgraph_node *node, void *data ATTRIBUTE_UNUSED)
 965 {
 966   /* Any entry in the caller list is enough; the callers themselves are
 967      not examined.  */
 968   return node->callers != NULL;
 969 }
 970
 971 /* Return true if NODE should be inlined into all of its callers so that
 972    the offline copy of the function can go away without growing the unit.
 973    Unless COLD is true, at least one of the calls has to be hot.  */
 974
 975 static bool
 976 want_inline_function_to_all_callers_p (struct cgraph_node *node, bool cold)
 977 {
 978   bool hot_call_seen = false;
 979
 980   /* Aliases get inlined along with the function they alias, and a body
 981      that was already inlined needs no further decision.  */
 982   if (node->alias || node->global.inlined_to)
 983     return false;
 984
 985   /* There is nothing to gain without callers, or when inlining into all
 986      of them is estimated to increase size.  */
 987   if (!node->call_for_symbol_and_aliases (has_caller_p, NULL, true)
 988       || estimate_growth (node) > 0)
 989     return false;
 990
 991   /* All inlines must be possible.  The walk over the callers also
 992      records whether any of the calls is hot.  */
 993   bool blocked
 994     = node->call_for_symbol_and_aliases (check_callers, &hot_call_seen, true);
 995   if (blocked)
 996     return false;
 997
 998   return cold || hot_call_seen;
 999 }
1000
1001 /* Return the badness of inlining EDGE.  This cost model drives the inlining
1002    heuristics so that the edges with smallest badness are inlined first.
1003    After each inlining the costs of all caller edges of affected nodes are
1004    recomputed, so the metrics may depend on values such as the number of
1005    inlinable callers or the body size.  DUMP enables output to dump_file.  */
1006
1007 static sreal
1008 edge_badness (struct cgraph_edge *edge, bool dump)
1009 {
1010   sreal badness;
1011   int growth;
1012   sreal edge_time, unspec_edge_time;
1013   struct cgraph_node *callee = edge->callee->ultimate_alias_target ();
1014   struct inline_summary *callee_info = inline_summaries->get (callee);
1015   inline_hints hints;
1016   cgraph_node *caller = (edge->caller->global.inlined_to
1017                          ? edge->caller->global.inlined_to
1018                          : edge->caller);
1019
1020   growth = estimate_edge_growth (edge);
1021   edge_time = estimate_edge_time (edge, &unspec_edge_time);
1022   hints = estimate_edge_hints (edge);
1023   gcc_checking_assert (edge_time >= 0);
1024   /* Check that inlined time is better, but tolerate some roundoff issues.  */
1025   gcc_checking_assert ((edge_time - callee_info->time).to_int () <= 0);
1026   gcc_checking_assert (growth <= callee_info->size);
1027
1028   if (dump)
1029     {
1030       fprintf (dump_file, "    Badness calculation for %s/%i -> %s/%i\n",
1031                xstrdup_for_dump (edge->caller->name ()),
1032                edge->caller->order,
1033                xstrdup_for_dump (callee->name ()),
1034                edge->callee->order);
1035       fprintf (dump_file, "      size growth %i, time %f unspec %f ",
1036                growth,
1037                edge_time.to_double (),
1038                unspec_edge_time.to_double ());
1039       dump_inline_hints (dump_file, hints);
1040       if (big_speedup_p (edge))
1041         fprintf (dump_file, " big_speedup");
1042       fprintf (dump_file, "\n");
1043     }
1044
1045   /* Always prefer inlining saving code size.  */
1046   if (growth <= 0)
1047     {
1048       badness = (sreal) (-SREAL_MIN_SIG + growth) << (SREAL_MAX_EXP / 256);
1049       if (dump)
1050         fprintf (dump_file, "      %f: Growth %d <= 0\n", badness.to_double (),
1051                  growth);
1052     }
1053    /* Inlining into EXTERNAL functions is not going to change anything unless
1054       they are themselves inlined.  */
1055    else if (DECL_EXTERNAL (caller->decl))
1056     {
1057       if (dump)
1058         fprintf (dump_file, "      max: function is external\n");
1059       return sreal::max ();
1060     }
1061   /* When a profile (read or guessed) is available, compute badness as:
1062
1063                  time_saved * caller_count
1064      goodness =  -------------------------------------------------
1065                  growth_of_caller * overall_growth * combined_size
1066
1067      badness = - goodness
1068
1069      Again use negative value to make calls with profile appear hotter
1070      than calls without.
1071   */
1072   else if (opt_for_fn (caller->decl, flag_guess_branch_prob) || caller->count)
1073     {
1074       sreal numerator, denominator;
1075       int overall_growth;
1076
1077       numerator = (compute_uninlined_call_time (edge, unspec_edge_time)
1078                    - compute_inlined_call_time (edge, edge_time));
1079       if (numerator == 0)
1080         numerator = ((sreal) 1 >> 8);
1081       if (caller->count)
1082         numerator *= caller->count;
1083       else if (opt_for_fn (caller->decl, flag_branch_probabilities))
1084         numerator = numerator >> 11;
1085       denominator = growth;
1086
1087       overall_growth = callee_info->growth;
1088
1089       /* Look for inliner wrappers of the form:
1090
1091          inline_caller ()
1092            {
1093              do_fast_job...
1094              if (need_more_work)
1095                noninline_callee ();
1096            }
1097          Without penalizing this case, we usually inline noninline_callee
1098          into the inline_caller because overall_growth is small preventing
1099          further inlining of inline_caller.
1100
1101          Penalize only callgraph edges to functions with small overall
1102          growth ...
1103         */
1104       if (growth > overall_growth
1105           /* ... and having only one caller which is not inlined ... */
1106           && callee_info->single_caller
1107           && !edge->caller->global.inlined_to
1108           /* ... and edges executed only conditionally ... */
1109           && edge->frequency < CGRAPH_FREQ_BASE
1110           /* ... consider case where callee is not inline but caller is ... */
1111           && ((!DECL_DECLARED_INLINE_P (edge->callee->decl)
1112                && DECL_DECLARED_INLINE_P (caller->decl))
1113               /* ... or when early optimizers decided to split and edge
1114                  frequency still indicates splitting is a win ... */
1115               || (callee->split_part && !caller->split_part
1116                   && edge->frequency
1117                      < CGRAPH_FREQ_BASE
1118                        * PARAM_VALUE
1119                           (PARAM_PARTIAL_INLINING_ENTRY_PROBABILITY) / 100
1120                   /* ... and do not overwrite user specified hints.   */
1121                   && (!DECL_DECLARED_INLINE_P (edge->callee->decl)
1122                       || DECL_DECLARED_INLINE_P (caller->decl)))))
1123         {
1124           struct inline_summary *caller_info = inline_summaries->get (caller);
1125           int caller_growth = caller_info->growth;
1126
1127           /* Only apply the penalty when the caller looks like an inline
1128              candidate and is not called just once.  */
1129           if (!caller_info->single_caller && overall_growth < caller_growth
1130               && caller_info->inlinable
1131               && caller_info->size
1132                  < (DECL_DECLARED_INLINE_P (caller->decl)
1133                     ? MAX_INLINE_INSNS_SINGLE : MAX_INLINE_INSNS_AUTO))
1134             {
1135               if (dump)
1136                 fprintf (dump_file,
1137                          "     Wrapper penalty. Increasing growth %i to %i\n",
1138                          overall_growth, caller_growth);
1139               overall_growth = caller_growth;
1140             }
1141         }
1142       if (overall_growth > 0)
1143         {
1144           /* Strongly prefer functions with few callers that can be inlined
1145              fully.  The square root here leads to smaller binaries on average.
1146              Watch however for extreme cases and return to linear function
1147              when growth is large.  */
1148           if (overall_growth < 256)
1149             overall_growth *= overall_growth;
1150           else
1151             overall_growth += 256 * 256 - 256;
1152           denominator *= overall_growth;
1153         }
1154       denominator *= inline_summaries->get (caller)->self_size + growth;
1155
1156       badness = - numerator / denominator;
1157
1158       if (dump)
1159         {
1160           fprintf (dump_file,
1161                    "      %f: guessed profile. frequency %f, count %" PRId64
1162                    " caller count %" PRId64
1163                    " time w/o inlining %f, time with inlining %f"
1164                    " overall growth %i (current) %i (original)"
1165                    " %i (compensated)\n",
1166                    badness.to_double (),
1167                   (double)edge->frequency / CGRAPH_FREQ_BASE,
1168                    edge->count, caller->count,
1169                    compute_uninlined_call_time (edge,
1170                                                 unspec_edge_time).to_double (),
1171                    compute_inlined_call_time (edge, edge_time).to_double (),
1172                    estimate_growth (callee),
1173                    callee_info->growth, overall_growth);
1174         }
1175     }
1176   /* When function local profile is not available or it does not give
1177      useful information (i.e. frequency is zero), base the cost on
1178      loop nest and overall size growth, so we optimize for overall number
1179      of functions fully inlined in program.  */
1180   else
1181     {
1182       int nest = MIN (inline_edge_summary (edge)->loop_depth, 8);
1183       badness = growth;
1184
1185       /* Decrease badness if call is nested.  */
1186       if (badness > 0)
1187         badness = badness >> nest;
1188       else
1189         badness = badness << nest;
1190       if (dump)
1191         fprintf (dump_file, "      %f: no profile. nest %i\n",
1192                  badness.to_double (), nest);
1193     }
1194   gcc_checking_assert (badness != 0);
1195
1196   if (edge->recursive_p ())
1197     badness = badness.shift (badness > 0 ? 4 : -4);
1198   if ((hints & (INLINE_HINT_indirect_call
1199                 | INLINE_HINT_loop_iterations
1200                 | INLINE_HINT_array_index
1201                 | INLINE_HINT_loop_stride))
1202       || callee_info->growth <= 0)
1203     badness = badness.shift (badness > 0 ? -2 : 2);
1204   if (hints & (INLINE_HINT_same_scc))
1205     badness = badness.shift (badness > 0 ? 3 : -3);
1206   else if (hints & (INLINE_HINT_in_scc))
1207     badness = badness.shift (badness > 0 ? 2 : -2);
1208   else if (hints & (INLINE_HINT_cross_module))
1209     badness = badness.shift (badness > 0 ? 1 : -1);
1210   if (DECL_DISREGARD_INLINE_LIMITS (callee->decl))
1211     badness = badness.shift (badness > 0 ? -4 : 4);
1212   else if ((hints & INLINE_HINT_declared_inline))
1213     badness = badness.shift (badness > 0 ? -3 : 3);
1214   if (dump)
1215     fprintf (dump_file, "      Adjusted by hints %f\n", badness.to_double ());
1216   return badness;
1217 }
1218
1219 /* Recompute the badness of EDGE and record it in HEAP.  An edge that is
1220    not queued yet is inserted; one that is queued only ever has its key
1221    lowered here.  */
1222 static inline void
1223 update_edge_key (edge_heap_t *heap, struct cgraph_edge *edge)
1224 {
1225   sreal new_key = edge_badness (edge, false);
1226   const bool details = dump_file && (dump_flags & TDF_DETAILS);
1227
1228   if (!edge->aux)
1229     {
1230       /* EDGE is not in the heap yet; AUX remembers its heap node.  */
1231       if (details)
1232         fprintf (dump_file,
1233                  "  enqueuing call %s/%i -> %s/%i, badness %f\n",
1234                  xstrdup_for_dump (edge->caller->name ()),
1235                  edge->caller->order,
1236                  xstrdup_for_dump (edge->callee->name ()),
1237                  edge->callee->order,
1238                  new_key.to_double ());
1239       edge->aux = heap->insert (new_key, edge);
1240       return;
1241     }
1242
1243   edge_heap_node_t *queued = (edge_heap_node_t *) edge->aux;
1244   gcc_checking_assert (queued->get_data () == edge);
1245
1246   /* Key increases are applied lazily, because
1247      fibonacci_heap::replace_key does busy updating of the heap that is
1248      unnecessarily expensive: when the key of an extracted minimum turns
1249      out to be out of date, the edge is re-inserted with the correct
1250      value.  Only decreases are therefore propagated here.  */
1251   if (!(new_key < queued->get_key ()))
1252     return;
1253
1254   if (details)
1255     fprintf (dump_file,
1256              "  decreasing badness %s/%i -> %s/%i, %f"
1257              " to %f\n",
1258              xstrdup_for_dump (edge->caller->name ()),
1259              edge->caller->order,
1260              xstrdup_for_dump (edge->callee->name ()),
1261              edge->callee->order,
1262              queued->get_key ().to_double (),
1263              new_key.to_double ());
1264   heap->decrease_key (queued, new_key);
1265 }
1266
1267
1268 /* NODE was inlined, which makes cached growth estimates around it stale.
1269    The caches of not yet inlined calls to the function NODE was inlined
1270    into (or to NODE itself) are reset because size estimates changed; those
1271    of not yet inlined calls below NODE because better context may be known.  */
1272
1273 static void
1274 reset_edge_caches (struct cgraph_node *node)
1275 {
1276   struct cgraph_edge *walk = node->callees;
1277   struct cgraph_node *outer = node;
1278   struct cgraph_edge *cs;
1279   struct ipa_ref *ref;
1280
1281   if (outer->global.inlined_to)
1282     outer = outer->global.inlined_to;
1283
1284   for (cs = outer->callers; cs; cs = cs->next_caller)
1285     if (cs->inline_failed)
1286       reset_edge_growth_cache (cs);
1287
1288   /* Repeat the whole reset for every alias of that function.  */
1289   FOR_EACH_ALIAS (outer, ref)
1290     reset_edge_caches (dyn_cast <cgraph_node *> (ref->referring));
1291
1292   /* Visit the edges below NODE iteratively: descend through edges that
1293      were inlined, otherwise handle the edge and move on to its sibling,
1294      climbing back towards NODE whenever a callee list is exhausted.  */
1295   while (walk)
1296     {
1297       if (!walk->inline_failed && walk->callee->callees)
1298         {
1299           walk = walk->callee->callees;
1300           continue;
1301         }
1302       if (walk->inline_failed)
1303         reset_edge_growth_cache (walk);
1304
1305       /* Climb until an edge with a sibling is found.  Running out of
1306          siblings directly in NODE ends the walk.  */
1307       while (!walk->next_callee)
1308         {
1309           if (walk->caller == node)
1310             return;
1311           walk = walk->caller->callers;
1312         }
1313       walk = walk->next_callee;
1314     }
1315 }
1316
1317 /* Refresh the HEAP entries of the not yet inlined calls to NODE and to its
1318    aliases.  UPDATED_NODES records the nodes handled so far, so that each is
1319    processed only once.  If CHECK_INLINABLITY_FOR is non-NULL, only that
1320    edge is re-tested for inlinability; otherwise every edge is.  */
1321
1322 static void
1323 update_caller_keys (edge_heap_t *heap, struct cgraph_node *node,
1324                     bitmap updated_nodes,
1325                     struct cgraph_edge *check_inlinablity_for)
1326 {
1327   struct ipa_ref *ref;
1328
1329   if (!node->alias && !inline_summaries->get (node)->inlinable)
1330     return;
1331   if (node->global.inlined_to)
1332     return;
1333   if (!bitmap_set_bit (updated_nodes, node->uid))
1334     return;
1335
1336   FOR_EACH_ALIAS (node, ref)
1337     update_caller_keys (heap, dyn_cast <cgraph_node *> (ref->referring),
1338                         updated_nodes, check_inlinablity_for);
1339
1340   for (struct cgraph_edge *cs = node->callers; cs; cs = cs->next_caller)
1341     {
1342       if (!cs->inline_failed)
1343         continue;
1344       if (check_inlinablity_for && check_inlinablity_for != cs)
1345         {
1346           /* No re-test wanted for CS; only refresh a key already queued.  */
1347           if (cs->aux)
1348             update_edge_key (heap, cs);
1349         }
1350       else if (can_inline_edge_p (cs, false)
1351                && want_inline_small_function_p (cs, false))
1352         update_edge_key (heap, cs);
1353       else if (cs->aux)
1354         {
1355           /* CS is queued but no longer wanted; take it off the heap.  */
1356           report_inline_failed_reason (cs);
1357           heap->delete_node ((edge_heap_node_t *) cs->aux);
1358           cs->aux = NULL;
1359         }
1360     }
1361 }
1362
1363 /* Refresh HEAP for every not yet inlined call made from NODE or from the
1364    bodies inlined into it.  This is used when we know that edge badnesses
1365    can only have increased (a new call site was introduced), so all that is
1366    needed is to insert the newly created edges into the heap.  */
1367
1368 static void
1369 update_callee_keys (edge_heap_t *heap, struct cgraph_node *node,
1370                     bitmap updated_nodes)
1371 {
1372   struct cgraph_edge *walk = node->callees;
1373
1374   while (walk)
1375     {
1376       if (!walk->inline_failed && walk->callee->callees)
1377         {
1378           walk = walk->callee->callees;
1379           continue;
1380         }
1381
1382       /* The callee growth cache is not reset here: since a new call was
1383          added, growth could only have increased and consequently the
1384          badness metric does not need updating.  */
1385       if (walk->inline_failed)
1386         {
1387           enum availability avail;
1388           struct cgraph_node *callee
1389             = walk->callee->ultimate_alias_target (&avail, walk->caller);
1390
1391           if (callee
1392               && inline_summaries->get (callee)->inlinable
1393               && avail >= AVAIL_AVAILABLE
1394               && !bitmap_bit_p (updated_nodes, callee->uid))
1395             {
1396               if (can_inline_edge_p (walk, false)
1397                   && want_inline_small_function_p (walk, false))
1398                 update_edge_key (heap, walk);
1399               else if (walk->aux)
1400                 {
1401                   report_inline_failed_reason (walk);
1402                   heap->delete_node ((edge_heap_node_t *) walk->aux);
1403                   walk->aux = NULL;
1404                 }
1405             }
1406         }
1407       /* Advance to the next edge, climbing out of finished callee lists.  */
1408       while (!walk->next_callee)
1409         {
1410           if (walk->caller == node)
1411             return;
1412           walk = walk->caller->callers;
1413         }
1414       walk = walk->next_callee;
1415     }
1416 }
1417
1418 /* Insert into HEAP every call to NODE that is found in WHERE or in a body
1419    inlined into WHERE.  The key says how much we want to inline the call.  */
1420
1421 static void
1422 lookup_recursive_calls (struct cgraph_node *node, struct cgraph_node *where,
1423                         edge_heap_t *heap)
1424 {
1425   enum availability avail;
1426
1427   for (struct cgraph_edge *cs = where->callees; cs; cs = cs->next_callee)
1428     {
1429       /* Only calls reaching NODE directly or via a non-interposable alias.  */
1430       if (cs->callee != node
1431           && (cs->callee->ultimate_alias_target (&avail, cs->caller) != node
1432               || avail <= AVAIL_INTERPOSABLE))
1433         continue;
1434       /* Key: negated frequency, or negated scaled count with a profile.  */
1435       heap->insert (max_count
1436                     ? -(cs->count / ((max_count + (1<<24) - 1) / (1<<24)))
1437                     : -cs->frequency, cs);
1438     }
1439   for (struct cgraph_edge *cs = where->callees; cs; cs = cs->next_callee)
1440     if (!cs->inline_failed)
1441       lookup_recursive_calls (node, cs->callee, heap);
1442 }
1443
1444 /* Decide on recursive inlining: in the case function has recursive calls,
1445    inline until body size reaches given argument.  If any new indirect edges
1446    are discovered in the process, add them to *NEW_EDGES, unless NEW_EDGES
1447    is NULL.  */
1448
1449 static bool
1450 recursive_inlining (struct cgraph_edge *edge,
1451                     vec<cgraph_edge *> *new_edges)
1452 {
1453   int limit = PARAM_VALUE (PARAM_MAX_INLINE_INSNS_RECURSIVE_AUTO);
1454   edge_heap_t heap (sreal::min ());
1455   struct cgraph_node *node;
1456   struct cgraph_edge *e;
1457   struct cgraph_node *master_clone = NULL, *next;
1458   int depth = 0;
1459   int n = 0;
1460
1461   node = edge->caller;
1462   if (node->global.inlined_to)
1463     node = node->global.inlined_to;
1464
1465   if (DECL_DECLARED_INLINE_P (node->decl))
1466     limit = PARAM_VALUE (PARAM_MAX_INLINE_INSNS_RECURSIVE);
1467
1468   /* Make sure that function is small enough to be considered for inlining.  */
1469   if (estimate_size_after_inlining (node, edge)  >= limit)
1470     return false;
1471   lookup_recursive_calls (node, node, &heap);
1472   if (heap.empty ())
1473     return false;
1474
1475   if (dump_file)
1476     fprintf (dump_file,
1477              "  Performing recursive inlining on %s\n",
1478              node->name ());
1479
1480   /* Do the inlining and update list of recursive call during process.  */
1481   while (!heap.empty ())
1482     {
1483       struct cgraph_edge *curr = heap.extract_min ();
1484       struct cgraph_node *cnode, *dest = curr->callee;
1485
1486       if (!can_inline_edge_p (curr, true))
1487         continue;
1488
1489       /* MASTER_CLONE is produced in the case we already started modified
1490          the function. Be sure to redirect edge to the original body before
1491          estimating growths otherwise we will be seeing growths after inlining
1492          the already modified body.  */
1493       if (master_clone)
1494         {
1495           curr->redirect_callee (master_clone);
1496           reset_edge_growth_cache (curr);
1497         }
1498
1499       if (estimate_size_after_inlining (node, curr) > limit)
1500         {
1501           curr->redirect_callee (dest);
1502           reset_edge_growth_cache (curr);
1503           break;
1504         }
1505
1506       depth = 1;
1507       for (cnode = curr->caller;
1508            cnode->global.inlined_to; cnode = cnode->callers->caller)
1509         if (node->decl
1510             == curr->callee->ultimate_alias_target ()->decl)
1511           depth++;
1512
1513       if (!want_inline_self_recursive_call_p (curr, node, false, depth))
1514         {
1515           curr->redirect_callee (dest);
1516           reset_edge_growth_cache (curr);
1517           continue;
1518         }
1519
1520       if (dump_file)
1521         {
1522           fprintf (dump_file,
1523                    "   Inlining call of depth %i", depth);
1524           if (node->count)
1525             {
1526               fprintf (dump_file, " called approx. %.2f times per call",
1527                        (double)curr->count / node->count);
1528             }
1529           fprintf (dump_file, "\n");
1530         }
1531       if (!master_clone)
1532         {
1533           /* We need original clone to copy around.  */
1534           master_clone = node->create_clone (node->decl, node->count,
1535             CGRAPH_FREQ_BASE, false, vNULL,
1536             true, NULL, NULL);
1537           for (e = master_clone->callees; e; e = e->next_callee)
1538             if (!e->inline_failed)
1539               clone_inlined_nodes (e, true, false, NULL, CGRAPH_FREQ_BASE);
1540           curr->redirect_callee (master_clone);
1541           reset_edge_growth_cache (curr);
1542         }
1543
1544       inline_call (curr, false, new_edges, &overall_size, true);
1545       lookup_recursive_calls (node, curr->callee, &heap);
1546       n++;
1547     }
1548
1549   if (!heap.empty () && dump_file)
1550     fprintf (dump_file, "    Recursive inlining growth limit met.\n");
1551
1552   if (!master_clone)
1553     return false;
1554
1555   if (dump_file)
1556     fprintf (dump_file,
1557              "\n   Inlined %i times, "
1558              "body grown from size %i to %i, time %f to %f\n", n,
1559              inline_summaries->get (master_clone)->size,
1560              inline_summaries->get (node)->size,
1561              inline_summaries->get (master_clone)->time.to_double (),
1562              inline_summaries->get (node)->time.to_double ());
1563
1564   /* Remove master clone we used for inlining.  We rely that clones inlined
1565      into master clone gets queued just before master clone so we don't
1566      need recursion.  */
1567   for (node = symtab->first_function (); node != master_clone;
1568        node = next)
1569     {
1570       next = symtab->next_function (node);
1571       if (node->global.inlined_to == master_clone)
1572         node->remove ();
1573     }
1574   master_clone->remove ();
1575   return true;
1576 }
1577
1578
1579 /* Given whole compilation unit estimate of INSNS, compute how large we can
1580    allow the unit to grow.  */
1581
1582 static int
1583 compute_max_insns (int insns)
1584 {
1585   int max_insns = insns;
1586   if (max_insns < PARAM_VALUE (PARAM_LARGE_UNIT_INSNS))
1587     max_insns = PARAM_VALUE (PARAM_LARGE_UNIT_INSNS);
1588
1589   return ((int64_t) max_insns
1590           * (100 + PARAM_VALUE (PARAM_INLINE_UNIT_GROWTH)) / 100);
1591 }
1592
1593
1594 /* Compute badness of all edges in NEW_EDGES and add them to the HEAP.  */
1595
1596 static void
1597 add_new_edges_to_heap (edge_heap_t *heap, vec<cgraph_edge *> new_edges)
1598 {
1599   while (new_edges.length () > 0)
1600     {
1601       struct cgraph_edge *edge = new_edges.pop ();
1602
1603       gcc_assert (!edge->aux);
1604       if (edge->inline_failed
1605           && can_inline_edge_p (edge, true)
1606           && want_inline_small_function_p (edge, true))
1607         edge->aux = heap->insert (edge_badness (edge, false), edge);
1608     }
1609 }
1610
1611 /* Remove EDGE from the fibheap.  */
1612
1613 static void
1614 heap_edge_removal_hook (struct cgraph_edge *e, void *data)
1615 {
1616   if (e->aux)
1617     {
1618       ((edge_heap_t *)data)->delete_node ((edge_heap_node_t *)e->aux);
1619       e->aux = NULL;
1620     }
1621 }
1622
1623 /* Return true if speculation of edge E seems useful.
1624    If ANTICIPATE_INLINING is true, be conservative and hope that E
1625    may get inlined.  */
1626
1627 bool
1628 speculation_useful_p (struct cgraph_edge *e, bool anticipate_inlining)
1629 {
1630   enum availability avail;
1631   struct cgraph_node *target = e->callee->ultimate_alias_target (&avail,
1632                                                                  e->caller);
1633   struct cgraph_edge *direct, *indirect;
1634   struct ipa_ref *ref;
1635
1636   gcc_assert (e->speculative && !e->indirect_unknown_callee);
1637
1638   if (!e->maybe_hot_p ())
1639     return false;
1640
1641   /* See if IP optimizations found something potentially useful about the
1642      function.  For now we look only for CONST/PURE flags.  Almost everything
1643      else we propagate is useless.  */
1644   if (avail >= AVAIL_AVAILABLE)
1645     {
1646       int ecf_flags = flags_from_decl_or_type (target->decl);
1647       if (ecf_flags & ECF_CONST)
1648         {
1649           e->speculative_call_info (direct, indirect, ref);
1650           if (!(indirect->indirect_info->ecf_flags & ECF_CONST))
1651             return true;
1652         }
1653       else if (ecf_flags & ECF_PURE)
1654         {
1655           e->speculative_call_info (direct, indirect, ref);
1656           if (!(indirect->indirect_info->ecf_flags & ECF_PURE))
1657             return true;
1658         }
1659     }
1660   /* If we did not managed to inline the function nor redirect
1661      to an ipa-cp clone (that are seen by having local flag set),
1662      it is probably pointless to inline it unless hardware is missing
1663      indirect call predictor.  */
1664   if (!anticipate_inlining && e->inline_failed && !target->local.local)
1665     return false;
1666   /* For overwritable targets there is not much to do.  */
1667   if (e->inline_failed && !can_inline_edge_p (e, false, true))
1668     return false;
1669   /* OK, speculation seems interesting.  */
1670   return true;
1671 }
1672
1673 /* We know that EDGE is not going to be inlined.
1674    See if we can remove speculation.  */
1675
1676 static void
1677 resolve_noninline_speculation (edge_heap_t *edge_heap, struct cgraph_edge *edge)
1678 {
1679   if (edge->speculative && !speculation_useful_p (edge, false))
1680     {
1681       struct cgraph_node *node = edge->caller;
1682       struct cgraph_node *where = node->global.inlined_to
1683                                   ? node->global.inlined_to : node;
1684       bitmap updated_nodes = BITMAP_ALLOC (NULL);
1685
1686       spec_rem += edge->count;
1687       edge->resolve_speculation ();
1688       reset_edge_caches (where);
1689       inline_update_overall_summary (where);
1690       update_caller_keys (edge_heap, where,
1691                           updated_nodes, NULL);
1692       update_callee_keys (edge_heap, where,
1693                           updated_nodes);
1694       BITMAP_FREE (updated_nodes);
1695     }
1696 }
1697
1698 /* Return true if NODE should be accounted for overall size estimate.
1699    Skip all nodes optimized for size so we can measure the growth of hot
1700    part of program no matter of the padding.  */
1701
1702 bool
1703 inline_account_function_p (struct cgraph_node *node)
1704 {
1705    return (!DECL_EXTERNAL (node->decl)
1706            && !opt_for_fn (node->decl, optimize_size)
1707            && node->frequency != NODE_FREQUENCY_UNLIKELY_EXECUTED);
1708 }
1709
1710 /* Count number of callers of NODE and store it into DATA (that
1711    points to int.  Worker for cgraph_for_node_and_aliases.  */
1712
1713 static bool
1714 sum_callers (struct cgraph_node *node, void *data)
1715 {
1716   struct cgraph_edge *e;
1717   int *num_calls = (int *)data;
1718
1719   for (e = node->callers; e; e = e->next_caller)
1720     (*num_calls)++;
1721   return false;
1722 }
1723
1724 /* We use greedy algorithm for inlining of small functions:
1725    All inline candidates are put into prioritized heap ordered in
1726    increasing badness.
1727
1728    The inlining of small functions is bounded by unit growth parameters.  */
1729
1730 static void
1731 inline_small_functions (void)
1732 {
1733   struct cgraph_node *node;
1734   struct cgraph_edge *edge;
1735   edge_heap_t edge_heap (sreal::min ());
1736   bitmap updated_nodes = BITMAP_ALLOC (NULL);
1737   int min_size, max_size;
1738   auto_vec<cgraph_edge *> new_indirect_edges;
1739   int initial_size = 0;
1740   struct cgraph_node **order = XCNEWVEC (cgraph_node *, symtab->cgraph_count);
1741   struct cgraph_edge_hook_list *edge_removal_hook_holder;
1742   new_indirect_edges.create (8);
1743
1744   edge_removal_hook_holder
1745     = symtab->add_edge_removal_hook (&heap_edge_removal_hook, &edge_heap);
1746
1747   /* Compute overall unit size and other global parameters used by badness
1748      metrics.  */
1749
1750   max_count = 0;
1751   ipa_reduced_postorder (order, true, true, NULL);
1752   free (order);
1753
1754   FOR_EACH_DEFINED_FUNCTION (node)
1755     if (!node->global.inlined_to)
1756       {
1757         if (!node->alias && node->analyzed
1758             && (node->has_gimple_body_p () || node->thunk.thunk_p))
1759           {
1760             struct inline_summary *info = inline_summaries->get (node);
1761             struct ipa_dfs_info *dfs = (struct ipa_dfs_info *) node->aux;
1762
1763             /* Do not account external functions, they will be optimized out
1764                if not inlined.  Also only count the non-cold portion of program.  */
1765             if (inline_account_function_p (node))
1766               initial_size += info->size;
1767             info->growth = estimate_growth (node);
1768
1769             int num_calls = 0;
1770             node->call_for_symbol_and_aliases (sum_callers, &num_calls,
1771                                                true);
1772             if (num_calls == 1)
1773               info->single_caller = true;
1774             if (dfs && dfs->next_cycle)
1775               {
1776                 struct cgraph_node *n2;
1777                 int id = dfs->scc_no + 1;
1778                 for (n2 = node; n2;
1779                      n2 = ((struct ipa_dfs_info *) node->aux)->next_cycle)
1780                   {
1781                     struct inline_summary *info2 = inline_summaries->get (n2);
1782                     if (info2->scc_no)
1783                       break;
1784                     info2->scc_no = id;
1785                   }
1786               }
1787           }
1788
1789         for (edge = node->callers; edge; edge = edge->next_caller)
1790           if (max_count < edge->count)
1791             max_count = edge->count;
1792       }
1793   ipa_free_postorder_info ();
1794   initialize_growth_caches ();
1795
1796   if (dump_file)
1797     fprintf (dump_file,
1798              "\nDeciding on inlining of small functions.  Starting with size %i.\n",
1799              initial_size);
1800
1801   overall_size = initial_size;
1802   max_size = compute_max_insns (overall_size);
1803   min_size = overall_size;
1804
1805   /* Populate the heap with all edges we might inline.  */
1806
1807   FOR_EACH_DEFINED_FUNCTION (node)
1808     {
1809       bool update = false;
1810       struct cgraph_edge *next = NULL;
1811       bool has_speculative = false;
1812
1813       if (dump_file)
1814         fprintf (dump_file, "Enqueueing calls in %s/%i.\n",
1815                  node->name (), node->order);
1816
1817       for (edge = node->callees; edge; edge = next)
1818         {
1819           next = edge->next_callee;
1820           if (edge->inline_failed
1821               && !edge->aux
1822               && can_inline_edge_p (edge, true)
1823               && want_inline_small_function_p (edge, true)
1824               && edge->inline_failed)
1825             {
1826               gcc_assert (!edge->aux);
1827               update_edge_key (&edge_heap, edge);
1828             }
1829           if (edge->speculative)
1830             has_speculative = true;
1831         }
1832       if (has_speculative)
1833         for (edge = node->callees; edge; edge = next)
1834           if (edge->speculative && !speculation_useful_p (edge,
1835                                                           edge->aux != NULL))
1836             {
1837               edge->resolve_speculation ();
1838               update = true;
1839             }
1840       if (update)
1841         {
1842           struct cgraph_node *where = node->global.inlined_to
1843                                       ? node->global.inlined_to : node;
1844           inline_update_overall_summary (where);
1845           reset_edge_caches (where);
1846           update_caller_keys (&edge_heap, where,
1847                               updated_nodes, NULL);
1848           update_callee_keys (&edge_heap, where,
1849                               updated_nodes);
1850           bitmap_clear (updated_nodes);
1851         }
1852     }
1853
1854   gcc_assert (in_lto_p
1855               || !max_count
1856               || (profile_info && flag_branch_probabilities));
1857
1858   while (!edge_heap.empty ())
1859     {
1860       int old_size = overall_size;
1861       struct cgraph_node *where, *callee;
1862       sreal badness = edge_heap.min_key ();
1863       sreal current_badness;
1864       int growth;
1865
1866       edge = edge_heap.extract_min ();
1867       gcc_assert (edge->aux);
1868       edge->aux = NULL;
1869       if (!edge->inline_failed || !edge->callee->analyzed)
1870         continue;
1871
1872 #if CHECKING_P
1873       /* Be sure that caches are maintained consistent.  */
1874       sreal cached_badness = edge_badness (edge, false);
1875
1876       int old_size_est = estimate_edge_size (edge);
1877       sreal old_time_est = estimate_edge_time (edge);
1878       int old_hints_est = estimate_edge_hints (edge);
1879
1880       reset_edge_growth_cache (edge);
1881       gcc_assert (old_size_est == estimate_edge_size (edge));
1882       gcc_assert (old_time_est == estimate_edge_time (edge));
1883       /* FIXME:
1884
1885          gcc_assert (old_hints_est == estimate_edge_hints (edge));
1886
1887          fails with profile feedback because some hints depends on
1888          maybe_hot_edge_p predicate and because callee gets inlined to other
1889          calls, the edge may become cold.
1890          This ought to be fixed by computing relative probabilities
1891          for given invocation but that will be better done once whole
1892          code is converted to sreals.  Disable for now and revert to "wrong"
1893          value so enable/disable checking paths agree.  */
1894       edge_growth_cache[edge->uid].hints = old_hints_est + 1;
1895
1896       /* When updating the edge costs, we only decrease badness in the keys.
1897          Increases of badness are handled lazilly; when we see key with out
1898          of date value on it, we re-insert it now.  */
1899       current_badness = edge_badness (edge, false);
1900       /* Disable checking for profile because roundoff errors may cause slight
1901          deviations in the order.  */
1902       gcc_assert (max_count || cached_badness == current_badness);
1903       gcc_assert (current_badness >= badness);
1904 #else
1905       current_badness = edge_badness (edge, false);
1906 #endif
1907       if (current_badness != badness)
1908         {
1909           if (edge_heap.min () && current_badness > edge_heap.min_key ())
1910             {
1911               edge->aux = edge_heap.insert (current_badness, edge);
1912               continue;
1913             }
1914           else
1915             badness = current_badness;
1916         }
1917
1918       if (!can_inline_edge_p (edge, true))
1919         {
1920           resolve_noninline_speculation (&edge_heap, edge);
1921           continue;
1922         }
1923
1924       callee = edge->callee->ultimate_alias_target ();
1925       growth = estimate_edge_growth (edge);
1926       if (dump_file)
1927         {
1928           fprintf (dump_file,
1929                    "\nConsidering %s/%i with %i size\n",
1930                    callee->name (), callee->order,
1931                    inline_summaries->get (callee)->size);
1932           fprintf (dump_file,
1933                    " to be inlined into %s/%i in %s:%i\n"
1934                    " Estimated badness is %f, frequency %.2f.\n",
1935                    edge->caller->name (), edge->caller->order,
1936                    edge->call_stmt
1937                    && (LOCATION_LOCUS (gimple_location ((const gimple *)
1938                                                         edge->call_stmt))
1939                        > BUILTINS_LOCATION)
1940                    ? gimple_filename ((const gimple *) edge->call_stmt)
1941                    : "unknown",
1942                    edge->call_stmt
1943                    ? gimple_lineno ((const gimple *) edge->call_stmt)
1944                    : -1,
1945                    badness.to_double (),
1946                    edge->frequency / (double)CGRAPH_FREQ_BASE);
1947           if (edge->count)
1948             fprintf (dump_file," Called %" PRId64"x\n",
1949                      edge->count);
1950           if (dump_flags & TDF_DETAILS)
1951             edge_badness (edge, true);
1952         }
1953
1954       if (overall_size + growth > max_size
1955           && !DECL_DISREGARD_INLINE_LIMITS (callee->decl))
1956         {
1957           edge->inline_failed = CIF_INLINE_UNIT_GROWTH_LIMIT;
1958           report_inline_failed_reason (edge);
1959           resolve_noninline_speculation (&edge_heap, edge);
1960           continue;
1961         }
1962
1963       if (!want_inline_small_function_p (edge, true))
1964         {
1965           resolve_noninline_speculation (&edge_heap, edge);
1966           continue;
1967         }
1968
1969       /* Heuristics for inlining small functions work poorly for
1970          recursive calls where we do effects similar to loop unrolling.
1971          When inlining such edge seems profitable, leave decision on
1972          specific inliner.  */
1973       if (edge->recursive_p ())
1974         {
1975           where = edge->caller;
1976           if (where->global.inlined_to)
1977             where = where->global.inlined_to;
1978           if (!recursive_inlining (edge,
1979                                    opt_for_fn (edge->caller->decl,
1980                                                flag_indirect_inlining)
1981                                    ? &new_indirect_edges : NULL))
1982             {
1983               edge->inline_failed = CIF_RECURSIVE_INLINING;
1984               resolve_noninline_speculation (&edge_heap, edge);
1985               continue;
1986             }
1987           reset_edge_caches (where);
1988           /* Recursive inliner inlines all recursive calls of the function
1989              at once. Consequently we need to update all callee keys.  */
1990           if (opt_for_fn (edge->caller->decl, flag_indirect_inlining))
1991             add_new_edges_to_heap (&edge_heap, new_indirect_edges);
1992           update_callee_keys (&edge_heap, where, updated_nodes);
1993           bitmap_clear (updated_nodes);
1994         }
1995       else
1996         {
1997           struct cgraph_node *outer_node = NULL;
1998           int depth = 0;
1999
2000           /* Consider the case where self recursive function A is inlined
2001              into B.  This is desired optimization in some cases, since it
2002              leads to effect similar of loop peeling and we might completely
2003              optimize out the recursive call.  However we must be extra
2004              selective.  */
2005
2006           where = edge->caller;
2007           while (where->global.inlined_to)
2008             {
2009               if (where->decl == callee->decl)
2010                 outer_node = where, depth++;
2011               where = where->callers->caller;
2012             }
2013           if (outer_node
2014               && !want_inline_self_recursive_call_p (edge, outer_node,
2015                                                      true, depth))
2016             {
2017               edge->inline_failed
2018                 = (DECL_DISREGARD_INLINE_LIMITS (edge->callee->decl)
2019                    ? CIF_RECURSIVE_INLINING : CIF_UNSPECIFIED);
2020               resolve_noninline_speculation (&edge_heap, edge);
2021               continue;
2022             }
2023           else if (depth && dump_file)
2024             fprintf (dump_file, " Peeling recursion with depth %i\n", depth);
2025
2026           gcc_checking_assert (!callee->global.inlined_to);
2027           inline_call (edge, true, &new_indirect_edges, &overall_size, true);
2028           add_new_edges_to_heap (&edge_heap, new_indirect_edges);
2029
2030           reset_edge_caches (edge->callee);
2031
2032           update_callee_keys (&edge_heap, where, updated_nodes);
2033         }
2034       where = edge->caller;
2035       if (where->global.inlined_to)
2036         where = where->global.inlined_to;
2037
2038       /* Our profitability metric can depend on local properties
2039          such as number of inlinable calls and size of the function body.
2040          After inlining these properties might change for the function we
2041          inlined into (since it's body size changed) and for the functions
2042          called by function we inlined (since number of it inlinable callers
2043          might change).  */
2044       update_caller_keys (&edge_heap, where, updated_nodes, NULL);
2045       /* Offline copy count has possibly changed, recompute if profile is
2046          available.  */
2047       if (max_count)
2048         {
2049           struct cgraph_node *n = cgraph_node::get (edge->callee->decl);
2050           if (n != edge->callee && n->analyzed)
2051             update_callee_keys (&edge_heap, n, updated_nodes);
2052         }
2053       bitmap_clear (updated_nodes);
2054
2055       if (dump_file)
2056         {
2057           fprintf (dump_file,
2058                    " Inlined %s into %s which now has time %f and size %i, "
2059                    "net change of %+i.\n",
2060                    edge->callee->name (),
2061                    edge->caller->name (),
2062                    inline_summaries->get (edge->caller)->time.to_double (),
2063                    inline_summaries->get (edge->caller)->size,
2064                    overall_size - old_size);
2065         }
2066       if (min_size > overall_size)
2067         {
2068           min_size = overall_size;
2069           max_size = compute_max_insns (min_size);
2070
2071           if (dump_file)
2072             fprintf (dump_file, "New minimal size reached: %i\n", min_size);
2073         }
2074     }
2075
2076   free_growth_caches ();
2077   if (dump_file)
2078     fprintf (dump_file,
2079              "Unit growth for small function inlining: %i->%i (%i%%)\n",
2080              initial_size, overall_size,
2081              initial_size ? overall_size * 100 / (initial_size) - 100: 0);
2082   BITMAP_FREE (updated_nodes);
2083   symtab->remove_edge_removal_hook (edge_removal_hook_holder);
2084 }
2085
2086 /* Flatten NODE.  Performed both during early inlining and
2087    at IPA inlining time.  */
2088
2089 static void
2090 flatten_function (struct cgraph_node *node, bool early)
2091 {
2092   struct cgraph_edge *e;
2093
2094   /* We shouldn't be called recursively when we are being processed.  */
2095   gcc_assert (node->aux == NULL);
2096
2097   node->aux = (void *) node;
2098
2099   for (e = node->callees; e; e = e->next_callee)
2100     {
2101       struct cgraph_node *orig_callee;
2102       struct cgraph_node *callee = e->callee->ultimate_alias_target ();
2103
2104       /* We've hit cycle?  It is time to give up.  */
2105       if (callee->aux)
2106         {
2107           if (dump_file)
2108             fprintf (dump_file,
2109                      "Not inlining %s into %s to avoid cycle.\n",
2110                      xstrdup_for_dump (callee->name ()),
2111                      xstrdup_for_dump (e->caller->name ()));
2112           e->inline_failed = CIF_RECURSIVE_INLINING;
2113           continue;
2114         }
2115
2116       /* When the edge is already inlined, we just need to recurse into
2117          it in order to fully flatten the leaves.  */
2118       if (!e->inline_failed)
2119         {
2120           flatten_function (callee, early);
2121           continue;
2122         }
2123
2124       /* Flatten attribute needs to be processed during late inlining. For
2125          extra code quality we however do flattening during early optimization,
2126          too.  */
2127       if (!early
2128           ? !can_inline_edge_p (e, true)
2129           : !can_early_inline_edge_p (e))
2130         continue;
2131
2132       if (e->recursive_p ())
2133         {
2134           if (dump_file)
2135             fprintf (dump_file, "Not inlining: recursive call.\n");
2136           continue;
2137         }
2138
2139       if (gimple_in_ssa_p (DECL_STRUCT_FUNCTION (node->decl))
2140           != gimple_in_ssa_p (DECL_STRUCT_FUNCTION (callee->decl)))
2141         {
2142           if (dump_file)
2143             fprintf (dump_file, "Not inlining: SSA form does not match.\n");
2144           continue;
2145         }
2146
2147       /* Inline the edge and flatten the inline clone.  Avoid
2148          recursing through the original node if the node was cloned.  */
2149       if (dump_file)
2150         fprintf (dump_file, " Inlining %s into %s.\n",
2151                  xstrdup_for_dump (callee->name ()),
2152                  xstrdup_for_dump (e->caller->name ()));
2153       orig_callee = callee;
2154       inline_call (e, true, NULL, NULL, false);
2155       if (e->callee != orig_callee)
2156         orig_callee->aux = (void *) node;
2157       flatten_function (e->callee, early);
2158       if (e->callee != orig_callee)
2159         orig_callee->aux = NULL;
2160     }
2161
2162   node->aux = NULL;
2163   if (!node->global.inlined_to)
2164     inline_update_overall_summary (node);
2165 }
2166
2167 /* Inline NODE to all callers.  Worker for cgraph_for_node_and_aliases.
2168    DATA points to number of calls originally found so we avoid infinite
2169    recursion.  */
2170
2171 static bool
2172 inline_to_all_callers_1 (struct cgraph_node *node, void *data,
2173                          hash_set<cgraph_node *> *callers)
2174 {
2175   int *num_calls = (int *)data;
2176   bool callee_removed = false;
2177
2178   while (node->callers && !node->global.inlined_to)
2179     {
2180       struct cgraph_node *caller = node->callers->caller;
2181
2182       if (!can_inline_edge_p (node->callers, true)
2183           || node->callers->recursive_p ())
2184         {
2185           if (dump_file)
2186             fprintf (dump_file, "Uninlinable call found; giving up.\n");
2187           *num_calls = 0;
2188           return false;
2189         }
2190
2191       if (dump_file)
2192         {
2193           fprintf (dump_file,
2194                    "\nInlining %s size %i.\n",
2195                    node->name (),
2196                    inline_summaries->get (node)->size);
2197           fprintf (dump_file,
2198                    " Called once from %s %i insns.\n",
2199                    node->callers->caller->name (),
2200                    inline_summaries->get (node->callers->caller)->size);
2201         }
2202
2203       /* Remember which callers we inlined to, delaying updating the
2204          overall summary.  */
2205       callers->add (node->callers->caller);
2206       inline_call (node->callers, true, NULL, NULL, false, &callee_removed);
2207       if (dump_file)
2208         fprintf (dump_file,
2209                  " Inlined into %s which now has %i size\n",
2210                  caller->name (),
2211                  inline_summaries->get (caller)->size);
2212       if (!(*num_calls)--)
2213         {
2214           if (dump_file)
2215             fprintf (dump_file, "New calls found; giving up.\n");
2216           return callee_removed;
2217         }
2218       if (callee_removed)
2219         return true;
2220     }
2221   return false;
2222 }
2223
2224 /* Wrapper around inline_to_all_callers_1 doing delayed overall summary
2225    update.  */
2226
2227 static bool
2228 inline_to_all_callers (struct cgraph_node *node, void *data)
2229 {
2230   hash_set<cgraph_node *> callers;
2231   bool res = inline_to_all_callers_1 (node, data, &callers);
2232   /* Perform the delayed update of the overall summary of all callers
2233      processed.  This avoids quadratic behavior in the cases where
2234      we have a lot of calls to the same function.  */
2235   for (hash_set<cgraph_node *>::iterator i = callers.begin ();
2236        i != callers.end (); ++i)
2237     inline_update_overall_summary (*i);
2238   return res;
2239 }
2240
2241 /* Output overall time estimate.  */
2242 static void
2243 dump_overall_stats (void)
2244 {
2245   sreal sum_weighted = 0, sum = 0;
2246   struct cgraph_node *node;
2247
2248   FOR_EACH_DEFINED_FUNCTION (node)
2249     if (!node->global.inlined_to
2250         && !node->alias)
2251       {
2252         sreal time = inline_summaries->get (node)->time;
2253         sum += time;
2254         sum_weighted += time * node->count;
2255       }
2256   fprintf (dump_file, "Overall time estimate: "
2257            "%f weighted by profile: "
2258            "%f\n", sum.to_double (), sum_weighted.to_double ());
2259 }
2260
2261 /* Output some useful stats about inlining.  */
2262
2263 static void
2264 dump_inline_stats (void)
2265 {
2266   int64_t inlined_cnt = 0, inlined_indir_cnt = 0;
2267   int64_t inlined_virt_cnt = 0, inlined_virt_indir_cnt = 0;
2268   int64_t noninlined_cnt = 0, noninlined_indir_cnt = 0;
2269   int64_t noninlined_virt_cnt = 0, noninlined_virt_indir_cnt = 0;
2270   int64_t  inlined_speculative = 0, inlined_speculative_ply = 0;
2271   int64_t indirect_poly_cnt = 0, indirect_cnt = 0;
2272   int64_t reason[CIF_N_REASONS][3];
2273   int i;
2274   struct cgraph_node *node;
2275
2276   memset (reason, 0, sizeof (reason));
2277   FOR_EACH_DEFINED_FUNCTION (node)
2278   {
2279     struct cgraph_edge *e;
2280     for (e = node->callees; e; e = e->next_callee)
2281       {
2282         if (e->inline_failed)
2283           {
2284             reason[(int) e->inline_failed][0] += e->count;
2285             reason[(int) e->inline_failed][1] += e->frequency;
2286             reason[(int) e->inline_failed][2] ++;
2287             if (DECL_VIRTUAL_P (e->callee->decl))
2288               {
2289                 if (e->indirect_inlining_edge)
2290                   noninlined_virt_indir_cnt += e->count;
2291                 else
2292                   noninlined_virt_cnt += e->count;
2293               }
2294             else
2295               {
2296                 if (e->indirect_inlining_edge)
2297                   noninlined_indir_cnt += e->count;
2298                 else
2299                   noninlined_cnt += e->count;
2300               }
2301           }
2302         else
2303           {
2304             if (e->speculative)
2305               {
2306                 if (DECL_VIRTUAL_P (e->callee->decl))
2307                   inlined_speculative_ply += e->count;
2308                 else
2309                   inlined_speculative += e->count;
2310               }
2311             else if (DECL_VIRTUAL_P (e->callee->decl))
2312               {
2313                 if (e->indirect_inlining_edge)
2314                   inlined_virt_indir_cnt += e->count;
2315                 else
2316                   inlined_virt_cnt += e->count;
2317               }
2318             else
2319               {
2320                 if (e->indirect_inlining_edge)
2321                   inlined_indir_cnt += e->count;
2322                 else
2323                   inlined_cnt += e->count;
2324               }
2325           }
2326       }
2327     for (e = node->indirect_calls; e; e = e->next_callee)
2328       if (e->indirect_info->polymorphic)
2329         indirect_poly_cnt += e->count;
2330       else
2331         indirect_cnt += e->count;
2332   }
2333   if (max_count)
2334     {
2335       fprintf (dump_file,
2336                "Inlined %" PRId64 " + speculative "
2337                "%" PRId64 " + speculative polymorphic "
2338                "%" PRId64 " + previously indirect "
2339                "%" PRId64 " + virtual "
2340                "%" PRId64 " + virtual and previously indirect "
2341                "%" PRId64 "\n" "Not inlined "
2342                "%" PRId64 " + previously indirect "
2343                "%" PRId64 " + virtual "
2344                "%" PRId64 " + virtual and previously indirect "
2345                "%" PRId64 " + stil indirect "
2346                "%" PRId64 " + still indirect polymorphic "
2347                "%" PRId64 "\n", inlined_cnt,
2348                inlined_speculative, inlined_speculative_ply,
2349                inlined_indir_cnt, inlined_virt_cnt, inlined_virt_indir_cnt,
2350                noninlined_cnt, noninlined_indir_cnt, noninlined_virt_cnt,
2351                noninlined_virt_indir_cnt, indirect_cnt, indirect_poly_cnt);
2352       fprintf (dump_file,
2353                "Removed speculations %" PRId64 "\n",
2354                spec_rem);
2355     }
2356   dump_overall_stats ();
2357   fprintf (dump_file, "\nWhy inlining failed?\n");
2358   for (i = 0; i < CIF_N_REASONS; i++)
2359     if (reason[i][2])
2360       fprintf (dump_file, "%-50s: %8i calls, %8i freq, %" PRId64" count\n",
2361                cgraph_inline_failed_string ((cgraph_inline_failed_t) i),
2362                (int) reason[i][2], (int) reason[i][1], reason[i][0]);
2363 }
2364
2365 /* Decide on the inlining.  We do so in the topological order to avoid
2366    expenses on updating data structures.  */
2367
2368 static unsigned int
2369 ipa_inline (void)
2370 {
2371   struct cgraph_node *node;
2372   int nnodes;
2373   struct cgraph_node **order;
2374   int i;
2375   int cold;
2376   bool remove_functions = false;
2377
2378   if (!optimize)
2379     return 0;
2380
2381   cgraph_freq_base_rec = (sreal) 1 / (sreal) CGRAPH_FREQ_BASE;
2382   percent_rec = (sreal) 1 / (sreal) 100;
2383
2384   order = XCNEWVEC (struct cgraph_node *, symtab->cgraph_count);
2385
2386   if (in_lto_p && optimize)
2387     ipa_update_after_lto_read ();
2388
2389   if (dump_file)
2390     dump_inline_summaries (dump_file);
2391
2392   nnodes = ipa_reverse_postorder (order);
2393
2394   FOR_EACH_FUNCTION (node)
2395     {
2396       node->aux = 0;
2397
2398       /* Recompute the default reasons for inlining because they may have
2399          changed during merging.  */
2400       if (in_lto_p)
2401         {
2402           for (cgraph_edge *e = node->callees; e; e = e->next_callee)
2403             {
2404               gcc_assert (e->inline_failed);
2405               initialize_inline_failed (e);
2406             }
2407           for (cgraph_edge *e = node->indirect_calls; e; e = e->next_callee)
2408             initialize_inline_failed (e);
2409         }
2410     }
2411
2412   if (dump_file)
2413     fprintf (dump_file, "\nFlattening functions:\n");
2414
2415   /* In the first pass handle functions to be flattened.  Do this with
2416      a priority so none of our later choices will make this impossible.  */
2417   for (i = nnodes - 1; i >= 0; i--)
2418     {
2419       node = order[i];
2420
2421       /* Handle nodes to be flattened.
2422          Ideally when processing callees we stop inlining at the
2423          entry of cycles, possibly cloning that entry point and
2424          try to flatten itself turning it into a self-recursive
2425          function.  */
2426       if (lookup_attribute ("flatten",
2427                             DECL_ATTRIBUTES (node->decl)) != NULL)
2428         {
2429           if (dump_file)
2430             fprintf (dump_file,
2431                      "Flattening %s\n", node->name ());
2432           flatten_function (node, false);
2433         }
2434     }
2435   if (dump_file)
2436     dump_overall_stats ();
2437
2438   inline_small_functions ();
2439
2440   gcc_assert (symtab->state == IPA_SSA);
2441   symtab->state = IPA_SSA_AFTER_INLINING;
2442   /* Do first after-inlining removal.  We want to remove all "stale" extern
2443      inline functions and virtual functions so we really know what is called
2444      once.  */
2445   symtab->remove_unreachable_nodes (dump_file);
2446   free (order);
2447
2448   /* Inline functions with a property that after inlining into all callers the
2449      code size will shrink because the out-of-line copy is eliminated.
2450      We do this regardless on the callee size as long as function growth limits
2451      are met.  */
2452   if (dump_file)
2453     fprintf (dump_file,
2454              "\nDeciding on functions to be inlined into all callers and "
2455              "removing useless speculations:\n");
2456
2457   /* Inlining one function called once has good chance of preventing
2458      inlining other function into the same callee.  Ideally we should
2459      work in priority order, but probably inlining hot functions first
2460      is good cut without the extra pain of maintaining the queue.
2461
2462      ??? this is not really fitting the bill perfectly: inlining function
2463      into callee often leads to better optimization of callee due to
2464      increased context for optimization.
2465      For example if main() function calls a function that outputs help
2466      and then function that does the main optmization, we should inline
2467      the second with priority even if both calls are cold by themselves.
2468
2469      We probably want to implement new predicate replacing our use of
2470      maybe_hot_edge interpreted as maybe_hot_edge || callee is known
2471      to be hot.  */
2472   for (cold = 0; cold <= 1; cold ++)
2473     {
2474       FOR_EACH_DEFINED_FUNCTION (node)
2475         {
2476           struct cgraph_edge *edge, *next;
2477           bool update=false;
2478
2479           for (edge = node->callees; edge; edge = next)
2480             {
2481               next = edge->next_callee;
2482               if (edge->speculative && !speculation_useful_p (edge, false))
2483                 {
2484                   edge->resolve_speculation ();
2485                   spec_rem += edge->count;
2486                   update = true;
2487                   remove_functions = true;
2488                 }
2489             }
2490           if (update)
2491             {
2492               struct cgraph_node *where = node->global.inlined_to
2493                                           ? node->global.inlined_to : node;
2494               reset_edge_caches (where);
2495               inline_update_overall_summary (where);
2496             }
2497           if (want_inline_function_to_all_callers_p (node, cold))
2498             {
2499               int num_calls = 0;
2500               node->call_for_symbol_and_aliases (sum_callers, &num_calls,
2501                                                  true);
2502               while (node->call_for_symbol_and_aliases
2503                        (inline_to_all_callers, &num_calls, true))
2504                 ;
2505               remove_functions = true;
2506             }
2507         }
2508     }
2509
2510   /* Free ipa-prop structures if they are no longer needed.  */
2511   if (optimize)
2512     ipa_free_all_structures_after_iinln ();
2513
2514   if (dump_file)
2515     {
2516       fprintf (dump_file,
2517                "\nInlined %i calls, eliminated %i functions\n\n",
2518                ncalls_inlined, nfunctions_inlined);
2519       dump_inline_stats ();
2520     }
2521
2522   if (dump_file)
2523     dump_inline_summaries (dump_file);
2524   /* In WPA we use inline summaries for partitioning process.  */
2525   if (!flag_wpa)
2526     inline_free_summary ();
2527   return remove_functions ? TODO_remove_functions : 0;
2528 }
2529
2530 /* Inline always-inline function calls in NODE.  */
2531
2532 static bool
2533 inline_always_inline_functions (struct cgraph_node *node)
2534 {
2535   struct cgraph_edge *e;
2536   bool inlined = false;
2537
2538   for (e = node->callees; e; e = e->next_callee)
2539     {
2540       struct cgraph_node *callee = e->callee->ultimate_alias_target ();
2541       if (!DECL_DISREGARD_INLINE_LIMITS (callee->decl))
2542         continue;
2543
2544       if (e->recursive_p ())
2545         {
2546           if (dump_file)
2547             fprintf (dump_file, "  Not inlining recursive call to %s.\n",
2548                      e->callee->name ());
2549           e->inline_failed = CIF_RECURSIVE_INLINING;
2550           continue;
2551         }
2552
2553       if (!can_early_inline_edge_p (e))
2554         {
2555           /* Set inlined to true if the callee is marked "always_inline" but
2556              is not inlinable.  This will allow flagging an error later in
2557              expand_call_inline in tree-inline.c.  */
2558           if (lookup_attribute ("always_inline",
2559                                  DECL_ATTRIBUTES (callee->decl)) != NULL)
2560             inlined = true;
2561           continue;
2562         }
2563
2564       if (dump_file)
2565         fprintf (dump_file, "  Inlining %s into %s (always_inline).\n",
2566                  xstrdup_for_dump (e->callee->name ()),
2567                  xstrdup_for_dump (e->caller->name ()));
2568       inline_call (e, true, NULL, NULL, false);
2569       inlined = true;
2570     }
2571   if (inlined)
2572     inline_update_overall_summary (node);
2573
2574   return inlined;
2575 }
2576
2577 /* Decide on the inlining.  We do so in the topological order to avoid
2578    expenses on updating data structures.  */
2579
2580 static bool
2581 early_inline_small_functions (struct cgraph_node *node)
2582 {
2583   struct cgraph_edge *e;
2584   bool inlined = false;
2585
2586   for (e = node->callees; e; e = e->next_callee)
2587     {
2588       struct cgraph_node *callee = e->callee->ultimate_alias_target ();
2589       if (!inline_summaries->get (callee)->inlinable
2590           || !e->inline_failed)
2591         continue;
2592
2593       /* Do not consider functions not declared inline.  */
2594       if (!DECL_DECLARED_INLINE_P (callee->decl)
2595           && !opt_for_fn (node->decl, flag_inline_small_functions)
2596           && !opt_for_fn (node->decl, flag_inline_functions))
2597         continue;
2598
2599       if (dump_file)
2600         fprintf (dump_file, "Considering inline candidate %s.\n",
2601                  callee->name ());
2602
2603       if (!can_early_inline_edge_p (e))
2604         continue;
2605
2606       if (e->recursive_p ())
2607         {
2608           if (dump_file)
2609             fprintf (dump_file, "  Not inlining: recursive call.\n");
2610           continue;
2611         }
2612
2613       if (!want_early_inline_function_p (e))
2614         continue;
2615
2616       if (dump_file)
2617         fprintf (dump_file, " Inlining %s into %s.\n",
2618                  xstrdup_for_dump (callee->name ()),
2619                  xstrdup_for_dump (e->caller->name ()));
2620       inline_call (e, true, NULL, NULL, false);
2621       inlined = true;
2622     }
2623
2624   if (inlined)
2625     inline_update_overall_summary (node);
2626
2627   return inlined;
2628 }
2629
2630 unsigned int
2631 early_inliner (function *fun)
2632 {
2633   struct cgraph_node *node = cgraph_node::get (current_function_decl);
2634   struct cgraph_edge *edge;
2635   unsigned int todo = 0;
2636   int iterations = 0;
2637   bool inlined = false;
2638
2639   if (seen_error ())
2640     return 0;
2641
2642   /* Do nothing if datastructures for ipa-inliner are already computed.  This
2643      happens when some pass decides to construct new function and
2644      cgraph_add_new_function calls lowering passes and early optimization on
2645      it.  This may confuse ourself when early inliner decide to inline call to
2646      function clone, because function clones don't have parameter list in
2647      ipa-prop matching their signature.  */
2648   if (ipa_node_params_sum)
2649     return 0;
2650
2651   if (flag_checking)
2652     node->verify ();
2653   node->remove_all_references ();
2654
2655   /* Rebuild this reference because it dosn't depend on
2656      function's body and it's required to pass cgraph_node
2657      verification.  */
2658   if (node->instrumented_version
2659       && !node->instrumentation_clone)
2660     node->create_reference (node->instrumented_version, IPA_REF_CHKP, NULL);
2661
2662   /* Even when not optimizing or not inlining inline always-inline
2663      functions.  */
2664   inlined = inline_always_inline_functions (node);
2665
2666   if (!optimize
2667       || flag_no_inline
2668       || !flag_early_inlining
2669       /* Never inline regular functions into always-inline functions
2670          during incremental inlining.  This sucks as functions calling
2671          always inline functions will get less optimized, but at the
2672          same time inlining of functions calling always inline
2673          function into an always inline function might introduce
2674          cycles of edges to be always inlined in the callgraph.
2675
2676          We might want to be smarter and just avoid this type of inlining.  */
2677       || (DECL_DISREGARD_INLINE_LIMITS (node->decl)
2678           && lookup_attribute ("always_inline",
2679                                DECL_ATTRIBUTES (node->decl))))
2680     ;
2681   else if (lookup_attribute ("flatten",
2682                              DECL_ATTRIBUTES (node->decl)) != NULL)
2683     {
2684       /* When the function is marked to be flattened, recursively inline
2685          all calls in it.  */
2686       if (dump_file)
2687         fprintf (dump_file,
2688                  "Flattening %s\n", node->name ());
2689       flatten_function (node, true);
2690       inlined = true;
2691     }
2692   else
2693     {
2694       /* If some always_inline functions was inlined, apply the changes.
2695          This way we will not account always inline into growth limits and
2696          moreover we will inline calls from always inlines that we skipped
2697          previously because of conditional above.  */
2698       if (inlined)
2699         {
2700           timevar_push (TV_INTEGRATION);
2701           todo |= optimize_inline_calls (current_function_decl);
2702           /* optimize_inline_calls call above might have introduced new
2703              statements that don't have inline parameters computed.  */
2704           for (edge = node->callees; edge; edge = edge->next_callee)
2705             {
2706               if (inline_edge_summary_vec.length () > (unsigned) edge->uid)
2707                 {
2708                   struct inline_edge_summary *es = inline_edge_summary (edge);
2709                   es->call_stmt_size
2710                     = estimate_num_insns (edge->call_stmt, &eni_size_weights);
2711                   es->call_stmt_time
2712                     = estimate_num_insns (edge->call_stmt, &eni_time_weights);
2713                 }
2714             }
2715           inline_update_overall_summary (node);
2716           inlined = false;
2717           timevar_pop (TV_INTEGRATION);
2718         }
2719       /* We iterate incremental inlining to get trivial cases of indirect
2720          inlining.  */
2721       while (iterations < PARAM_VALUE (PARAM_EARLY_INLINER_MAX_ITERATIONS)
2722              && early_inline_small_functions (node))
2723         {
2724           timevar_push (TV_INTEGRATION);
2725           todo |= optimize_inline_calls (current_function_decl);
2726
2727           /* Technically we ought to recompute inline parameters so the new
2728              iteration of early inliner works as expected.  We however have
2729              values approximately right and thus we only need to update edge
2730              info that might be cleared out for newly discovered edges.  */
2731           for (edge = node->callees; edge; edge = edge->next_callee)
2732             {
2733               /* We have no summary for new bound store calls yet.  */
2734               if (inline_edge_summary_vec.length () > (unsigned)edge->uid)
2735                 {
2736                   struct inline_edge_summary *es = inline_edge_summary (edge);
2737                   es->call_stmt_size
2738                     = estimate_num_insns (edge->call_stmt, &eni_size_weights);
2739                   es->call_stmt_time
2740                     = estimate_num_insns (edge->call_stmt, &eni_time_weights);
2741                 }
2742               if (edge->callee->decl
2743                   && !gimple_check_call_matching_types (
2744                       edge->call_stmt, edge->callee->decl, false))
2745                 {
2746                   edge->inline_failed = CIF_MISMATCHED_ARGUMENTS;
2747                   edge->call_stmt_cannot_inline_p = true;
2748                 }
2749             }
2750           if (iterations < PARAM_VALUE (PARAM_EARLY_INLINER_MAX_ITERATIONS) - 1)
2751             inline_update_overall_summary (node);
2752           timevar_pop (TV_INTEGRATION);
2753           iterations++;
2754           inlined = false;
2755         }
2756       if (dump_file)
2757         fprintf (dump_file, "Iterations: %i\n", iterations);
2758     }
2759
2760   if (inlined)
2761     {
2762       timevar_push (TV_INTEGRATION);
2763       todo |= optimize_inline_calls (current_function_decl);
2764       timevar_pop (TV_INTEGRATION);
2765     }
2766
2767   fun->always_inline_functions_inlined = true;
2768
2769   return todo;
2770 }
2771
2772 /* Do inlining of small functions.  Doing so early helps profiling and other
2773    passes to be somewhat more effective and avoids some code duplication in
2774    later real inlining pass for testcases with very many function calls.  */
2775
2776 namespace {
2777
2778 const pass_data pass_data_early_inline =
2779 {
2780   GIMPLE_PASS, /* type */
2781   "einline", /* name */
2782   OPTGROUP_INLINE, /* optinfo_flags */
2783   TV_EARLY_INLINING, /* tv_id */
2784   PROP_ssa, /* properties_required */
2785   0, /* properties_provided */
2786   0, /* properties_destroyed */
2787   0, /* todo_flags_start */
2788   0, /* todo_flags_finish */
2789 };
2790
2791 class pass_early_inline : public gimple_opt_pass
2792 {
2793 public:
2794   pass_early_inline (gcc::context *ctxt)
2795     : gimple_opt_pass (pass_data_early_inline, ctxt)
2796   {}
2797
2798   /* opt_pass methods: */
2799   virtual unsigned int execute (function *);
2800
2801 }; // class pass_early_inline
2802
2803 unsigned int
2804 pass_early_inline::execute (function *fun)
2805 {
2806   return early_inliner (fun);
2807 }
2808
2809 } // anon namespace
2810
2811 gimple_opt_pass *
2812 make_pass_early_inline (gcc::context *ctxt)
2813 {
2814   return new pass_early_inline (ctxt);
2815 }
2816
2817 namespace {
2818
2819 const pass_data pass_data_ipa_inline =
2820 {
2821   IPA_PASS, /* type */
2822   "inline", /* name */
2823   OPTGROUP_INLINE, /* optinfo_flags */
2824   TV_IPA_INLINING, /* tv_id */
2825   0, /* properties_required */
2826   0, /* properties_provided */
2827   0, /* properties_destroyed */
2828   0, /* todo_flags_start */
2829   ( TODO_dump_symtab ), /* todo_flags_finish */
2830 };
2831
2832 class pass_ipa_inline : public ipa_opt_pass_d
2833 {
2834 public:
2835   pass_ipa_inline (gcc::context *ctxt)
2836     : ipa_opt_pass_d (pass_data_ipa_inline, ctxt,
2837                       inline_generate_summary, /* generate_summary */
2838                       inline_write_summary, /* write_summary */
2839                       inline_read_summary, /* read_summary */
2840                       NULL, /* write_optimization_summary */
2841                       NULL, /* read_optimization_summary */
2842                       NULL, /* stmt_fixup */
2843                       0, /* function_transform_todo_flags_start */
2844                       inline_transform, /* function_transform */
2845                       NULL) /* variable_transform */
2846   {}
2847
2848   /* opt_pass methods: */
2849   virtual unsigned int execute (function *) { return ipa_inline (); }
2850
2851 }; // class pass_ipa_inline
2852
2853 } // anon namespace
2854
2855 ipa_opt_pass_d *
2856 make_pass_ipa_inline (gcc::context *ctxt)
2857 {
2858   return new pass_ipa_inline (ctxt);
2859 }