1 /* Inlining decision heuristics.
2 Copyright (C) 2003-2013 Free Software Foundation, Inc.
3 Contributed by Jan Hubicka
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 3, or (at your option) any later
10 version.
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
15 for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
21 /* Inlining decision heuristics
23 The implementation of the inliner is organized as follows:
25 inlining heuristics limits
27 can_inline_edge_p allows checking that a particular inlining is allowed
28 by the limits specified by the user (allowed function growth, stack growth
29 and so on).
31 Functions are inlined when it is obvious the result is profitable (such
32 as functions called once or when inlining reduces code size).
33 In addition to that we perform inlining of small functions and recursive
34 inlining.
36 inlining heuristics
38 The inliner itself is split into two passes:
40 pass_early_inlining
42 A simple local inlining pass inlining callees into the current function.
43 This pass makes no use of whole-unit analysis and thus it can make only
44 very simple decisions based on local properties.
46 The strength of the pass is that it is run in topological order
47 (reverse postorder) on the callgraph. Functions are converted into SSA
48 form just before this pass and optimized subsequently. As a result, the
49 callees of the function seen by the early inliner have already been optimized
50 and the results of early inlining add a lot of optimization opportunities
51 for local optimization.
53 The pass handles the obvious inlining decisions within the compilation
54 unit - inlining auto inline functions, inlining for size and
55 flattening.
57 The main strength of the pass is the ability to eliminate the abstraction
58 penalty in C++ code (via a combination of inlining and early
59 optimization) and thus improve the quality of analysis done by the real IPA
60 optimizers.
62 Because of the lack of whole-unit knowledge, the pass cannot really make
63 good code size/performance tradeoffs. It does, however, perform very simple
64 speculative inlining, allowing code size to grow by
65 EARLY_INLINING_INSNS when the callee is a leaf function. In this case the
66 optimizations performed later are very likely to eliminate the cost.
68 pass_ipa_inline
70 This is the real inliner able to handle inlining with whole program
71 knowledge. It performs the following steps:
73 1) inlining of small functions. This is implemented by a greedy
74 algorithm ordering all inlinable cgraph edges by their badness and
75 inlining them in this order as long as the inline limits allow doing so.
77 This heuristic is not very good at inlining recursive calls. Recursive
78 calls can be inlined with results similar to loop unrolling. To do so,
79 a special purpose recursive inliner is executed on the function when a
80 recursive edge is met as a viable candidate.
82 2) Unreachable functions are removed from the callgraph. Inlining leads
83 to devirtualization and other modifications of the callgraph, so functions
84 may become unreachable during the process. Also functions declared as
85 extern inline or virtual functions are removed, since after inlining
86 we no longer need the offline bodies.
88 3) Functions called once and not exported from the unit are inlined.
89 This should almost always lead to a reduction of code size by eliminating
90 the need for an offline copy of the function. */
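/* A purely illustrative example of step 3 above (hypothetical code, not
part of GCC):

static int add_tax (int price) { return price + price / 5; }
int checkout (int price) { return add_tax (price); }

ADD_TAX has a single static caller, so inlining it into CHECKOUT and
removing the now unreachable offline body shrinks the unit even though
CHECKOUT itself grows slightly. */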
92 #include "config.h"
93 #include "system.h"
94 #include "coretypes.h"
95 #include "tm.h"
96 #include "tree.h"
97 #include "tree-inline.h"
98 #include "langhooks.h"
99 #include "flags.h"
100 #include "cgraph.h"
101 #include "diagnostic.h"
102 #include "gimple-pretty-print.h"
103 #include "params.h"
104 #include "fibheap.h"
105 #include "intl.h"
106 #include "tree-pass.h"
107 #include "coverage.h"
108 #include "ggc.h"
109 #include "rtl.h"
110 #include "tree-flow.h"
111 #include "ipa-prop.h"
112 #include "except.h"
113 #include "target.h"
114 #include "ipa-inline.h"
115 #include "ipa-utils.h"
117 /* Statistics we collect about inlining algorithm. */
118 static int overall_size;
119 static gcov_type max_count;
121 /* Return false when inlining edge E would lead to violating
122 limits on function unit growth or stack usage growth.
124 The relative function body growth limit is present generally
125 to avoid problems with non-linear behavior of the compiler.
126 To allow inlining huge functions into tiny wrappers, the limit
127 is always based on the bigger of the two functions considered.
129 For stack growth limits we always base the growth on the stack usage
130 of the callers. We want to prevent applications from segfaulting
131 on stack overflow when functions with huge stack frames get
132 inlined. */
134 static bool
135 caller_growth_limits (struct cgraph_edge *e)
137 struct cgraph_node *to = e->caller;
138 struct cgraph_node *what = cgraph_function_or_thunk_node (e->callee, NULL);
139 int newsize;
140 int limit = 0;
141 HOST_WIDE_INT stack_size_limit = 0, inlined_stack;
142 struct inline_summary *info, *what_info, *outer_info = inline_summary (to);
144 /* Look for the function e->caller is inlined into. While doing
145 so, work out the largest function body on the way. As
146 described above, we want to base our function growth
147 limits on that: not on the self size of the
148 outer function, nor on the self size of the inline code
149 we immediately inline into. This is the most relaxed
150 interpretation of the rule "do not grow large functions
151 too much in order to prevent the compiler from exploding". */
152 while (true)
154 info = inline_summary (to);
155 if (limit < info->self_size)
156 limit = info->self_size;
157 if (stack_size_limit < info->estimated_self_stack_size)
158 stack_size_limit = info->estimated_self_stack_size;
159 if (to->global.inlined_to)
160 to = to->callers->caller;
161 else
162 break;
165 what_info = inline_summary (what);
167 if (limit < what_info->self_size)
168 limit = what_info->self_size;
170 limit += limit * PARAM_VALUE (PARAM_LARGE_FUNCTION_GROWTH) / 100;
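/* For illustration, assuming --param large-function-growth=100: a LIMIT
of 2000 becomes 2000 + 2000 * 100 / 100 = 4000, i.e. the bigger of the
two bodies is allowed to at most double. */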
172 /* Check the size after inlining against the function limits. But allow
173 the function to shrink if it went over the limits by forced inlining. */
174 newsize = estimate_size_after_inlining (to, e);
175 if (newsize >= info->size
176 && newsize > PARAM_VALUE (PARAM_LARGE_FUNCTION_INSNS)
177 && newsize > limit)
179 e->inline_failed = CIF_LARGE_FUNCTION_GROWTH_LIMIT;
180 return false;
183 if (!what_info->estimated_stack_size)
184 return true;
186 /* FIXME: The stack size limit often prevents inlining in Fortran programs
187 due to large I/O data structures used by the Fortran front end.
188 We ought to ignore this limit when we know that the edge is executed
189 on every invocation of the caller (i.e. its call statement dominates
190 the exit block). We do not track this information yet. */
191 stack_size_limit += ((gcov_type)stack_size_limit
192 * PARAM_VALUE (PARAM_STACK_FRAME_GROWTH) / 100);
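/* For illustration, assuming --param stack-frame-growth=1000: a self
stack size of 256 bytes yields a limit of 256 + 256 * 1000 / 100
= 2816 bytes of combined stack frame. */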
194 inlined_stack = (outer_info->stack_frame_offset
195 + outer_info->estimated_self_stack_size
196 + what_info->estimated_stack_size);
197 /* Compare the new stack consumption with the stack consumption at the place
198 where the stack is used. */
199 if (inlined_stack > stack_size_limit
200 /* If the function already has large stack usage from a sibling
201 inline call, we can inline too.
202 This bit over-optimistically assumes that we are good at stack
203 packing. */
204 && inlined_stack > info->estimated_stack_size
205 && inlined_stack > PARAM_VALUE (PARAM_LARGE_STACK_FRAME))
207 e->inline_failed = CIF_LARGE_STACK_FRAME_GROWTH_LIMIT;
208 return false;
210 return true;
213 /* Dump info about why inlining has failed. */
215 static void
216 report_inline_failed_reason (struct cgraph_edge *e)
218 if (dump_file)
220 fprintf (dump_file, " not inlinable: %s/%i -> %s/%i, %s\n",
221 xstrdup (cgraph_node_name (e->caller)), e->caller->symbol.order,
222 xstrdup (cgraph_node_name (e->callee)), e->callee->symbol.order,
223 cgraph_inline_failed_string (e->inline_failed));
227 /* Decide if we can inline the edge and possibly update
228 inline_failed reason.
229 We check whether inlining is possible at all and whether
230 caller growth limits allow doing so.
232 If REPORT is true, output the reason to the dump file.
234 If DISREGARD_LIMITS is true, ignore size limits. */
236 static bool
237 can_inline_edge_p (struct cgraph_edge *e, bool report,
238 bool disregard_limits = false)
240 bool inlinable = true;
241 enum availability avail;
242 struct cgraph_node *callee
243 = cgraph_function_or_thunk_node (e->callee, &avail);
244 tree caller_tree = DECL_FUNCTION_SPECIFIC_OPTIMIZATION (e->caller->symbol.decl);
245 tree callee_tree
246 = callee ? DECL_FUNCTION_SPECIFIC_OPTIMIZATION (callee->symbol.decl) : NULL;
247 struct function *caller_cfun = DECL_STRUCT_FUNCTION (e->caller->symbol.decl);
248 struct function *callee_cfun
249 = callee ? DECL_STRUCT_FUNCTION (callee->symbol.decl) : NULL;
251 if (!caller_cfun && e->caller->clone_of)
252 caller_cfun = DECL_STRUCT_FUNCTION (e->caller->clone_of->symbol.decl);
254 if (!callee_cfun && callee && callee->clone_of)
255 callee_cfun = DECL_STRUCT_FUNCTION (callee->clone_of->symbol.decl);
257 gcc_assert (e->inline_failed);
259 if (!callee || !callee->symbol.definition)
261 e->inline_failed = CIF_BODY_NOT_AVAILABLE;
262 inlinable = false;
264 else if (!inline_summary (callee)->inlinable)
266 e->inline_failed = CIF_FUNCTION_NOT_INLINABLE;
267 inlinable = false;
269 else if (avail <= AVAIL_OVERWRITABLE)
271 e->inline_failed = CIF_OVERWRITABLE;
272 inlinable = false;
274 else if (e->call_stmt_cannot_inline_p)
276 e->inline_failed = CIF_MISMATCHED_ARGUMENTS;
277 inlinable = false;
279 /* Don't inline if the functions have different EH personalities. */
280 else if (DECL_FUNCTION_PERSONALITY (e->caller->symbol.decl)
281 && DECL_FUNCTION_PERSONALITY (callee->symbol.decl)
282 && (DECL_FUNCTION_PERSONALITY (e->caller->symbol.decl)
283 != DECL_FUNCTION_PERSONALITY (callee->symbol.decl)))
285 e->inline_failed = CIF_EH_PERSONALITY;
286 inlinable = false;
288 /* TM pure functions should not be inlined into non-TM_pure
289 functions. */
290 else if (is_tm_pure (callee->symbol.decl)
291 && !is_tm_pure (e->caller->symbol.decl))
293 e->inline_failed = CIF_UNSPECIFIED;
294 inlinable = false;
296 /* Don't inline if the callee can throw non-call exceptions but the
297 caller cannot.
298 FIXME: this is obviously wrong for LTO where STRUCT_FUNCTION is missing.
299 Move the flag into cgraph node or mirror it in the inline summary. */
300 else if (callee_cfun && callee_cfun->can_throw_non_call_exceptions
301 && !(caller_cfun && caller_cfun->can_throw_non_call_exceptions))
303 e->inline_failed = CIF_NON_CALL_EXCEPTIONS;
304 inlinable = false;
306 /* Check compatibility of target optimization options. */
307 else if (!targetm.target_option.can_inline_p (e->caller->symbol.decl,
308 callee->symbol.decl))
310 e->inline_failed = CIF_TARGET_OPTION_MISMATCH;
311 inlinable = false;
313 /* Check if caller growth allows the inlining. */
314 else if (!DECL_DISREGARD_INLINE_LIMITS (callee->symbol.decl)
315 && !disregard_limits
316 && !lookup_attribute ("flatten",
317 DECL_ATTRIBUTES
318 (e->caller->global.inlined_to
319 ? e->caller->global.inlined_to->symbol.decl
320 : e->caller->symbol.decl))
321 && !caller_growth_limits (e))
322 inlinable = false;
323 /* Don't inline a function with a higher optimization level than the
324 caller. FIXME: this is really just tip of iceberg of handling
325 optimization attribute. */
326 else if (caller_tree != callee_tree)
328 struct cl_optimization *caller_opt
329 = TREE_OPTIMIZATION ((caller_tree)
330 ? caller_tree
331 : optimization_default_node);
333 struct cl_optimization *callee_opt
334 = TREE_OPTIMIZATION ((callee_tree)
335 ? callee_tree
336 : optimization_default_node);
338 if (((caller_opt->x_optimize > callee_opt->x_optimize)
339 || (caller_opt->x_optimize_size != callee_opt->x_optimize_size))
340 /* gcc.dg/pr43564.c. Look at forced inline even in -O0. */
341 && !DECL_DISREGARD_INLINE_LIMITS (e->callee->symbol.decl))
343 e->inline_failed = CIF_OPTIMIZATION_MISMATCH;
344 inlinable = false;
348 if (!inlinable && report)
349 report_inline_failed_reason (e);
350 return inlinable;
354 /* Return true if the edge E is inlinable during early inlining. */
356 static bool
357 can_early_inline_edge_p (struct cgraph_edge *e)
359 struct cgraph_node *callee = cgraph_function_or_thunk_node (e->callee,
360 NULL);
361 /* The early inliner might get called at the WPA stage when an IPA pass adds a new
362 function. In this case we cannot really do any early inlining
363 because function bodies are missing. */
364 if (!gimple_has_body_p (callee->symbol.decl))
366 e->inline_failed = CIF_BODY_NOT_AVAILABLE;
367 return false;
369 /* In the early inliner some of the callees may not be in SSA form yet
370 (i.e. the callgraph is cyclic and we did not process
371 the callee by the early inliner yet). We don't have a CIF code for this
372 case; later we will re-do the decision in the real inliner. */
373 if (!gimple_in_ssa_p (DECL_STRUCT_FUNCTION (e->caller->symbol.decl))
374 || !gimple_in_ssa_p (DECL_STRUCT_FUNCTION (callee->symbol.decl)))
376 if (dump_file)
377 fprintf (dump_file, " edge not inlinable: not in SSA form\n");
378 return false;
380 if (!can_inline_edge_p (e, true))
381 return false;
382 return true;
386 /* Return number of calls in N. Ignore cheap builtins. */
388 static int
389 num_calls (struct cgraph_node *n)
391 struct cgraph_edge *e;
392 int num = 0;
394 for (e = n->callees; e; e = e->next_callee)
395 if (!is_inexpensive_builtin (e->callee->symbol.decl))
396 num++;
397 return num;
403 /* Return true if we are interested in inlining the small function called by edge E during early inlining. */
403 static bool
404 want_early_inline_function_p (struct cgraph_edge *e)
406 bool want_inline = true;
407 struct cgraph_node *callee = cgraph_function_or_thunk_node (e->callee, NULL);
409 if (DECL_DISREGARD_INLINE_LIMITS (callee->symbol.decl))
411 else if (!DECL_DECLARED_INLINE_P (callee->symbol.decl)
412 && !flag_inline_small_functions)
414 e->inline_failed = CIF_FUNCTION_NOT_INLINE_CANDIDATE;
415 report_inline_failed_reason (e);
416 want_inline = false;
418 else
420 int growth = estimate_edge_growth (e);
421 int n;
423 if (growth <= 0)
425 else if (!cgraph_maybe_hot_edge_p (e)
426 && growth > 0)
428 if (dump_file)
429 fprintf (dump_file, " will not early inline: %s/%i->%s/%i, "
430 "call is cold and code would grow by %i\n",
431 xstrdup (cgraph_node_name (e->caller)),
432 e->caller->symbol.order,
433 xstrdup (cgraph_node_name (callee)), callee->symbol.order,
434 growth);
435 want_inline = false;
437 else if (growth > PARAM_VALUE (PARAM_EARLY_INLINING_INSNS))
439 if (dump_file)
440 fprintf (dump_file, " will not early inline: %s/%i->%s/%i, "
441 "growth %i exceeds --param early-inlining-insns\n",
442 xstrdup (cgraph_node_name (e->caller)),
443 e->caller->symbol.order,
444 xstrdup (cgraph_node_name (callee)), callee->symbol.order,
445 growth);
446 want_inline = false;
448 else if ((n = num_calls (callee)) != 0
449 && growth * (n + 1) > PARAM_VALUE (PARAM_EARLY_INLINING_INSNS))
451 if (dump_file)
452 fprintf (dump_file, " will not early inline: %s/%i->%s/%i, "
453 "growth %i exceeds --param early-inlining-insns "
454 "divided by number of calls\n",
455 xstrdup (cgraph_node_name (e->caller)),
456 e->caller->symbol.order,
457 xstrdup (cgraph_node_name (callee)), callee->symbol.order,
458 growth);
459 want_inline = false;
462 return want_inline;
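/* A worked example of the tests above (parameter value chosen purely for
illustration): with --param early-inlining-insns=11, a callee whose
inlining grows the caller by 4 insns and which itself contains 2
non-builtin calls is rejected, because 4 * (2 + 1) = 12 > 11, whereas
the same callee containing a single call passes (4 * 2 = 8 <= 11). */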
465 /* Compute the execution time of edge->caller + edge->callee when inlining
466 does not happen. */
468 inline gcov_type
469 compute_uninlined_call_time (struct inline_summary *callee_info,
470 struct cgraph_edge *edge)
472 gcov_type uninlined_call_time =
473 RDIV ((gcov_type)callee_info->time * MAX (edge->frequency, 1),
474 CGRAPH_FREQ_BASE);
475 gcov_type caller_time = inline_summary (edge->caller->global.inlined_to
476 ? edge->caller->global.inlined_to
477 : edge->caller)->time;
478 return uninlined_call_time + caller_time;
481 /* Same as compute_uninlined_call_time but compute the time when inlining
482 does happen. */
484 inline gcov_type
485 compute_inlined_call_time (struct cgraph_edge *edge,
486 int edge_time)
488 gcov_type caller_time = inline_summary (edge->caller->global.inlined_to
489 ? edge->caller->global.inlined_to
490 : edge->caller)->time;
491 gcov_type time = (caller_time
492 + RDIV (((gcov_type) edge_time
493 - inline_edge_summary (edge)->call_stmt_time)
494 * MAX (edge->frequency, 1), CGRAPH_FREQ_BASE));
495 /* Possibly one roundoff error, but watch for overflows. */
496 gcc_checking_assert (time >= INT_MIN / 2);
497 if (time < 0)
498 time = 0;
499 return time;
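/* For illustration, with CGRAPH_FREQ_BASE of 1000: a callee with estimated
time 500, called with frequency 2000 (roughly twice per caller invocation)
from a caller whose own time is 300, has an uninlined time of
500 * 2000 / 1000 + 300 = 1300; if EDGE_TIME minus the call statement time
is estimated at 400, the inlined time is 300 + 400 * 2000 / 1000 = 1100. */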
502 /* Return true if the speedup for inlining E is bigger than
503 PARAM_INLINE_MIN_SPEEDUP. */
505 static bool
506 big_speedup_p (struct cgraph_edge *e)
508 gcov_type time = compute_uninlined_call_time (inline_summary (e->callee), e);
510 gcov_type inlined_time = compute_inlined_call_time (e,
511 estimate_edge_time (e));
512 if (time - inlined_time
513 > RDIV (time * PARAM_VALUE (PARAM_INLINE_MIN_SPEEDUP), 100))
514 return true;
515 return false;
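/* A worked example (parameter value for illustration only): with
--param inline-min-speedup=10, an uninlined caller+callee time of 1000
against an estimated inlined time of 880 is a big speedup
(1000 - 880 = 120 > 1000 * 10 / 100 = 100); an inlined time of 950 is not. */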
518 /* Return true if we are interested in inlining the small function called by E.
519 When REPORT is true, report the reason to the dump file. */
521 static bool
522 want_inline_small_function_p (struct cgraph_edge *e, bool report)
524 bool want_inline = true;
525 struct cgraph_node *callee = cgraph_function_or_thunk_node (e->callee, NULL);
527 if (DECL_DISREGARD_INLINE_LIMITS (callee->symbol.decl))
529 else if (!DECL_DECLARED_INLINE_P (callee->symbol.decl)
530 && !flag_inline_small_functions)
532 e->inline_failed = CIF_FUNCTION_NOT_INLINE_CANDIDATE;
533 want_inline = false;
535 else
537 int growth = estimate_edge_growth (e);
538 inline_hints hints = estimate_edge_hints (e);
539 bool big_speedup = big_speedup_p (e);
541 if (growth <= 0)
543 /* Apply MAX_INLINE_INSNS_SINGLE limit. Do not do so when
544 hints suggest that inlining the given function is very profitable. */
545 else if (DECL_DECLARED_INLINE_P (callee->symbol.decl)
546 && growth >= MAX_INLINE_INSNS_SINGLE
547 && !big_speedup
548 && !(hints & (INLINE_HINT_indirect_call
549 | INLINE_HINT_loop_iterations
550 | INLINE_HINT_array_index
551 | INLINE_HINT_loop_stride)))
553 e->inline_failed = CIF_MAX_INLINE_INSNS_SINGLE_LIMIT;
554 want_inline = false;
556 /* Before giving up based on the fact that the caller size will grow, allow
557 functions that are called few times and where eliminating the offline
558 copy will lead to an overall code size reduction.
559 Not all of these will be handled by subsequent inlining of functions
560 called once: in particular weak functions are not handled, nor are functions
561 that inline to multiple calls but where a lot of the bodies are optimized out.
562 Finally we want to inline earlier to allow inlining of callbacks.
564 This is slightly wrong on the aggressive side: it is entirely possible
565 that a function is called many times in a context where inlining
566 reduces code size and few times in a context where inlining increases
567 code size. The resulting growth estimate will be negative even if it
568 would make more sense to keep the offline copy and not inline into the
569 call sites that make the code size grow.
571 When badness orders the calls in a way that code reducing calls come
572 first, this situation is not a problem at all: after inlining all
573 "good" calls, we will realize that keeping the function around is
574 better. */
575 else if (growth <= MAX_INLINE_INSNS_SINGLE
576 /* Unlike for functions called once, we play it unsafe with
577 COMDATs. We can allow that since we know the functions
578 under consideration are small (and thus the risk is small) and
579 moreover the growth estimates already account for the fact that COMDAT
580 functions may or may not disappear when eliminated from
581 the current unit. With good probability, making the aggressive
582 choice in all units is going to make the overall program
583 smaller.
585 Consequently we ask cgraph_can_remove_if_no_direct_calls_p
586 instead of
587 cgraph_will_be_removed_from_program_if_no_direct_calls. */
588 && !DECL_EXTERNAL (callee->symbol.decl)
589 && cgraph_can_remove_if_no_direct_calls_p (callee)
590 && estimate_growth (callee) <= 0)
592 else if (!DECL_DECLARED_INLINE_P (callee->symbol.decl)
593 && !flag_inline_functions)
595 e->inline_failed = CIF_NOT_DECLARED_INLINED;
596 want_inline = false;
598 /* Apply the MAX_INLINE_INSNS_AUTO limit to functions not declared inline.
599 Upgrade it to MAX_INLINE_INSNS_SINGLE when hints suggest that
600 inlining the given function is very profitable. */
601 else if (!DECL_DECLARED_INLINE_P (callee->symbol.decl)
602 && !big_speedup
603 && growth >= ((hints & (INLINE_HINT_indirect_call
604 | INLINE_HINT_loop_iterations
605 | INLINE_HINT_array_index
606 | INLINE_HINT_loop_stride))
607 ? MAX (MAX_INLINE_INSNS_AUTO,
608 MAX_INLINE_INSNS_SINGLE)
609 : MAX_INLINE_INSNS_AUTO))
611 e->inline_failed = CIF_MAX_INLINE_INSNS_AUTO_LIMIT;
612 want_inline = false;
614 /* If call is cold, do not inline when function body would grow. */
615 else if (!cgraph_maybe_hot_edge_p (e))
617 e->inline_failed = CIF_UNLIKELY_CALL;
618 want_inline = false;
621 if (!want_inline && report)
622 report_inline_failed_reason (e);
623 return want_inline;
626 /* EDGE is a self-recursive edge.
627 We handle two cases - when function A is inlined into itself
628 or when function A is being inlined into another inlined copy of function
629 A within function B.
631 In the first case OUTER_NODE points to the toplevel copy of A, while
632 in the second case OUTER_NODE points to the outermost copy of A in B.
634 In both cases we want to be extra selective since
635 inlining the call will just cause new recursive calls to appear. */
637 static bool
638 want_inline_self_recursive_call_p (struct cgraph_edge *edge,
639 struct cgraph_node *outer_node,
640 bool peeling,
641 int depth)
643 char const *reason = NULL;
644 bool want_inline = true;
645 int caller_freq = CGRAPH_FREQ_BASE;
646 int max_depth = PARAM_VALUE (PARAM_MAX_INLINE_RECURSIVE_DEPTH_AUTO);
648 if (DECL_DECLARED_INLINE_P (edge->caller->symbol.decl))
649 max_depth = PARAM_VALUE (PARAM_MAX_INLINE_RECURSIVE_DEPTH);
651 if (!cgraph_maybe_hot_edge_p (edge))
653 reason = "recursive call is cold";
654 want_inline = false;
656 else if (max_count && !outer_node->count)
658 reason = "not executed in profile";
659 want_inline = false;
661 else if (depth > max_depth)
663 reason = "--param max-inline-recursive-depth exceeded.";
664 want_inline = false;
667 if (outer_node->global.inlined_to)
668 caller_freq = outer_node->callers->frequency;
670 if (!want_inline)
672 /* Inlining of a self-recursive function into a copy of itself within another function
673 is a transformation similar to loop peeling.
675 Peeling is profitable if we can inline enough copies to make the probability
676 of an actual call to the self-recursive function very small. Be sure that
677 the probability of recursion is small.
679 We ensure that the frequency of recursing is at most 1 - (1/max_depth).
680 This way the expected number of recursions is at most max_depth. */
681 else if (peeling)
683 int max_prob = CGRAPH_FREQ_BASE - ((CGRAPH_FREQ_BASE + max_depth - 1)
684 / max_depth);
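/* For illustration, with CGRAPH_FREQ_BASE of 1000 and max_depth of 8 this
gives max_prob = 1000 - 1007 / 8 = 875, i.e. roughly the intended
1 - 1/max_depth; the loop below then repeatedly squares this threshold for
each extra level of depth, so deeper copies require an ever smaller
recursion probability. */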
685 int i;
686 for (i = 1; i < depth; i++)
687 max_prob = max_prob * max_prob / CGRAPH_FREQ_BASE;
688 if (max_count
689 && (edge->count * CGRAPH_FREQ_BASE / outer_node->count
690 >= max_prob))
692 reason = "profile of recursive call is too large";
693 want_inline = false;
695 if (!max_count
696 && (edge->frequency * CGRAPH_FREQ_BASE / caller_freq
697 >= max_prob))
699 reason = "frequency of recursive call is too large";
700 want_inline = false;
703 /* Recursive inlining, i.e. the equivalent of unrolling, is profitable if the recursion
704 depth is large. We reduce function call overhead and increase the chances that
705 things fit in the hardware return predictor.
707 Recursive inlining might however increase the cost of stack frame setup,
708 actually slowing down functions whose recursion tree is wide rather than
709 deep.
711 Deciding reliably when to do recursive inlining without profile feedback
712 is tricky. For now we disable recursive inlining when the probability of self
713 recursion is low.
715 Recursive inlining of a self-recursive call within a loop also results in large loop
716 depths that generally optimize badly. We may want to throttle down inlining
717 in those cases. In particular this seems to happen in one of the libstdc++ rb tree
718 methods. */
719 else
721 if (max_count
722 && (edge->count * 100 / outer_node->count
723 <= PARAM_VALUE (PARAM_MIN_INLINE_RECURSIVE_PROBABILITY)))
725 reason = "profile of recursive call is too small";
726 want_inline = false;
728 else if (!max_count
729 && (edge->frequency * 100 / caller_freq
730 <= PARAM_VALUE (PARAM_MIN_INLINE_RECURSIVE_PROBABILITY)))
732 reason = "frequency of recursive call is too small";
733 want_inline = false;
736 if (!want_inline && dump_file)
737 fprintf (dump_file, " not inlining recursively: %s\n", reason);
738 return want_inline;
741 /* Return true when NODE has a caller other than EDGE.
742 Worker for cgraph_for_node_and_aliases. */
744 static bool
745 check_caller_edge (struct cgraph_node *node, void *edge)
747 return (node->callers
748 && node->callers != edge);
752 /* Decide if inlining NODE would reduce unit size by eliminating
753 the offline copy of the function.
754 When COLD is true, cold calls are considered too. */
756 static bool
757 want_inline_function_to_all_callers_p (struct cgraph_node *node, bool cold)
759 struct cgraph_node *function = cgraph_function_or_thunk_node (node, NULL);
760 struct cgraph_edge *e;
761 bool has_hot_call = false;
763 /* Does it have callers? */
764 if (!node->callers)
765 return false;
766 /* Already inlined? */
767 if (function->global.inlined_to)
768 return false;
769 if (cgraph_function_or_thunk_node (node, NULL) != node)
770 return false;
771 /* Inlining into all callers would increase size? */
772 if (estimate_growth (node) > 0)
773 return false;
774 /* Maybe other aliases have more direct calls. */
775 if (cgraph_for_node_and_aliases (node, check_caller_edge, node->callers, true))
776 return false;
777 /* All inlines must be possible. */
778 for (e = node->callers; e; e = e->next_caller)
780 if (!can_inline_edge_p (e, true))
781 return false;
782 if (!has_hot_call && cgraph_maybe_hot_edge_p (e))
783 has_hot_call = 1;
786 if (!cold && !has_hot_call)
787 return false;
788 return true;
791 #define RELATIVE_TIME_BENEFIT_RANGE (INT_MAX / 64)
793 /* Return the relative time improvement for inlining EDGE in the range
794 1...RELATIVE_TIME_BENEFIT_RANGE. */
796 static inline int
797 relative_time_benefit (struct inline_summary *callee_info,
798 struct cgraph_edge *edge,
799 int edge_time)
801 gcov_type relbenefit;
802 gcov_type uninlined_call_time = compute_uninlined_call_time (callee_info, edge);
803 gcov_type inlined_call_time = compute_inlined_call_time (edge, edge_time);
805 /* Inlining into extern inline function is not a win. */
806 if (DECL_EXTERNAL (edge->caller->global.inlined_to
807 ? edge->caller->global.inlined_to->symbol.decl
808 : edge->caller->symbol.decl))
809 return 1;
811 /* Watch overflows. */
812 gcc_checking_assert (uninlined_call_time >= 0);
813 gcc_checking_assert (inlined_call_time >= 0);
814 gcc_checking_assert (uninlined_call_time >= inlined_call_time);
816 /* Compute the relative time benefit, i.e. how much faster the call becomes.
817 ??? Perhaps computing how much the caller+callee together become faster
818 would lead to more realistic results. */
819 if (!uninlined_call_time)
820 uninlined_call_time = 1;
821 relbenefit =
822 RDIV (((gcov_type)uninlined_call_time - inlined_call_time) * RELATIVE_TIME_BENEFIT_RANGE,
823 uninlined_call_time);
824 relbenefit = MIN (relbenefit, RELATIVE_TIME_BENEFIT_RANGE);
825 gcc_checking_assert (relbenefit >= 0);
826 relbenefit = MAX (relbenefit, 1);
827 return relbenefit;
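/* For illustration: an uninlined call time of 1000 against an inlined time
of 800 yields a benefit of (1000 - 800) * RELATIVE_TIME_BENEFIT_RANGE / 1000,
i.e. one fifth of the full range; a call whose time does not improve at all
still gets the minimal benefit of 1. */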
831 /* A cost model driving the inlining heuristics in such a way that the edges with
832 the smallest badness are inlined first. After each inlining is performed
833 the costs of all caller edges of the nodes affected are recomputed so the
834 metrics may accurately depend on values such as the number of inlinable callers
835 of the function or the function body size. */
837 static int
838 edge_badness (struct cgraph_edge *edge, bool dump)
840 gcov_type badness;
841 int growth, edge_time;
842 struct cgraph_node *callee = cgraph_function_or_thunk_node (edge->callee,
843 NULL);
844 struct inline_summary *callee_info = inline_summary (callee);
845 inline_hints hints;
847 if (DECL_DISREGARD_INLINE_LIMITS (callee->symbol.decl))
848 return INT_MIN;
850 growth = estimate_edge_growth (edge);
851 edge_time = estimate_edge_time (edge);
852 hints = estimate_edge_hints (edge);
853 gcc_checking_assert (edge_time >= 0);
854 gcc_checking_assert (edge_time <= callee_info->time);
855 gcc_checking_assert (growth <= callee_info->size);
857 if (dump)
859 fprintf (dump_file, " Badness calculation for %s/%i -> %s/%i\n",
860 xstrdup (cgraph_node_name (edge->caller)),
861 edge->caller->symbol.order,
862 xstrdup (cgraph_node_name (callee)),
863 edge->callee->symbol.order);
864 fprintf (dump_file, " size growth %i, time %i ",
865 growth,
866 edge_time);
867 dump_inline_hints (dump_file, hints);
868 if (big_speedup_p (edge))
869 fprintf (dump_file, " big_speedup");
870 fprintf (dump_file, "\n");
873 /* Always prefer inlining saving code size. */
874 if (growth <= 0)
876 badness = INT_MIN / 2 + growth;
877 if (dump)
878 fprintf (dump_file, " %i: Growth %i <= 0\n", (int) badness,
879 growth);
882 /* When profiling is available, compute badness as:
884 relative_edge_count * relative_time_benefit
885 goodness = -------------------------------------------
886 growth_of_caller
887 badness = -goodness
889 The fraction is upside down, because for edge counts and time benefits
890 the bounds are known. Edge growth is essentially unlimited. */
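/* For illustration: an edge executed max_count times whose relative time
benefit is the full RELATIVE_TIME_BENEFIT_RANGE and whose growth is 1 gets
a badness of roughly INT_MIN / 2, the strongest profiled badness possible;
halving the relative count or the benefit, or doubling the growth, halves
the goodness. */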
892 else if (max_count)
894 int relbenefit = relative_time_benefit (callee_info, edge, edge_time);
895 badness =
896 ((int)
897 ((double) edge->count * INT_MIN / 2 / max_count / RELATIVE_TIME_BENEFIT_RANGE) *
898 relbenefit) / growth;
900 /* Be sure that insanity of the profile won't lead to increasing counts
901 in the scaling and thus to overflow in the computation above. */
902 gcc_assert (max_count >= edge->count);
903 if (dump)
905 fprintf (dump_file,
906 " %i (relative %f): profile info. Relative count %f"
907 " * Relative benefit %f\n",
908 (int) badness, (double) badness / INT_MIN,
909 (double) edge->count / max_count,
910 relbenefit * 100.0 / RELATIVE_TIME_BENEFIT_RANGE);
914 /* When the function local profile is available, compute badness as:
916 relative_time_benefit
917 goodness = ---------------------------------
918 growth_of_caller * overall_growth
920 badness = - goodness
922 compensated by the inline hints. */
924 else if (flag_guess_branch_prob)
926 badness = (relative_time_benefit (callee_info, edge, edge_time)
927 * (INT_MIN / 16 / RELATIVE_TIME_BENEFIT_RANGE));
928 badness /= (MIN (65536/2, growth) * MIN (65536/2, MAX (1, callee_info->growth)));
929 gcc_checking_assert (badness <=0 && badness >= INT_MIN / 16);
930 if ((hints & (INLINE_HINT_indirect_call
931 | INLINE_HINT_loop_iterations
932 | INLINE_HINT_array_index
933 | INLINE_HINT_loop_stride))
934 || callee_info->growth <= 0)
935 badness *= 8;
936 if (hints & (INLINE_HINT_same_scc))
937 badness /= 16;
938 else if (hints & (INLINE_HINT_in_scc))
939 badness /= 8;
940 else if (hints & (INLINE_HINT_cross_module))
941 badness /= 2;
942 gcc_checking_assert (badness <= 0 && badness >= INT_MIN / 2);
943 if ((hints & INLINE_HINT_declared_inline) && badness >= INT_MIN / 32)
944 badness *= 16;
945 if (dump)
947 fprintf (dump_file,
948 " %i: guessed profile. frequency %f,"
949 " benefit %f%%, time w/o inlining %i, time w inlining %i"
950 " overall growth %i (current) %i (original)\n",
951 (int) badness, (double)edge->frequency / CGRAPH_FREQ_BASE,
952 relative_time_benefit (callee_info, edge, edge_time) * 100.0
953 / RELATIVE_TIME_BENEFIT_RANGE,
954 (int)compute_uninlined_call_time (callee_info, edge),
955 (int)compute_inlined_call_time (edge, edge_time),
956 estimate_growth (callee),
957 callee_info->growth);
960 /* When the function local profile is not available or does not give
961 useful information (i.e. the frequency is zero), base the cost on
962 the loop nest and overall size growth, so we optimize for the overall number
963 of functions fully inlined in the program. */
964 else
966 int nest = MIN (inline_edge_summary (edge)->loop_depth, 8);
967 badness = growth * 256;
969 /* Decrease badness if call is nested. */
970 if (badness > 0)
971 badness >>= nest;
972 else
974 badness <<= nest;
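/* For example, a call that grows the caller by 10 insns at loop depth 2
gets badness (10 * 256) >> 2 == 640, while the same call at the top level
keeps badness 2560, so more deeply nested calls are inlined first. */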
976 if (dump)
977 fprintf (dump_file, " %i: no profile. nest %i\n", (int) badness,
978 nest);
981 /* Ensure that we did not overflow in all the fixed point math above. */
982 gcc_assert (badness >= INT_MIN);
983 gcc_assert (badness <= INT_MAX - 1);
984 /* Make recursive inlining always happen after other inlining is done. */
985 if (cgraph_edge_recursive_p (edge))
986 return badness + 1;
987 else
988 return badness;
991 /* Recompute badness of EDGE and update its key in HEAP if needed. */
992 static inline void
993 update_edge_key (fibheap_t heap, struct cgraph_edge *edge)
995 int badness = edge_badness (edge, false);
996 if (edge->aux)
998 fibnode_t n = (fibnode_t) edge->aux;
999 gcc_checking_assert (n->data == edge);
1001 /* fibheap_replace_key only decreases the keys.
1002 When we increase the key we do not update the heap
1003 and instead re-insert the element once it becomes
1004 the minimum of the heap. */
1005 if (badness < n->key)
1007 if (dump_file && (dump_flags & TDF_DETAILS))
1009 fprintf (dump_file,
1010 " decreasing badness %s/%i -> %s/%i, %i to %i\n",
1011 xstrdup (cgraph_node_name (edge->caller)),
1012 edge->caller->symbol.order,
1013 xstrdup (cgraph_node_name (edge->callee)),
1014 edge->callee->symbol.order,
1015 (int)n->key,
1016 badness);
1018 fibheap_replace_key (heap, n, badness);
1019 gcc_checking_assert (n->key == badness);
1022 else
1024 if (dump_file && (dump_flags & TDF_DETAILS))
1026 fprintf (dump_file,
1027 " enqueuing call %s/%i -> %s/%i, badness %i\n",
1028 xstrdup (cgraph_node_name (edge->caller)),
1029 edge->caller->symbol.order,
1030 xstrdup (cgraph_node_name (edge->callee)),
1031 edge->callee->symbol.order,
1032 badness);
1034 edge->aux = fibheap_insert (heap, badness, edge);
1039 /* NODE was inlined.
1040 All caller edges need to be reset because
1041 size estimates change. Similarly callees need to be reset
1042 because a better context may be known. */
1044 static void
1045 reset_edge_caches (struct cgraph_node *node)
1047 struct cgraph_edge *edge;
1048 struct cgraph_edge *e = node->callees;
1049 struct cgraph_node *where = node;
1050 int i;
1051 struct ipa_ref *ref;
1053 if (where->global.inlined_to)
1054 where = where->global.inlined_to;
1056 /* WHERE body size has changed, the cached growth is invalid. */
1057 reset_node_growth_cache (where);
1059 for (edge = where->callers; edge; edge = edge->next_caller)
1060 if (edge->inline_failed)
1061 reset_edge_growth_cache (edge);
1062 for (i = 0; ipa_ref_list_referring_iterate (&where->symbol.ref_list,
1063 i, ref); i++)
1064 if (ref->use == IPA_REF_ALIAS)
1065 reset_edge_caches (ipa_ref_referring_node (ref));
1067 if (!e)
1068 return;
1070 while (true)
1071 if (!e->inline_failed && e->callee->callees)
1072 e = e->callee->callees;
1073 else
1075 if (e->inline_failed)
1076 reset_edge_growth_cache (e);
1077 if (e->next_callee)
1078 e = e->next_callee;
1079 else
1083 if (e->caller == node)
1084 return;
1085 e = e->caller->callers;
1087 while (!e->next_callee);
1088 e = e->next_callee;
1093 /* Recompute HEAP nodes for each caller of NODE.
1094 UPDATED_NODES tracks nodes we have already visited, to avoid redundant work.
1095 When CHECK_INLINABLITY_FOR is set, re-check only for the specified edge whether
1096 it is inlinable. Otherwise check all edges. */
1098 static void
1099 update_caller_keys (fibheap_t heap, struct cgraph_node *node,
1100 bitmap updated_nodes,
1101 struct cgraph_edge *check_inlinablity_for)
1103 struct cgraph_edge *edge;
1104 int i;
1105 struct ipa_ref *ref;
1107 if ((!node->symbol.alias && !inline_summary (node)->inlinable)
1108 || node->global.inlined_to)
1109 return;
1110 if (!bitmap_set_bit (updated_nodes, node->uid))
1111 return;
1113 for (i = 0; ipa_ref_list_referring_iterate (&node->symbol.ref_list,
1114 i, ref); i++)
1115 if (ref->use == IPA_REF_ALIAS)
1117 struct cgraph_node *alias = ipa_ref_referring_node (ref);
1118 update_caller_keys (heap, alias, updated_nodes, check_inlinablity_for);
1121 for (edge = node->callers; edge; edge = edge->next_caller)
1122 if (edge->inline_failed)
1124 if (!check_inlinablity_for
1125 || check_inlinablity_for == edge)
1127 if (can_inline_edge_p (edge, false)
1128 && want_inline_small_function_p (edge, false))
1129 update_edge_key (heap, edge);
1130 else if (edge->aux)
1132 report_inline_failed_reason (edge);
1133 fibheap_delete_node (heap, (fibnode_t) edge->aux);
1134 edge->aux = NULL;
1137 else if (edge->aux)
1138 update_edge_key (heap, edge);
1142 /* Recompute HEAP nodes for each uninlined call in NODE.
1143 This is used when we know that edge badnesses are only going to increase
1144 (we introduced a new call site) and thus all we need is to insert the newly
1145 created edges into the heap. */
1147 static void
1148 update_callee_keys (fibheap_t heap, struct cgraph_node *node,
1149 bitmap updated_nodes)
1151 struct cgraph_edge *e = node->callees;
1153 if (!e)
1154 return;
1155 while (true)
1156 if (!e->inline_failed && e->callee->callees)
1157 e = e->callee->callees;
1158 else
1160 enum availability avail;
1161 struct cgraph_node *callee;
1162 /* We do not reset the callee growth cache here. Since we added a new call,
1163 growth could only have increased and consequently the badness metric
1164 does not need updating. */
1165 if (e->inline_failed
1166 && (callee = cgraph_function_or_thunk_node (e->callee, &avail))
1167 && inline_summary (callee)->inlinable
1168 && avail >= AVAIL_AVAILABLE
1169 && !bitmap_bit_p (updated_nodes, callee->uid))
1171 if (can_inline_edge_p (e, false)
1172 && want_inline_small_function_p (e, false))
1173 update_edge_key (heap, e);
1174 else if (e->aux)
1176 report_inline_failed_reason (e);
1177 fibheap_delete_node (heap, (fibnode_t) e->aux);
1178 e->aux = NULL;
1181 if (e->next_callee)
1182 e = e->next_callee;
1183 else
1187 if (e->caller == node)
1188 return;
1189 e = e->caller->callers;
1191 while (!e->next_callee);
1192 e = e->next_callee;
1197 /* Enqueue all recursive calls from NODE into the priority queue depending on
1198 how likely it is that we want to recursively inline the call. */
1200 static void
1201 lookup_recursive_calls (struct cgraph_node *node, struct cgraph_node *where,
1202 fibheap_t heap)
1204 struct cgraph_edge *e;
1205 enum availability avail;
1207 for (e = where->callees; e; e = e->next_callee)
1208 if (e->callee == node
1209 || (cgraph_function_or_thunk_node (e->callee, &avail) == node
1210 && avail > AVAIL_OVERWRITABLE))
1212 /* When profile feedback is available, prioritize by expected number
1213 of calls. */
1214 fibheap_insert (heap,
1215 !max_count ? -e->frequency
1216 : -(e->count / ((max_count + (1<<24) - 1) / (1<<24))),
1219 for (e = where->callees; e; e = e->next_callee)
1220 if (!e->inline_failed)
1221 lookup_recursive_calls (node, e->callee, heap);
1224 /* Decide on recursive inlining: in case the function has recursive calls,
1225 inline until the body size reaches the given limit. If any new indirect edges
1226 are discovered in the process, add them to *NEW_EDGES, unless NEW_EDGES
1227 is NULL. */
1229 static bool
1230 recursive_inlining (struct cgraph_edge *edge,
1231 vec<cgraph_edge_p> *new_edges)
1233 int limit = PARAM_VALUE (PARAM_MAX_INLINE_INSNS_RECURSIVE_AUTO);
1234 fibheap_t heap;
1235 struct cgraph_node *node;
1236 struct cgraph_edge *e;
1237 struct cgraph_node *master_clone = NULL, *next;
1238 int depth = 0;
1239 int n = 0;
1241 node = edge->caller;
1242 if (node->global.inlined_to)
1243 node = node->global.inlined_to;
1245 if (DECL_DECLARED_INLINE_P (node->symbol.decl))
1246 limit = PARAM_VALUE (PARAM_MAX_INLINE_INSNS_RECURSIVE);
1248 /* Make sure that function is small enough to be considered for inlining. */
1249 if (estimate_size_after_inlining (node, edge) >= limit)
1250 return false;
1251 heap = fibheap_new ();
1252 lookup_recursive_calls (node, node, heap);
1253 if (fibheap_empty (heap))
1255 fibheap_delete (heap);
1256 return false;
1259 if (dump_file)
1260 fprintf (dump_file,
1261 " Performing recursive inlining on %s\n",
1262 cgraph_node_name (node));
1264 /* Do the inlining and update the list of recursive calls during the process. */
1265 while (!fibheap_empty (heap))
1267 struct cgraph_edge *curr
1268 = (struct cgraph_edge *) fibheap_extract_min (heap);
1269 struct cgraph_node *cnode, *dest = curr->callee;
1271 if (!can_inline_edge_p (curr, true))
1272 continue;
1274 /* MASTER_CLONE is produced in the case we have already started modifying
1275 the function. Be sure to redirect the edge to the original body before
1276 estimating growth, otherwise we will be seeing growth after inlining
1277 the already modified body. */
1278 if (master_clone)
1280 cgraph_redirect_edge_callee (curr, master_clone);
1281 reset_edge_growth_cache (curr);
1284 if (estimate_size_after_inlining (node, curr) > limit)
1286 cgraph_redirect_edge_callee (curr, dest);
1287 reset_edge_growth_cache (curr);
1288 break;
1291 depth = 1;
1292 for (cnode = curr->caller;
1293 cnode->global.inlined_to; cnode = cnode->callers->caller)
1294 if (node->symbol.decl
1295 == cgraph_function_or_thunk_node (curr->callee, NULL)->symbol.decl)
1296 depth++;
1298 if (!want_inline_self_recursive_call_p (curr, node, false, depth))
1300 cgraph_redirect_edge_callee (curr, dest);
1301 reset_edge_growth_cache (curr);
1302 continue;
1305 if (dump_file)
1307 fprintf (dump_file,
1308 " Inlining call of depth %i", depth);
1309 if (node->count)
1311 fprintf (dump_file, " called approx. %.2f times per call",
1312 (double)curr->count / node->count);
1314 fprintf (dump_file, "\n");
1316 if (!master_clone)
1318 /* We need original clone to copy around. */
1319 master_clone = cgraph_clone_node (node, node->symbol.decl,
1320 node->count, CGRAPH_FREQ_BASE,
1321 false, vNULL, true, NULL);
1322 for (e = master_clone->callees; e; e = e->next_callee)
1323 if (!e->inline_failed)
1324 clone_inlined_nodes (e, true, false, NULL);
1325 cgraph_redirect_edge_callee (curr, master_clone);
1326 reset_edge_growth_cache (curr);
1329 inline_call (curr, false, new_edges, &overall_size, true);
1330 lookup_recursive_calls (node, curr->callee, heap);
1331 n++;
1334 if (!fibheap_empty (heap) && dump_file)
1335 fprintf (dump_file, " Recursive inlining growth limit met.\n");
1336 fibheap_delete (heap);
1338 if (!master_clone)
1339 return false;
1341 if (dump_file)
1342 fprintf (dump_file,
1343 "\n Inlined %i times, "
1344 "body grown from size %i to %i, time %i to %i\n", n,
1345 inline_summary (master_clone)->size, inline_summary (node)->size,
1346 inline_summary (master_clone)->time, inline_summary (node)->time);
1348 /* Remove the master clone we used for inlining. We rely on the fact that clones inlined
1349 into the master clone get queued just before the master clone, so we don't
1350 need recursion. */
1351 for (node = cgraph_first_function (); node != master_clone;
1352 node = next)
1354 next = cgraph_next_function (node);
1355 if (node->global.inlined_to == master_clone)
1356 cgraph_remove_node (node);
1358 cgraph_remove_node (master_clone);
1359 return true;
1363 /* Given whole compilation unit estimate of INSNS, compute how large we can
1364 allow the unit to grow. */
1366 static int
1367 compute_max_insns (int insns)
1369 int max_insns = insns;
1370 if (max_insns < PARAM_VALUE (PARAM_LARGE_UNIT_INSNS))
1371 max_insns = PARAM_VALUE (PARAM_LARGE_UNIT_INSNS);
1373 return ((HOST_WIDEST_INT) max_insns
1374 * (100 + PARAM_VALUE (PARAM_INLINE_UNIT_GROWTH)) / 100);
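/* For illustration, assuming --param inline-unit-growth=30: a unit of
10000 insns may grow to 10000 * (100 + 30) / 100 = 13000 insns; units
smaller than --param large-unit-insns are first rounded up to that value,
so tiny units get proportionally more headroom. */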
1378 /* Compute badness of all edges in NEW_EDGES and add them to the HEAP. */
1380 static void
1381 add_new_edges_to_heap (fibheap_t heap, vec<cgraph_edge_p> new_edges)
1383 while (new_edges.length () > 0)
1385 struct cgraph_edge *edge = new_edges.pop ();
1387 gcc_assert (!edge->aux);
1388 if (edge->inline_failed
1389 && can_inline_edge_p (edge, true)
1390 && want_inline_small_function_p (edge, true))
1391 edge->aux = fibheap_insert (heap, edge_badness (edge, false), edge);
1395 /* Remove EDGE from the fibheap. */
1397 static void
1398 heap_edge_removal_hook (struct cgraph_edge *e, void *data)
1400 if (e->aux)
1402 fibheap_delete_node ((fibheap_t)data, (fibnode_t)e->aux);
1403 e->aux = NULL;
1407 /* Return true if speculation of edge E seems useful.
1408 If ANTICIPATE_INLINING is true, be conservative and hope that E
1409 may get inlined. */
1411 bool
1412 speculation_useful_p (struct cgraph_edge *e, bool anticipate_inlining)
1414 enum availability avail;
1415 struct cgraph_node *target = cgraph_function_or_thunk_node (e->callee, &avail);
1416 struct cgraph_edge *direct, *indirect;
1417 struct ipa_ref *ref;
1419 gcc_assert (e->speculative && !e->indirect_unknown_callee);
1421 if (!cgraph_maybe_hot_edge_p (e))
1422 return false;
1424 /* See if IP optimizations found something potentially useful about the
1425 function. For now we look only for CONST/PURE flags. Almost everything
1426 else we propagate is useless. */
1427 if (avail >= AVAIL_AVAILABLE)
1429 int ecf_flags = flags_from_decl_or_type (target->symbol.decl);
1430 if (ecf_flags & ECF_CONST)
1432 cgraph_speculative_call_info (e, direct, indirect, ref);
1433 if (!(indirect->indirect_info->ecf_flags & ECF_CONST))
1434 return true;
1436 else if (ecf_flags & ECF_PURE)
1438 cgraph_speculative_call_info (e, direct, indirect, ref);
1439 if (!(indirect->indirect_info->ecf_flags & ECF_PURE))
1440 return true;
1443 /* If we did not manage to inline the function nor redirect
1444 to an ipa-cp clone (these are seen by having the local flag set),
1445 it is probably pointless to inline it unless the hardware is missing an
1446 indirect call predictor. */
1447 if (!anticipate_inlining && e->inline_failed && !target->local.local)
1448 return false;
1449 /* For overwritable targets there is not much to do. */
1450 if (e->inline_failed && !can_inline_edge_p (e, false, true))
1451 return false;
1452 /* OK, speculation seems interesting. */
1453 return true;
1456 /* We know that EDGE is not going to be inlined.
1457 See if we can remove speculation. */
1459 static void
1460 resolve_noninline_speculation (fibheap_t edge_heap, struct cgraph_edge *edge)
1462 if (edge->speculative && !speculation_useful_p (edge, false))
1464 struct cgraph_node *node = edge->caller;
1465 struct cgraph_node *where = node->global.inlined_to
1466 ? node->global.inlined_to : node;
1467 bitmap updated_nodes = BITMAP_ALLOC (NULL);
1469 cgraph_resolve_speculation (edge, NULL);
1470 reset_node_growth_cache (where);
1471 reset_edge_caches (where);
1472 inline_update_overall_summary (where);
1473 update_caller_keys (edge_heap, where,
1474 updated_nodes, NULL);
1475 reset_node_growth_cache (where);
1476 BITMAP_FREE (updated_nodes);
1480 /* We use a greedy algorithm for inlining small functions:
1481 all inline candidates are put into a prioritized heap ordered by
1482 increasing badness.
1484 The inlining of small functions is bounded by the unit growth parameters. */
1486 static void
1487 inline_small_functions (void)
1489 struct cgraph_node *node;
1490 struct cgraph_edge *edge;
1491 fibheap_t edge_heap = fibheap_new ();
1492 bitmap updated_nodes = BITMAP_ALLOC (NULL);
1493 int min_size, max_size;
1494 vec<cgraph_edge_p> new_indirect_edges = vNULL;
1495 int initial_size = 0;
1496 struct cgraph_node **order = XCNEWVEC (struct cgraph_node *, cgraph_n_nodes);
1497 struct cgraph_edge_hook_list *edge_removal_hook_holder;
1499 if (flag_indirect_inlining)
1500 new_indirect_edges.create (8);
1502 edge_removal_hook_holder
1503 = cgraph_add_edge_removal_hook (&heap_edge_removal_hook, edge_heap);
1505 /* Compute overall unit size and other global parameters used by badness
1506 metrics. */
1508 max_count = 0;
1509 ipa_reduced_postorder (order, true, true, NULL);
1510 free (order);
1512 FOR_EACH_DEFINED_FUNCTION (node)
1513 if (!node->global.inlined_to)
1515 if (cgraph_function_with_gimple_body_p (node)
1516 || node->thunk.thunk_p)
1518 struct inline_summary *info = inline_summary (node);
1519 struct ipa_dfs_info *dfs = (struct ipa_dfs_info *) node->symbol.aux;
1521 if (!DECL_EXTERNAL (node->symbol.decl))
1522 initial_size += info->size;
1523 info->growth = estimate_growth (node);
1524 if (dfs && dfs->next_cycle)
1526 struct cgraph_node *n2;
1527 int id = dfs->scc_no + 1;
1528 for (n2 = node; n2;
1529 n2 = ((struct ipa_dfs_info *) node->symbol.aux)->next_cycle)
1531 struct inline_summary *info2 = inline_summary (n2);
1532 if (info2->scc_no)
1533 break;
1534 info2->scc_no = id;
1539 for (edge = node->callers; edge; edge = edge->next_caller)
1540 if (max_count < edge->count)
1541 max_count = edge->count;
1543 ipa_free_postorder_info ();
1544 initialize_growth_caches ();
1546 if (dump_file)
1547 fprintf (dump_file,
1548 "\nDeciding on inlining of small functions. Starting with size %i.\n",
1549 initial_size);
1551 overall_size = initial_size;
1552 max_size = compute_max_insns (overall_size);
1553 min_size = overall_size;
1555 /* Populate the heap with all edges we might inline. */
1557 FOR_EACH_DEFINED_FUNCTION (node)
1559 bool update = false;
1560 struct cgraph_edge *next;
1562 if (dump_file)
1563 fprintf (dump_file, "Enqueueing calls in %s/%i.\n",
1564 cgraph_node_name (node), node->symbol.order);
1566 for (edge = node->callees; edge; edge = next)
1568 next = edge->next_callee;
1569 if (edge->inline_failed
1570 && !edge->aux
1571 && can_inline_edge_p (edge, true)
1572 && want_inline_small_function_p (edge, true)
1573 && edge->inline_failed)
1575 gcc_assert (!edge->aux);
1576 update_edge_key (edge_heap, edge);
1578 if (edge->speculative && !speculation_useful_p (edge, edge->aux != NULL))
1580 cgraph_resolve_speculation (edge, NULL);
1581 update = true;
1584 if (update)
1586 struct cgraph_node *where = node->global.inlined_to
1587 ? node->global.inlined_to : node;
1588 inline_update_overall_summary (where);
1589 reset_node_growth_cache (where);
1590 reset_edge_caches (where);
1591 update_caller_keys (edge_heap, where,
1592 updated_nodes, NULL);
1593 bitmap_clear (updated_nodes);
1597 gcc_assert (in_lto_p
1598 || !max_count
1599 || (profile_info && flag_branch_probabilities));
1601 while (!fibheap_empty (edge_heap))
1603 int old_size = overall_size;
1604 struct cgraph_node *where, *callee;
1605 int badness = fibheap_min_key (edge_heap);
1606 int current_badness;
1607 int cached_badness;
1608 int growth;
1610 edge = (struct cgraph_edge *) fibheap_extract_min (edge_heap);
1611 gcc_assert (edge->aux);
1612 edge->aux = NULL;
1613 if (!edge->inline_failed)
1614 continue;
1616 /* Be sure that the caches are kept consistent.
1617 We cannot make this ENABLE_CHECKING only because it causes different
1618 updates of the fibheap queue. */
1619 cached_badness = edge_badness (edge, false);
1620 reset_edge_growth_cache (edge);
1621 reset_node_growth_cache (edge->callee);
1623 /* When updating the edge costs, we only decrease badness in the keys.
1624 Increases of badness are handled lazily; when we see a key with an
1625 out-of-date value on it, we re-insert it now. */
1626 current_badness = edge_badness (edge, false);
1627 gcc_assert (cached_badness == current_badness);
1628 gcc_assert (current_badness >= badness);
1629 if (current_badness != badness)
1631 edge->aux = fibheap_insert (edge_heap, current_badness, edge);
1632 continue;
1635 if (!can_inline_edge_p (edge, true))
1637 resolve_noninline_speculation (edge_heap, edge);
1638 continue;
1641 callee = cgraph_function_or_thunk_node (edge->callee, NULL);
1642 growth = estimate_edge_growth (edge);
1643 if (dump_file)
1645 fprintf (dump_file,
1646 "\nConsidering %s/%i with %i size\n",
1647 cgraph_node_name (callee), callee->symbol.order,
1648 inline_summary (callee)->size);
1649 fprintf (dump_file,
1650 " to be inlined into %s/%i in %s:%i\n"
1651 " Estimated growth after inlined into all is %+i insns.\n"
1652 " Estimated badness is %i, frequency %.2f.\n",
1653 cgraph_node_name (edge->caller), edge->caller->symbol.order,
1654 flag_wpa ? "unknown"
1655 : gimple_filename ((const_gimple) edge->call_stmt),
1656 flag_wpa ? -1
1657 : gimple_lineno ((const_gimple) edge->call_stmt),
1658 estimate_growth (callee),
1659 badness,
1660 edge->frequency / (double)CGRAPH_FREQ_BASE);
1661 if (edge->count)
1662 fprintf (dump_file," Called "HOST_WIDEST_INT_PRINT_DEC"x\n",
1663 edge->count);
1664 if (dump_flags & TDF_DETAILS)
1665 edge_badness (edge, true);
1668 if (overall_size + growth > max_size
1669 && !DECL_DISREGARD_INLINE_LIMITS (callee->symbol.decl))
1671 edge->inline_failed = CIF_INLINE_UNIT_GROWTH_LIMIT;
1672 report_inline_failed_reason (edge);
1673 resolve_noninline_speculation (edge_heap, edge);
1674 continue;
1677 if (!want_inline_small_function_p (edge, true))
1679 resolve_noninline_speculation (edge_heap, edge);
1680 continue;
1683 /* Heuristics for inlining small functions work poorly for
1684 recursive calls, where we produce an effect similar to loop unrolling.
1685 When inlining such an edge seems profitable, leave the decision to the
1686 special purpose recursive inliner. */
1687 if (cgraph_edge_recursive_p (edge))
1689 where = edge->caller;
1690 if (where->global.inlined_to)
1691 where = where->global.inlined_to;
1692 if (!recursive_inlining (edge,
1693 flag_indirect_inlining
1694 ? &new_indirect_edges : NULL))
1696 edge->inline_failed = CIF_RECURSIVE_INLINING;
1697 resolve_noninline_speculation (edge_heap, edge);
1698 continue;
1700 reset_edge_caches (where);
1701 /* Recursive inliner inlines all recursive calls of the function
1702 at once. Consequently we need to update all callee keys. */
1703 if (flag_indirect_inlining)
1704 add_new_edges_to_heap (edge_heap, new_indirect_edges);
1705 update_callee_keys (edge_heap, where, updated_nodes);
1706 bitmap_clear (updated_nodes);
1708 else
1710 struct cgraph_node *outer_node = NULL;
1711 int depth = 0;
1713 /* Consider the case where the self-recursive function A is inlined into B.
1714 This is a desired optimization in some cases, since it leads to an effect
1715 similar to loop peeling and we might completely optimize out the
1716 recursive call. However we must be extra selective. */
1718 where = edge->caller;
1719 while (where->global.inlined_to)
1721 if (where->symbol.decl == callee->symbol.decl)
1722 outer_node = where, depth++;
1723 where = where->callers->caller;
1725 if (outer_node
1726 && !want_inline_self_recursive_call_p (edge, outer_node,
1727 true, depth))
1729 edge->inline_failed
1730 = (DECL_DISREGARD_INLINE_LIMITS (edge->callee->symbol.decl)
1731 ? CIF_RECURSIVE_INLINING : CIF_UNSPECIFIED);
1732 resolve_noninline_speculation (edge_heap, edge);
1733 continue;
1735 else if (depth && dump_file)
1736 fprintf (dump_file, " Peeling recursion with depth %i\n", depth);
1738 gcc_checking_assert (!callee->global.inlined_to);
1739 inline_call (edge, true, &new_indirect_edges, &overall_size, true);
1740 if (flag_indirect_inlining)
1741 add_new_edges_to_heap (edge_heap, new_indirect_edges);
1743 reset_edge_caches (edge->callee);
1744 reset_node_growth_cache (callee);
1746 update_callee_keys (edge_heap, where, updated_nodes);
1748 where = edge->caller;
1749 if (where->global.inlined_to)
1750 where = where->global.inlined_to;
1752 /* Our profitability metric can depend on local properties
1753 such as the number of inlinable calls and the size of the function body.
1754 After inlining, these properties might change for the function we
1755 inlined into (since its body size changed) and for the functions
1756 called by the function we inlined (since the number of their inlinable callers
1757 might change). */
1758 update_caller_keys (edge_heap, where, updated_nodes, NULL);
1759 bitmap_clear (updated_nodes);
1761 if (dump_file)
1763 fprintf (dump_file,
1764 " Inlined into %s which now has time %i and size %i,"
1765 "net change of %+i.\n",
1766 cgraph_node_name (edge->caller),
1767 inline_summary (edge->caller)->time,
1768 inline_summary (edge->caller)->size,
1769 overall_size - old_size);
1771 if (min_size > overall_size)
1773 min_size = overall_size;
1774 max_size = compute_max_insns (min_size);
1776 if (dump_file)
1777 fprintf (dump_file, "New minimal size reached: %i\n", min_size);
1781 free_growth_caches ();
1782 new_indirect_edges.release ();
1783 fibheap_delete (edge_heap);
1784 if (dump_file)
1785 fprintf (dump_file,
1786 "Unit growth for small function inlining: %i->%i (%i%%)\n",
1787 initial_size, overall_size,
1788 initial_size ? overall_size * 100 / initial_size - 100 : 0);
1789 BITMAP_FREE (updated_nodes);
1790 cgraph_remove_edge_removal_hook (edge_removal_hook_holder);
1793 /* Flatten NODE. Performed both during early inlining and
1794 at IPA inlining time. */
1796 static void
1797 flatten_function (struct cgraph_node *node, bool early)
1799 struct cgraph_edge *e;
1801 /* We shouldn't be called recursively when we are being processed. */
1802 gcc_assert (node->symbol.aux == NULL);
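/* Mark the node as being flattened by pointing its aux field at
   itself; callees whose aux is already set are part of a cycle. */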
1804 node->symbol.aux = (void *) node;
1806 for (e = node->callees; e; e = e->next_callee)
1808 struct cgraph_node *orig_callee;
1809 struct cgraph_node *callee = cgraph_function_or_thunk_node (e->callee, NULL);
1811 /* Have we hit a cycle? If so, it is time to give up. */
1812 if (callee->symbol.aux)
1814 if (dump_file)
1815 fprintf (dump_file,
1816 "Not inlining %s into %s to avoid cycle.\n",
1817 xstrdup (cgraph_node_name (callee)),
1818 xstrdup (cgraph_node_name (e->caller)));
1819 e->inline_failed = CIF_RECURSIVE_INLINING;
1820 continue;
1823 /* When the edge is already inlined, we just need to recurse into
1824 it in order to fully flatten the leaves. */
1825 if (!e->inline_failed)
1827 flatten_function (callee, early);
1828 continue;
1831 /* The flatten attribute needs to be processed during late inlining. For
1832 extra code quality, however, we also do flattening during early
1833 optimization. */
1834 if (!early
1835 ? !can_inline_edge_p (e, true)
1836 : !can_early_inline_edge_p (e))
1837 continue;
1839 if (cgraph_edge_recursive_p (e))
1841 if (dump_file)
1842 fprintf (dump_file, "Not inlining: recursive call.\n");
1843 continue;
1846 if (gimple_in_ssa_p (DECL_STRUCT_FUNCTION (node->symbol.decl))
1847 != gimple_in_ssa_p (DECL_STRUCT_FUNCTION (callee->symbol.decl)))
1849 if (dump_file)
1850 fprintf (dump_file, "Not inlining: SSA form does not match.\n");
1851 continue;
1854 /* Inline the edge and flatten the inline clone. Avoid
1855 recursing through the original node if the node was cloned. */
1856 if (dump_file)
1857 fprintf (dump_file, " Inlining %s into %s.\n",
1858 xstrdup (cgraph_node_name (callee)),
1859 xstrdup (cgraph_node_name (e->caller)));
1860 orig_callee = callee;
1861 inline_call (e, true, NULL, NULL, false);
1862 if (e->callee != orig_callee)
1863 orig_callee->symbol.aux = (void *) node;
1864 flatten_function (e->callee, early);
1865 if (e->callee != orig_callee)
1866 orig_callee->symbol.aux = NULL;
1869 node->symbol.aux = NULL;
1870 if (!node->global.inlined_to)
1871 inline_update_overall_summary (node);
1874 /* Decide on the inlining. We do so in topological order to avoid
1875 the expense of updating data structures. */
1877 static unsigned int
1878 ipa_inline (void)
1880 struct cgraph_node *node;
1881 int nnodes;
1882 struct cgraph_node **order =
1883 XCNEWVEC (struct cgraph_node *, cgraph_n_nodes);
1884 int i;
1885 int cold;
1887 if (in_lto_p && optimize)
1888 ipa_update_after_lto_read ();
1890 if (dump_file)
1891 dump_inline_summaries (dump_file);
1893 nnodes = ipa_reverse_postorder (order);
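/* flatten_function reuses the aux field as an "in progress" marker,
   so clear it on every function before the flattening walk. */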
1895 FOR_EACH_FUNCTION (node)
1896 node->symbol.aux = 0;
1898 if (dump_file)
1899 fprintf (dump_file, "\nFlattening functions:\n");
1901 /* In the first pass handle functions to be flattened. Do this with
1902 a priority so none of our later choices will make this impossible. */
1903 for (i = nnodes - 1; i >= 0; i--)
1905 node = order[i];
1907 /* Handle nodes to be flattened.
1908 Ideally, when processing callees, we would stop inlining at the
1909 entry of cycles, possibly cloning that entry point and trying
1910 to flatten it, turning it into a self-recursive
1911 function. */
1912 if (lookup_attribute ("flatten",
1913 DECL_ATTRIBUTES (node->symbol.decl)) != NULL)
1915 if (dump_file)
1916 fprintf (dump_file,
1917 "Flattening %s\n", cgraph_node_name (node));
1918 flatten_function (node, false);
1922 inline_small_functions ();
1924 /* Do the first after-inlining removal. We want to remove all "stale" extern
1925 inline functions and virtual functions so we really know what is called once. */
1926 symtab_remove_unreachable_nodes (false, dump_file);
1927 free (order);
1929 /* Inline functions with the property that, after inlining into all callers,
1930 the code size will shrink because the out-of-line copy is eliminated.
1931 We do this regardless of the callee size as long as function growth limits
1932 are met. */
1933 if (dump_file)
1934 fprintf (dump_file,
1935 "\nDeciding on functions to be inlined into all callers and removing useless speculations:\n");
1937 /* Inlining one function called once has a good chance of preventing
1938 inlining of another function into the same callee. Ideally we should
1939 work in priority order, but inlining hot functions first is probably
1940 a good cut without the extra pain of maintaining the queue.
1942 ??? This does not really fit the bill perfectly: inlining a function
1943 into a callee often leads to better optimization of the callee due to
1944 increased context for optimization.
1945 For example, if main() calls a function that outputs help
1946 and then a function that does the main optimization, we should inline
1947 the second with priority even if both calls are cold by themselves.
1949 We probably want to implement a new predicate replacing our use of
1950 maybe_hot_edge, interpreted as maybe_hot_edge || callee is known
1951 to be hot. */
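/* Per the note above, make two passes: first consider only functions
   whose calls are not all cold, then allow the cold ones as well. */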
1952 for (cold = 0; cold <= 1; cold ++)
1954 FOR_EACH_DEFINED_FUNCTION (node)
1956 struct cgraph_edge *edge, *next;
1957 bool update = false;
1959 for (edge = node->callees; edge; edge = next)
1961 next = edge->next_callee;
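/* Speculative edges that no longer look profitable are resolved
   back to their original indirect form. */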
1962 if (edge->speculative && !speculation_useful_p (edge, false))
1964 cgraph_resolve_speculation (edge, NULL);
1965 update = true;
1968 if (update)
1970 struct cgraph_node *where = node->global.inlined_to
1971 ? node->global.inlined_to : node;
1972 reset_node_growth_cache (where);
1973 reset_edge_caches (where);
1974 inline_update_overall_summary (where);
1976 if (flag_inline_functions_called_once
1977 && want_inline_function_to_all_callers_p (node, cold))
1979 int num_calls = 0;
1980 struct cgraph_edge *e;
1981 for (e = node->callers; e; e = e->next_caller)
1982 num_calls++;
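/* Count the callers known now; if inlining uncovers more calls than
   that, new edges have appeared and we stop rather than keep looping. */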
1983 while (node->callers && !node->global.inlined_to)
1985 struct cgraph_node *caller = node->callers->caller;
1987 if (dump_file)
1989 fprintf (dump_file,
1990 "\nInlining %s size %i.\n",
1991 cgraph_node_name (node),
1992 inline_summary (node)->size);
1993 fprintf (dump_file,
1994 " Called once from %s %i insns.\n",
1995 cgraph_node_name (node->callers->caller),
1996 inline_summary (node->callers->caller)->size);
1999 inline_call (node->callers, true, NULL, NULL, true);
2000 if (dump_file)
2001 fprintf (dump_file,
2002 " Inlined into %s which now has %i size\n",
2003 cgraph_node_name (caller),
2004 inline_summary (caller)->size);
2005 if (!num_calls--)
2007 if (dump_file)
2008 fprintf (dump_file, "New calls found; giving up.\n");
2009 break;
2016 /* Free ipa-prop structures if they are no longer needed. */
2017 if (optimize)
2018 ipa_free_all_structures_after_iinln ();
2020 if (dump_file)
2021 fprintf (dump_file,
2022 "\nInlined %i calls, eliminated %i functions\n\n",
2023 ncalls_inlined, nfunctions_inlined);
2025 if (dump_file)
2026 dump_inline_summaries (dump_file);
2027 /* In WPA we use inline summaries for the partitioning process. */
2028 if (!flag_wpa)
2029 inline_free_summary ();
2030 return 0;
2033 /* Inline always-inline function calls in NODE. */
2035 static bool
2036 inline_always_inline_functions (struct cgraph_node *node)
2038 struct cgraph_edge *e;
2039 bool inlined = false;
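/* Walk the direct callees and inline those that disregard inline
   limits, i.e. the always-inline ones. */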
2041 for (e = node->callees; e; e = e->next_callee)
2043 struct cgraph_node *callee = cgraph_function_or_thunk_node (e->callee, NULL);
2044 if (!DECL_DISREGARD_INLINE_LIMITS (callee->symbol.decl))
2045 continue;
2047 if (cgraph_edge_recursive_p (e))
2049 if (dump_file)
2050 fprintf (dump_file, " Not inlining recursive call to %s.\n",
2051 cgraph_node_name (e->callee));
2052 e->inline_failed = CIF_RECURSIVE_INLINING;
2053 continue;
2056 if (!can_early_inline_edge_p (e))
2058 /* Set inlined to true if the callee is marked "always_inline" but
2059 is not inlinable. This will allow flagging an error later in
2060 expand_call_inline in tree-inline.c. */
2061 if (lookup_attribute ("always_inline",
2062 DECL_ATTRIBUTES (callee->symbol.decl)) != NULL)
2063 inlined = true;
2064 continue;
2067 if (dump_file)
2068 fprintf (dump_file, " Inlining %s into %s (always_inline).\n",
2069 xstrdup (cgraph_node_name (e->callee)),
2070 xstrdup (cgraph_node_name (e->caller)));
2071 inline_call (e, true, NULL, NULL, false);
2072 inlined = true;
2074 if (inlined)
2075 inline_update_overall_summary (node);
2077 return inlined;
2080 /* Decide on the early inlining of small functions. We do so in topological
2081 order to avoid the expense of updating data structures. */
2083 static bool
2084 early_inline_small_functions (struct cgraph_node *node)
2086 struct cgraph_edge *e;
2087 bool inlined = false;
2089 for (e = node->callees; e; e = e->next_callee)
2091 struct cgraph_node *callee = cgraph_function_or_thunk_node (e->callee, NULL);
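/* Skip callees the analysis found uninlinable and edges that have
   already been inlined. */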
2092 if (!inline_summary (callee)->inlinable
2093 || !e->inline_failed)
2094 continue;
2096 /* Do not consider functions not declared inline. */
2097 if (!DECL_DECLARED_INLINE_P (callee->symbol.decl)
2098 && !flag_inline_small_functions
2099 && !flag_inline_functions)
2100 continue;
2102 if (dump_file)
2103 fprintf (dump_file, "Considering inline candidate %s.\n",
2104 cgraph_node_name (callee));
2106 if (!can_early_inline_edge_p (e))
2107 continue;
2109 if (cgraph_edge_recursive_p (e))
2111 if (dump_file)
2112 fprintf (dump_file, " Not inlining: recursive call.\n");
2113 continue;
2116 if (!want_early_inline_function_p (e))
2117 continue;
2119 if (dump_file)
2120 fprintf (dump_file, " Inlining %s into %s.\n",
2121 xstrdup (cgraph_node_name (callee)),
2122 xstrdup (cgraph_node_name (e->caller)));
2123 inline_call (e, true, NULL, NULL, true);
2124 inlined = true;
2127 return inlined;
2130 /* Do inlining of small functions. Doing so early helps profiling and other
2131 passes to be somewhat more effective and avoids some code duplication in
2132 the later real inlining pass for testcases with very many function calls. */
2133 static unsigned int
2134 early_inliner (void)
2136 struct cgraph_node *node = cgraph_get_node (current_function_decl);
2137 struct cgraph_edge *edge;
2138 unsigned int todo = 0;
2139 int iterations = 0;
2140 bool inlined = false;
2142 if (seen_error ())
2143 return 0;
2145 /* Do nothing if data structures for the IPA inliner are already computed.
2146 This happens when some pass decides to construct a new function and
2147 cgraph_add_new_function calls lowering passes and early optimization on
2148 it. This may confuse us when the early inliner decides to inline a call
2149 to a function clone, because function clones don't have a parameter list
2150 in ipa-prop matching their signature. */
2151 if (ipa_node_params_vector.exists ())
2152 return 0;
2154 #ifdef ENABLE_CHECKING
2155 verify_cgraph_node (node);
2156 #endif
2157 ipa_remove_all_references (&node->symbol.ref_list);
2159 /* Even when not optimizing or not inlining, inline always-inline
2160 functions. */
2161 inlined = inline_always_inline_functions (node);
2163 if (!optimize
2164 || flag_no_inline
2165 || !flag_early_inlining
2166 /* Never inline regular functions into always-inline functions
2167 during incremental inlining. This is unfortunate, as functions calling
2168 always-inline functions will get less optimized, but at the
2169 same time inlining functions that call an always-inline
2170 function into an always-inline function might introduce
2171 cycles of edges to be always inlined in the callgraph.
2173 We might want to be smarter and just avoid this type of inlining. */
2174 || DECL_DISREGARD_INLINE_LIMITS (node->symbol.decl))
2176 else if (lookup_attribute ("flatten",
2177 DECL_ATTRIBUTES (node->symbol.decl)) != NULL)
2179 /* When the function is marked to be flattened, recursively inline
2180 all calls in it. */
2181 if (dump_file)
2182 fprintf (dump_file,
2183 "Flattening %s\n", cgraph_node_name (node));
2184 flatten_function (node, true);
2185 inlined = true;
2187 else
2189 /* We iterate incremental inlining to get trivial cases of indirect
2190 inlining. */
2191 while (iterations < PARAM_VALUE (PARAM_EARLY_INLINER_MAX_ITERATIONS)
2192 && early_inline_small_functions (node))
2194 timevar_push (TV_INTEGRATION);
2195 todo |= optimize_inline_calls (current_function_decl);
2197 /* Technically we ought to recompute inline parameters so the new
2198 iteration of the early inliner works as expected. However, the
2199 values are approximately right, so we only need to update edge
2200 info that might be cleared out for newly discovered edges. */
2201 for (edge = node->callees; edge; edge = edge->next_callee)
2203 struct inline_edge_summary *es = inline_edge_summary (edge);
2204 es->call_stmt_size
2205 = estimate_num_insns (edge->call_stmt, &eni_size_weights);
2206 es->call_stmt_time
2207 = estimate_num_insns (edge->call_stmt, &eni_time_weights);
2208 if (edge->callee->symbol.decl
2209 && !gimple_check_call_matching_types (
2210 edge->call_stmt, edge->callee->symbol.decl, false))
2211 edge->call_stmt_cannot_inline_p = true;
2213 timevar_pop (TV_INTEGRATION);
2214 iterations++;
2215 inlined = false;
2217 if (dump_file)
2218 fprintf (dump_file, "Iterations: %i\n", iterations);
2221 if (inlined)
2223 timevar_push (TV_INTEGRATION);
2224 todo |= optimize_inline_calls (current_function_decl);
2225 timevar_pop (TV_INTEGRATION);
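/* Note that always-inline calls in this function have now been processed. */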
2228 cfun->always_inline_functions_inlined = true;
2230 return todo;
2233 namespace {
2235 const pass_data pass_data_early_inline =
2237 GIMPLE_PASS, /* type */
2238 "einline", /* name */
2239 OPTGROUP_INLINE, /* optinfo_flags */
2240 false, /* has_gate */
2241 true, /* has_execute */
2242 TV_EARLY_INLINING, /* tv_id */
2243 PROP_ssa, /* properties_required */
2244 0, /* properties_provided */
2245 0, /* properties_destroyed */
2246 0, /* todo_flags_start */
2247 0, /* todo_flags_finish */
2250 class pass_early_inline : public gimple_opt_pass
2252 public:
2253 pass_early_inline(gcc::context *ctxt)
2254 : gimple_opt_pass(pass_data_early_inline, ctxt)
2257 /* opt_pass methods: */
2258 unsigned int execute () { return early_inliner (); }
2260 }; // class pass_early_inline
2262 } // anon namespace
2264 gimple_opt_pass *
2265 make_pass_early_inline (gcc::context *ctxt)
2267 return new pass_early_inline (ctxt);
2271 /* When to run IPA inlining. Inlining of always-inline functions
2272 happens during early inlining.
2274 Enable inlining unconditionally at -flto. We need size estimates to
2275 drive partitioning. */
2277 static bool
2278 gate_ipa_inline (void)
2280 return optimize || flag_lto || flag_wpa;
2283 namespace {
2285 const pass_data pass_data_ipa_inline =
2287 IPA_PASS, /* type */
2288 "inline", /* name */
2289 OPTGROUP_INLINE, /* optinfo_flags */
2290 true, /* has_gate */
2291 true, /* has_execute */
2292 TV_IPA_INLINING, /* tv_id */
2293 0, /* properties_required */
2294 0, /* properties_provided */
2295 0, /* properties_destroyed */
2296 TODO_remove_functions, /* todo_flags_start */
2297 ( TODO_dump_symtab | TODO_remove_functions ), /* todo_flags_finish */
2300 class pass_ipa_inline : public ipa_opt_pass_d
2302 public:
2303 pass_ipa_inline(gcc::context *ctxt)
2304 : ipa_opt_pass_d(pass_data_ipa_inline, ctxt,
2305 inline_generate_summary, /* generate_summary */
2306 inline_write_summary, /* write_summary */
2307 inline_read_summary, /* read_summary */
2308 NULL, /* write_optimization_summary */
2309 NULL, /* read_optimization_summary */
2310 NULL, /* stmt_fixup */
2311 0, /* function_transform_todo_flags_start */
2312 inline_transform, /* function_transform */
2313 NULL) /* variable_transform */
2316 /* opt_pass methods: */
2317 bool gate () { return gate_ipa_inline (); }
2318 unsigned int execute () { return ipa_inline (); }
2320 }; // class pass_ipa_inline
2322 } // anon namespace
2324 ipa_opt_pass_d *
2325 make_pass_ipa_inline (gcc::context *ctxt)
2327 return new pass_ipa_inline (ctxt);