gcc/ipa-inline.c

   1 /* Inlining decision heuristics.
   2    Copyright (C) 2003, 2004 Free Software Foundation, Inc.
   3    Contributed by Jan Hubicka
   4
   5 This file is part of GCC.
   6
   7 GCC is free software; you can redistribute it and/or modify it under
   8 the terms of the GNU General Public License as published by the Free
   9 Software Foundation; either version 2, or (at your option) any later
  10 version.
  11
  12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  14 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  15 for more details.
  16
  17 You should have received a copy of the GNU General Public License
  18 along with GCC; see the file COPYING.  If not, write to the Free
  19 Software Foundation, 51 Franklin Street, Fifth Floor, Boston, MA
  20 02110-1301, USA.  */
  21
  22 /*  Inlining decision heuristics
  23
  24     We separate inlining decisions from the inliner itself and store it
  25     inside callgraph as so called inline plan.  Refer to cgraph.c
  26     documentation about particular representation of inline plans in the
  27     callgraph.
  28
  29     There are three major parts of this file:
  30
  31     cgraph_mark_inline implementation
  32
  33       This function allows to mark given call inline and performs necessary
  34       modifications of cgraph (production of the clones and updating overall
  35       statistics)
  36
  37     inlining heuristics limits
  38
  39       These functions allow to check that particular inlining is allowed
  40       by the limits specified by user (allowed function growth, overall unit
  41       growth and so on).
  42
  43     inlining heuristics
  44
  45       This is implementation of IPA pass aiming to get as much of benefit
  46       from inlining obeying the limits checked above.
  47
  48       The implementation of particular heuristics is separated from
  49       the rest of code to make it easier to replace it with more complicated
  50       implementation in the future.  The rest of inlining code acts as a
  51       library aimed to modify the callgraph and verify that the parameters
  52       on code size growth fits.
  53
  54       To mark given call inline, use cgraph_mark_inline function, the
  55       verification is performed by cgraph_default_inline_p and
  56       cgraph_check_inline_limits.
  57
  58       The heuristics implements simple knapsack style algorithm ordering
  59       all functions by their "profitability" (estimated by code size growth)
  60       and inlining them in priority order.
  61
  62       cgraph_decide_inlining implements heuristics taking whole callgraph
  63       into account, while cgraph_decide_inlining_incrementally considers
  64       only one function at a time and is used in non-unit-at-a-time mode.  */
  65
  66 #include "config.h"
  67 #include "system.h"
  68 #include "coretypes.h"
  69 #include "tm.h"
  70 #include "tree.h"
  71 #include "tree-inline.h"
  72 #include "langhooks.h"
  73 #include "flags.h"
  74 #include "cgraph.h"
  75 #include "diagnostic.h"
  76 #include "timevar.h"
  77 #include "params.h"
  78 #include "fibheap.h"
  79 #include "intl.h"
  80 #include "tree-pass.h"
  81 #include "hashtab.h"
  82 #include "coverage.h"
  83 #include "ggc.h"
  84
  85 /* Statistics we collect about inlining algorithm.  */
  86 static int ncalls_inlined;
  87 static int nfunctions_inlined;
  88 static int initial_insns;
  89 static int overall_insns;
  90 static int max_insns;
  91 static gcov_type max_count;
  92
  93 /* Estimate size of the function after inlining WHAT into TO.  */
  94
  95 static int
  96 cgraph_estimate_size_after_inlining (int times, struct cgraph_node *to,
  97                                      struct cgraph_node *what)
  98 {
  99   int size;
 100   tree fndecl = what->decl, arg;
 101   int call_insns = PARAM_VALUE (PARAM_INLINE_CALL_COST);
 102
 103   for (arg = DECL_ARGUMENTS (fndecl); arg; arg = TREE_CHAIN (arg))
 104     call_insns += estimate_move_cost (TREE_TYPE (arg));
 105   size = (what->global.insns - call_insns) * times + to->global.insns;
 106   gcc_assert (size >= 0);
 107   return size;
 108 }
 109
 110 /* E is expected to be an edge being inlined.  Clone destination node of
 111    the edge and redirect it to the new clone.
 112    DUPLICATE is used for bookkeeping on whether we are actually creating new
 113    clones or re-using node originally representing out-of-line function call.
 114    */
 115 void
 116 cgraph_clone_inlined_nodes (struct cgraph_edge *e, bool duplicate, bool update_original)
 117 {
 118   if (duplicate)
 119     {
 120       /* We may eliminate the need for out-of-line copy to be output.
 121          In that case just go ahead and re-use it.  */
 122       if (!e->callee->callers->next_caller
 123           && !e->callee->needed
 124           && flag_unit_at_a_time)
 125         {
 126           gcc_assert (!e->callee->global.inlined_to);
 127           if (DECL_SAVED_TREE (e->callee->decl))
 128             overall_insns -= e->callee->global.insns, nfunctions_inlined++;
 129           duplicate = false;
 130         }
 131       else
 132         {
 133           struct cgraph_node *n;
 134           n = cgraph_clone_node (e->callee, e->count, e->loop_nest,
 135                                  update_original);
 136           cgraph_redirect_edge_callee (e, n);
 137         }
 138     }
 139
 140   if (e->caller->global.inlined_to)
 141     e->callee->global.inlined_to = e->caller->global.inlined_to;
 142   else
 143     e->callee->global.inlined_to = e->caller;
 144
 145   /* Recursively clone all bodies.  */
 146   for (e = e->callee->callees; e; e = e->next_callee)
 147     if (!e->inline_failed)
 148       cgraph_clone_inlined_nodes (e, duplicate, update_original);
 149 }
 150
 151 /* Mark edge E as inlined and update callgraph accordingly.
 152    UPDATE_ORIGINAL specify whether profile of original function should be
 153    updated. */
 154
 155 void
 156 cgraph_mark_inline_edge (struct cgraph_edge *e, bool update_original)
 157 {
 158   int old_insns = 0, new_insns = 0;
 159   struct cgraph_node *to = NULL, *what;
 160
 161   if (e->callee->inline_decl)
 162     cgraph_redirect_edge_callee (e, cgraph_node (e->callee->inline_decl));
 163
 164   gcc_assert (e->inline_failed);
 165   e->inline_failed = NULL;
 166
 167   if (!e->callee->global.inlined && flag_unit_at_a_time)
 168     DECL_POSSIBLY_INLINED (e->callee->decl) = true;
 169   e->callee->global.inlined = true;
 170
 171   cgraph_clone_inlined_nodes (e, true, update_original);
 172
 173   what = e->callee;
 174
 175   /* Now update size of caller and all functions caller is inlined into.  */
 176   for (;e && !e->inline_failed; e = e->caller->callers)
 177     {
 178       old_insns = e->caller->global.insns;
 179       new_insns = cgraph_estimate_size_after_inlining (1, e->caller,
 180                                                        what);
 181       gcc_assert (new_insns >= 0);
 182       to = e->caller;
 183       to->global.insns = new_insns;
 184     }
 185   gcc_assert (what->global.inlined_to == to);
 186   if (new_insns > old_insns)
 187     overall_insns += new_insns - old_insns;
 188   ncalls_inlined++;
 189 }
 190
 191 /* Mark all calls of EDGE->CALLEE inlined into EDGE->CALLER.
 192    Return following unredirected edge in the list of callers
 193    of EDGE->CALLEE  */
 194
 195 static struct cgraph_edge *
 196 cgraph_mark_inline (struct cgraph_edge *edge)
 197 {
 198   struct cgraph_node *to = edge->caller;
 199   struct cgraph_node *what = edge->callee;
 200   struct cgraph_edge *e, *next;
 201   int times = 0;
 202
 203   /* Look for all calls, mark them inline and clone recursively
 204      all inlined functions.  */
 205   for (e = what->callers; e; e = next)
 206     {
 207       next = e->next_caller;
 208       if (e->caller == to && e->inline_failed)
 209         {
 210           cgraph_mark_inline_edge (e, true);
 211           if (e == edge)
 212             edge = next;
 213           times++;
 214         }
 215     }
 216   gcc_assert (times);
 217   return edge;
 218 }
 219
 220 /* Estimate the growth caused by inlining NODE into all callees.  */
 221
 222 static int
 223 cgraph_estimate_growth (struct cgraph_node *node)
 224 {
 225   int growth = 0;
 226   struct cgraph_edge *e;
 227   if (node->global.estimated_growth != INT_MIN)
 228     return node->global.estimated_growth;
 229
 230   for (e = node->callers; e; e = e->next_caller)
 231     if (e->inline_failed)
 232       growth += (cgraph_estimate_size_after_inlining (1, e->caller, node)
 233                  - e->caller->global.insns);
 234
 235   /* ??? Wrong for self recursive functions or cases where we decide to not
 236      inline for different reasons, but it is not big deal as in that case
 237      we will keep the body around, but we will also avoid some inlining.  */
 238   if (!node->needed && !DECL_EXTERNAL (node->decl))
 239     growth -= node->global.insns;
 240
 241   node->global.estimated_growth = growth;
 242   return growth;
 243 }
 244
 245 /* Return false when inlining WHAT into TO is not good idea
 246    as it would cause too large growth of function bodies.
 247    When ONE_ONLY is true, assume that only one call site is going
 248    to be inlined, otherwise figure out how many call sites in
 249    TO calls WHAT and verify that all can be inlined.
 250    */
 251
 252 static bool
 253 cgraph_check_inline_limits (struct cgraph_node *to, struct cgraph_node *what,
 254                             const char **reason, bool one_only)
 255 {
 256   int times = 0;
 257   struct cgraph_edge *e;
 258   int newsize;
 259   int limit;
 260
 261   if (one_only)
 262     times = 1;
 263   else
 264     for (e = to->callees; e; e = e->next_callee)
 265       if (e->callee == what)
 266         times++;
 267
 268   if (to->global.inlined_to)
 269     to = to->global.inlined_to;
 270
 271   /* When inlining large function body called once into small function,
 272      take the inlined function as base for limiting the growth.  */
 273   if (to->local.self_insns > what->local.self_insns)
 274     limit = to->local.self_insns;
 275   else
 276     limit = what->local.self_insns;
 277
 278   limit += limit * PARAM_VALUE (PARAM_LARGE_FUNCTION_GROWTH) / 100;
 279
 280   /* Check the size after inlining against the function limits.  But allow
 281      the function to shrink if it went over the limits by forced inlining.  */
 282   newsize = cgraph_estimate_size_after_inlining (times, to, what);
 283   if (newsize >= to->global.insns
 284       && newsize > PARAM_VALUE (PARAM_LARGE_FUNCTION_INSNS)
 285       && newsize > limit)
 286     {
 287       if (reason)
 288         *reason = N_("--param large-function-growth limit reached");
 289       return false;
 290     }
 291   return true;
 292 }
 293
 294 /* Return true when function N is small enough to be inlined.  */
 295
 296 bool
 297 cgraph_default_inline_p (struct cgraph_node *n, const char **reason)
 298 {
 299   tree decl = n->decl;
 300
 301   if (n->inline_decl)
 302     decl = n->inline_decl;
 303   if (!DECL_INLINE (decl))
 304     {
 305       if (reason)
 306         *reason = N_("function not inlinable");
 307       return false;
 308     }
 309
 310   if (!DECL_STRUCT_FUNCTION (decl)->cfg)
 311     {
 312       if (reason)
 313         *reason = N_("function body not available");
 314       return false;
 315     }
 316
 317   if (DECL_DECLARED_INLINE_P (decl))
 318     {
 319       if (n->global.insns >= MAX_INLINE_INSNS_SINGLE)
 320         {
 321           if (reason)
 322             *reason = N_("--param max-inline-insns-single limit reached");
 323           return false;
 324         }
 325     }
 326   else
 327     {
 328       if (n->global.insns >= MAX_INLINE_INSNS_AUTO)
 329         {
 330           if (reason)
 331             *reason = N_("--param max-inline-insns-auto limit reached");
 332           return false;
 333         }
 334     }
 335
 336   return true;
 337 }
 338
 339 /* Return true when inlining WHAT would create recursive inlining.
 340    We call recursive inlining all cases where same function appears more than
 341    once in the single recursion nest path in the inline graph.  */
 342
 343 static bool
 344 cgraph_recursive_inlining_p (struct cgraph_node *to,
 345                              struct cgraph_node *what,
 346                              const char **reason)
 347 {
 348   bool recursive;
 349   if (to->global.inlined_to)
 350     recursive = what->decl == to->global.inlined_to->decl;
 351   else
 352     recursive = what->decl == to->decl;
 353   /* Marking recursive function inline has sane semantic and thus we should
 354      not warn on it.  */
 355   if (recursive && reason)
 356     *reason = (what->local.disregard_inline_limits
 357                ? N_("recursive inlining") : "");
 358   return recursive;
 359 }
 360
 361 /* Return true if the call can be hot.  */
 362 static bool
 363 cgraph_maybe_hot_edge_p (struct cgraph_edge *edge)
 364 {
 365   if (profile_info && flag_branch_probabilities
 366       && (edge->count
 367           <= profile_info->sum_max / PARAM_VALUE (HOT_BB_COUNT_FRACTION)))
 368     return false;
 369   return true;
 370 }
 371
 372 /* A cost model driving the inlining heuristics in a way so the edges with
 373    smallest badness are inlined first.  After each inlining is performed
 374    the costs of all caller edges of nodes affected are recomputed so the
 375    metrics may accurately depend on values such as number of inlinable callers
 376    of the function or function body size.
 377
 378    With profiling we use number of executions of each edge to drive the cost.
 379    We also should distinguish hot and cold calls where the cold calls are
 380    inlined into only when code size is overall improved.
 381    */
 382
 383 static int
 384 cgraph_edge_badness (struct cgraph_edge *edge)
 385 {
 386   if (max_count)
 387     {
 388       int growth =
 389         cgraph_estimate_size_after_inlining (1, edge->caller, edge->callee);
 390       growth -= edge->caller->global.insns;
 391
 392       /* Always prefer inlining saving code size.  */
 393       if (growth <= 0)
 394         return INT_MIN - growth;
 395       return ((int)((double)edge->count * INT_MIN / max_count)) / growth;
 396     }
 397   else
 398   {
 399     int nest = MIN (edge->loop_nest, 8);
 400     int badness = cgraph_estimate_growth (edge->callee) * 256;
 401
 402     /* Decrease badness if call is nested.  */
 403     if (badness > 0)
 404       badness >>= nest;
 405     else
 406       badness <<= nest;
 407
 408     /* Make recursive inlining happen always after other inlining is done.  */
 409     if (cgraph_recursive_inlining_p (edge->caller, edge->callee, NULL))
 410       return badness + 1;
 411     else
 412       return badness;
 413   }
 414 }
 415
 416 /* Recompute heap nodes for each of caller edge.  */
 417
 418 static void
 419 update_caller_keys (fibheap_t heap, struct cgraph_node *node,
 420                     bitmap updated_nodes)
 421 {
 422   struct cgraph_edge *edge;
 423   const char *failed_reason;
 424
 425   if (!node->local.inlinable || node->local.disregard_inline_limits
 426       || node->global.inlined_to)
 427     return;
 428   if (bitmap_bit_p (updated_nodes, node->uid))
 429     return;
 430   bitmap_set_bit (updated_nodes, node->uid);
 431   node->global.estimated_growth = INT_MIN;
 432
 433   if (!node->local.inlinable)
 434     return;
 435   /* Prune out edges we won't inline into anymore.  */
 436   if (!cgraph_default_inline_p (node, &failed_reason))
 437     {
 438       for (edge = node->callers; edge; edge = edge->next_caller)
 439         if (edge->aux)
 440           {
 441             fibheap_delete_node (heap, edge->aux);
 442             edge->aux = NULL;
 443             if (edge->inline_failed)
 444               edge->inline_failed = failed_reason;
 445           }
 446       return;
 447     }
 448
 449   for (edge = node->callers; edge; edge = edge->next_caller)
 450     if (edge->inline_failed)
 451       {
 452         int badness = cgraph_edge_badness (edge);
 453         if (edge->aux)
 454           {
 455             fibnode_t n = edge->aux;
 456             gcc_assert (n->data == edge);
 457             if (n->key == badness)
 458               continue;
 459
 460             /* fibheap_replace_key only increase the keys.  */
 461             if (fibheap_replace_key (heap, n, badness))
 462               continue;
 463             fibheap_delete_node (heap, edge->aux);
 464           }
 465         edge->aux = fibheap_insert (heap, badness, edge);
 466       }
 467 }
 468
 469 /* Recompute heap nodes for each of caller edges of each of callees.  */
 470
 471 static void
 472 update_callee_keys (fibheap_t heap, struct cgraph_node *node,
 473                     bitmap updated_nodes)
 474 {
 475   struct cgraph_edge *e;
 476   node->global.estimated_growth = INT_MIN;
 477
 478   for (e = node->callees; e; e = e->next_callee)
 479     if (e->inline_failed)
 480       update_caller_keys (heap, e->callee, updated_nodes);
 481     else if (!e->inline_failed)
 482       update_callee_keys (heap, e->callee, updated_nodes);
 483 }
 484
 485 /* Enqueue all recursive calls from NODE into priority queue depending on
 486    how likely we want to recursively inline the call.  */
 487
 488 static void
 489 lookup_recursive_calls (struct cgraph_node *node, struct cgraph_node *where,
 490                         fibheap_t heap)
 491 {
 492   static int priority;
 493   struct cgraph_edge *e;
 494   for (e = where->callees; e; e = e->next_callee)
 495     if (e->callee == node)
 496       {
 497         /* When profile feedback is available, prioritize by expected number
 498            of calls.  Without profile feedback we maintain simple queue
 499            to order candidates via recursive depths.  */
 500         fibheap_insert (heap,
 501                         !max_count ? priority++
 502                         : -(e->count / ((max_count + (1<<24) - 1) / (1<<24))),
 503                         e);
 504       }
 505   for (e = where->callees; e; e = e->next_callee)
 506     if (!e->inline_failed)
 507       lookup_recursive_calls (node, e->callee, heap);
 508 }
 509
 510 /* Find callgraph nodes closing a circle in the graph.  The
 511    resulting hashtab can be used to avoid walking the circles.
 512    Uses the cgraph nodes ->aux field which needs to be zero
 513    before and will be zero after operation.  */
 514
 515 static void
 516 cgraph_find_cycles (struct cgraph_node *node, htab_t cycles)
 517 {
 518   struct cgraph_edge *e;
 519
 520   if (node->aux)
 521     {
 522       void **slot;
 523       slot = htab_find_slot (cycles, node, INSERT);
 524       if (!*slot)
 525         {
 526           if (dump_file)
 527             fprintf (dump_file, "Cycle contains %s\n", cgraph_node_name (node));
 528           *slot = node;
 529         }
 530       return;
 531     }
 532
 533   node->aux = node;
 534   for (e = node->callees; e; e = e->next_callee)
 535     cgraph_find_cycles (e->callee, cycles);
 536   node->aux = 0;
 537 }
 538
 539
 540 static void
 541 cgraph_apply_inline_plan (void)
 542 {
 543   struct cgraph_node *node;
 544   struct cgraph_node **order =
 545     xcalloc (cgraph_n_nodes, sizeof (struct cgraph_node *));
 546   int order_pos = 0, new_order_pos = 0;
 547   int i;
 548
 549   timevar_push (TV_INTEGRATION);
 550   order_pos = cgraph_postorder (order);
 551   gcc_assert (order_pos == cgraph_n_nodes);
 552
 553   /* Garbage collector may remove inline clones we eliminate during
 554      optimization.  So we must be sure to not reference them.  */
 555   for (i = 0; i < order_pos; i++)
 556     if (!order[i]->global.inlined_to)
 557       order[new_order_pos++] = order[i];
 558
 559   /* Initialize the default bitmap obstack.  */
 560   bitmap_obstack_initialize (NULL);
 561
 562
 563   for (i = 0; i < new_order_pos; i++)
 564     {
 565       struct cgraph_edge *e;
 566
 567       node = order[i];
 568       for (e = node->callees; e; e = e->next_callee)
 569         if (!e->inline_failed || warn_inline)
 570           break;
 571       if (e)
 572         {
 573           if (cgraph_preserve_function_body_p (node->decl, true))
 574             save_inline_function_body (node);
 575           push_cfun (DECL_STRUCT_FUNCTION (node->decl));
 576           tree_register_cfg_hooks ();
 577           current_function_decl = node->decl;
 578           optimize_inline_calls (node->decl, false);
 579           free_dominance_info (CDI_DOMINATORS);
 580           free_dominance_info (CDI_POST_DOMINATORS);
 581           node->local.self_insns = node->global.insns;
 582           pop_cfun ();
 583           ggc_collect ();
 584         }
 585     }
 586   free (order);
 587   cfun = NULL;
 588   timevar_pop (TV_INTEGRATION);
 589 }
 590
 591 /* Leafify the cgraph node.  We have to be careful in recursing
 592    as to not run endlessly in circles of the callgraph.
 593    We do so by using a hashtab of cycle entering nodes as generated
 594    by cgraph_find_cycles.  */
 595
 596 static void
 597 cgraph_flatten_node (struct cgraph_node *node, htab_t cycles)
 598 {
 599   struct cgraph_edge *e;
 600
 601   for (e = node->callees; e; e = e->next_callee)
 602     {
 603       /* Inline call, if possible, and recurse.  Be sure we are not
 604          entering callgraph circles here.  */
 605       if (e->inline_failed
 606           && e->callee->local.inlinable
 607           && !cgraph_recursive_inlining_p (node, e->callee,
 608                                            &e->inline_failed)
 609           && !htab_find (cycles, e->callee))
 610         {
 611           if (dump_file)
 612             fprintf (dump_file, " inlining %s", cgraph_node_name (e->callee));
 613           cgraph_mark_inline_edge (e, true);
 614           cgraph_flatten_node (e->callee, cycles);
 615         }
 616       else if (dump_file)
 617         fprintf (dump_file, " !inlining %s", cgraph_node_name (e->callee));
 618     }
 619 }
 620
 621 /* Decide on recursive inlining: in the case function has recursive calls,
 622    inline until body size reaches given argument.  */
 623
 624 static bool
 625 cgraph_decide_recursive_inlining (struct cgraph_node *node)
 626 {
 627   int limit = PARAM_VALUE (PARAM_MAX_INLINE_INSNS_RECURSIVE_AUTO);
 628   int max_depth = PARAM_VALUE (PARAM_MAX_INLINE_RECURSIVE_DEPTH_AUTO);
 629   int probability = PARAM_VALUE (PARAM_MIN_INLINE_RECURSIVE_PROBABILITY);
 630   fibheap_t heap;
 631   struct cgraph_edge *e;
 632   struct cgraph_node *master_clone, *next;
 633   int depth = 0;
 634   int n = 0;
 635
 636   if (DECL_DECLARED_INLINE_P (node->decl))
 637     {
 638       limit = PARAM_VALUE (PARAM_MAX_INLINE_INSNS_RECURSIVE);
 639       max_depth = PARAM_VALUE (PARAM_MAX_INLINE_RECURSIVE_DEPTH);
 640     }
 641
 642   /* Make sure that function is small enough to be considered for inlining.  */
 643   if (!max_depth
 644       || cgraph_estimate_size_after_inlining (1, node, node)  >= limit)
 645     return false;
 646   heap = fibheap_new ();
 647   lookup_recursive_calls (node, node, heap);
 648   if (fibheap_empty (heap))
 649     {
 650       fibheap_delete (heap);
 651       return false;
 652     }
 653
 654   if (dump_file)
 655     fprintf (dump_file,
 656              "  Performing recursive inlining on %s\n",
 657              cgraph_node_name (node));
 658
 659   /* We need original clone to copy around.  */
 660   master_clone = cgraph_clone_node (node, node->count, 1, false);
 661   master_clone->needed = true;
 662   for (e = master_clone->callees; e; e = e->next_callee)
 663     if (!e->inline_failed)
 664       cgraph_clone_inlined_nodes (e, true, false);
 665
 666   /* Do the inlining and update list of recursive call during process.  */
 667   while (!fibheap_empty (heap)
 668          && (cgraph_estimate_size_after_inlining (1, node, master_clone)
 669              <= limit))
 670     {
 671       struct cgraph_edge *curr = fibheap_extract_min (heap);
 672       struct cgraph_node *cnode;
 673
 674       depth = 1;
 675       for (cnode = curr->caller;
 676            cnode->global.inlined_to; cnode = cnode->callers->caller)
 677         if (node->decl == curr->callee->decl)
 678           depth++;
 679       if (depth > max_depth)
 680         {
 681           if (dump_file)
 682             fprintf (dump_file,
 683                      "   maxmal depth reached\n");
 684           continue;
 685         }
 686
 687       if (max_count)
 688         {
 689           if (!cgraph_maybe_hot_edge_p (curr))
 690             {
 691               if (dump_file)
 692                 fprintf (dump_file, "   Not inlining cold call\n");
 693               continue;
 694             }
 695           if (curr->count * 100 / node->count < probability)
 696             {
 697               if (dump_file)
 698                 fprintf (dump_file,
 699                          "   Probability of edge is too small\n");
 700               continue;
 701             }
 702         }
 703
 704       if (dump_file)
 705         {
 706           fprintf (dump_file,
 707                    "   Inlining call of depth %i", depth);
 708           if (node->count)
 709             {
 710               fprintf (dump_file, " called approx. %.2f times per call",
 711                        (double)curr->count / node->count);
 712             }
 713           fprintf (dump_file, "\n");
 714         }
 715       cgraph_redirect_edge_callee (curr, master_clone);
 716       cgraph_mark_inline_edge (curr, false);
 717       lookup_recursive_calls (node, curr->callee, heap);
 718       n++;
 719     }
 720   if (!fibheap_empty (heap) && dump_file)
 721     fprintf (dump_file, "    Recursive inlining growth limit met.\n");
 722
 723   fibheap_delete (heap);
 724   if (dump_file)
 725     fprintf (dump_file,
 726              "\n   Inlined %i times, body grown from %i to %i insns\n", n,
 727              master_clone->global.insns, node->global.insns);
 728
 729   /* Remove master clone we used for inlining.  We rely that clones inlined
 730      into master clone gets queued just before master clone so we don't
 731      need recursion.  */
 732   for (node = cgraph_nodes; node != master_clone;
 733        node = next)
 734     {
 735       next = node->next;
 736       if (node->global.inlined_to == master_clone)
 737         cgraph_remove_node (node);
 738     }
 739   cgraph_remove_node (master_clone);
 740   /* FIXME: Recursive inlining actually reduces number of calls of the
 741      function.  At this place we should probably walk the function and
 742      inline clones and compensate the counts accordingly.  This probably
 743      doesn't matter much in practice.  */
 744   return n > 0;
 745 }
 746
 747 /* Set inline_failed for all callers of given function to REASON.  */
 748
 749 static void
 750 cgraph_set_inline_failed (struct cgraph_node *node, const char *reason)
 751 {
 752   struct cgraph_edge *e;
 753
 754   if (dump_file)
 755     fprintf (dump_file, "Inlining failed: %s\n", reason);
 756   for (e = node->callers; e; e = e->next_caller)
 757     if (e->inline_failed)
 758       e->inline_failed = reason;
 759 }
 760
 761 /* We use greedy algorithm for inlining of small functions:
 762    All inline candidates are put into prioritized heap based on estimated
 763    growth of the overall number of instructions and then update the estimates.
 764
 765    INLINED and INLINED_CALEES are just pointers to arrays large enough
 766    to be passed to cgraph_inlined_into and cgraph_inlined_callees.  */
 767
 768 static void
 769 cgraph_decide_inlining_of_small_functions (void)
 770 {
 771   struct cgraph_node *node;
 772   struct cgraph_edge *edge;
 773   const char *failed_reason;
 774   fibheap_t heap = fibheap_new ();
 775   bitmap updated_nodes = BITMAP_ALLOC (NULL);
 776
 777   if (dump_file)
 778     fprintf (dump_file, "\nDeciding on smaller functions:\n");
 779
 780   /* Put all inline candidates into the heap.  */
 781
 782   for (node = cgraph_nodes; node; node = node->next)
 783     {
 784       if (!node->local.inlinable || !node->callers
 785           || node->local.disregard_inline_limits)
 786         continue;
 787       if (dump_file)
 788         fprintf (dump_file, "Considering inline candidate %s.\n", cgraph_node_name (node));
 789
 790       node->global.estimated_growth = INT_MIN;
 791       if (!cgraph_default_inline_p (node, &failed_reason))
 792         {
 793           cgraph_set_inline_failed (node, failed_reason);
 794           continue;
 795         }
 796
 797       for (edge = node->callers; edge; edge = edge->next_caller)
 798         if (edge->inline_failed)
 799           {
 800             gcc_assert (!edge->aux);
 801             edge->aux = fibheap_insert (heap, cgraph_edge_badness (edge), edge);
 802           }
 803     }
 804   while (overall_insns <= max_insns && (edge = fibheap_extract_min (heap)))
 805     {
 806       int old_insns = overall_insns;
 807       struct cgraph_node *where;
 808       int growth =
 809         cgraph_estimate_size_after_inlining (1, edge->caller, edge->callee);
 810
 811       growth -= edge->caller->global.insns;
 812
 813       if (dump_file)
 814         {
 815           fprintf (dump_file,
 816                    "\nConsidering %s with %i insns\n",
 817                    cgraph_node_name (edge->callee),
 818                    edge->callee->global.insns);
 819           fprintf (dump_file,
 820                    " to be inlined into %s\n"
 821                    " Estimated growth after inlined into all callees is %+i insns.\n"
 822                    " Estimated badness is %i.\n",
 823                    cgraph_node_name (edge->caller),
 824                    cgraph_estimate_growth (edge->callee),
 825                    cgraph_edge_badness (edge));
 826           if (edge->count)
 827             fprintf (dump_file," Called "HOST_WIDEST_INT_PRINT_DEC"x\n", edge->count);
 828         }
 829       gcc_assert (edge->aux);
 830       edge->aux = NULL;
 831       if (!edge->inline_failed)
 832         continue;
 833
 834       /* When not having profile info ready we don't weight by any way the
 835          position of call in procedure itself.  This means if call of
 836          function A from function B seems profitable to inline, the recursive
 837          call of function A in inline copy of A in B will look profitable too
 838          and we end up inlining until reaching maximal function growth.  This
 839          is not good idea so prohibit the recursive inlining.
 840
 841          ??? When the frequencies are taken into account we might not need this
 842          restriction.   */
 843       if (!max_count)
 844         {
 845           where = edge->caller;
 846           while (where->global.inlined_to)
 847             {
 848               if (where->decl == edge->callee->decl)
 849                 break;
 850               where = where->callers->caller;
 851             }
 852           if (where->global.inlined_to)
 853             {
 854               edge->inline_failed
 855                 = (edge->callee->local.disregard_inline_limits ? N_("recursive inlining") : "");
 856               if (dump_file)
 857                 fprintf (dump_file, " inline_failed:Recursive inlining performed only for function itself.\n");
 858               continue;
 859             }
 860         }
 861
 862       if (!cgraph_maybe_hot_edge_p (edge) && growth > 0)
 863         {
 864           if (!cgraph_recursive_inlining_p (edge->caller, edge->callee,
 865                                             &edge->inline_failed))
 866             {
 867               edge->inline_failed =
 868                 N_("call is unlikely");
 869               if (dump_file)
 870                 fprintf (dump_file, " inline_failed:%s.\n", edge->inline_failed);
 871             }
 872           continue;
 873         }
 874       if (!cgraph_default_inline_p (edge->callee, &edge->inline_failed))
 875         {
 876           if (!cgraph_recursive_inlining_p (edge->caller, edge->callee,
 877                                             &edge->inline_failed))
 878             {
 879               if (dump_file)
 880                 fprintf (dump_file, " inline_failed:%s.\n", edge->inline_failed);
 881             }
 882           continue;
 883         }
 884       if (cgraph_recursive_inlining_p (edge->caller, edge->callee,
 885                                        &edge->inline_failed))
 886         {
 887           where = edge->caller;
 888           if (where->global.inlined_to)
 889             where = where->global.inlined_to;
 890           if (!cgraph_decide_recursive_inlining (where))
 891             continue;
 892           update_callee_keys (heap, where, updated_nodes);
 893         }
 894       else
 895         {
 896           struct cgraph_node *callee;
 897           if (!cgraph_check_inline_limits (edge->caller, edge->callee,
 898                                            &edge->inline_failed, true))
 899             {
 900               if (dump_file)
 901                 fprintf (dump_file, " Not inlining into %s:%s.\n",
 902                          cgraph_node_name (edge->caller), edge->inline_failed);
 903               continue;
 904             }
 905           callee = edge->callee;
 906           cgraph_mark_inline_edge (edge, true);
 907           update_callee_keys (heap, callee, updated_nodes);
 908         }
 909       where = edge->caller;
 910       if (where->global.inlined_to)
 911         where = where->global.inlined_to;
 912
 913       /* Our profitability metric can depend on local properties
 914          such as number of inlinable calls and size of the function body.
 915          After inlining these properties might change for the function we
 916          inlined into (since it's body size changed) and for the functions
 917          called by function we inlined (since number of it inlinable callers
 918          might change).  */
 919       update_caller_keys (heap, where, updated_nodes);
 920       bitmap_clear (updated_nodes);
 921
 922       if (dump_file)
 923         {
 924           fprintf (dump_file,
 925                    " Inlined into %s which now has %i insns,"
 926                    "net change of %+i insns.\n",
 927                    cgraph_node_name (edge->caller),
 928                    edge->caller->global.insns,
 929                    overall_insns - old_insns);
 930         }
 931     }
 932   while ((edge = fibheap_extract_min (heap)) != NULL)
 933     {
 934       gcc_assert (edge->aux);
 935       edge->aux = NULL;
 936       if (!edge->callee->local.disregard_inline_limits && edge->inline_failed
 937           && !cgraph_recursive_inlining_p (edge->caller, edge->callee,
 938                                            &edge->inline_failed))
 939         edge->inline_failed = N_("--param inline-unit-growth limit reached");
 940     }
 941   fibheap_delete (heap);
 942   BITMAP_FREE (updated_nodes);
 943 }
 944
 945 /* Decide on the inlining.  We do so in the topological order to avoid
 946    expenses on updating data structures.  */
 947
 948 static unsigned int
 949 cgraph_decide_inlining (void)
 950 {
 951   struct cgraph_node *node;
 952   int nnodes;
 953   struct cgraph_node **order =
 954     XCNEWVEC (struct cgraph_node *, cgraph_n_nodes);
 955   int old_insns = 0;
 956   int i;
 957
 958   timevar_push (TV_INLINE_HEURISTICS);
 959   max_count = 0;
 960   for (node = cgraph_nodes; node; node = node->next)
 961     if (node->analyzed && (node->needed || node->reachable))
 962       {
 963         struct cgraph_edge *e;
 964
 965         /* At the moment, no IPA passes change function bodies before inlining.
 966            Save some time by not recomputing function body sizes if early inlining
 967            already did so.  */
 968         if (!flag_early_inlining)
 969           node->local.self_insns = node->global.insns
 970              = estimate_num_insns (node->decl);
 971
 972         initial_insns += node->local.self_insns;
 973         gcc_assert (node->local.self_insns == node->global.insns);
 974         for (e = node->callees; e; e = e->next_callee)
 975           if (max_count < e->count)
 976             max_count = e->count;
 977       }
 978   overall_insns = initial_insns;
 979   gcc_assert (!max_count || (profile_info && flag_branch_probabilities));
 980
 981   max_insns = overall_insns;
 982   if (max_insns < PARAM_VALUE (PARAM_LARGE_UNIT_INSNS))
 983     max_insns = PARAM_VALUE (PARAM_LARGE_UNIT_INSNS);
 984
 985   max_insns = ((HOST_WIDEST_INT) max_insns
 986                * (100 + PARAM_VALUE (PARAM_INLINE_UNIT_GROWTH)) / 100);
 987
 988   nnodes = cgraph_postorder (order);
 989
 990   if (dump_file)
 991     fprintf (dump_file,
 992              "\nDeciding on inlining.  Starting with %i insns.\n",
 993              initial_insns);
 994
 995   for (node = cgraph_nodes; node; node = node->next)
 996     node->aux = 0;
 997
 998   if (dump_file)
 999     fprintf (dump_file, "\nInlining always_inline functions:\n");
1000
1001   /* In the first pass mark all always_inline edges.  Do this with a priority
1002      so none of our later choices will make this impossible.  */
1003   for (i = nnodes - 1; i >= 0; i--)
1004     {
1005       struct cgraph_edge *e, *next;
1006
1007       node = order[i];
1008
1009       /* Handle nodes to be flattened, but don't update overall unit size.  */
1010       if (lookup_attribute ("flatten", DECL_ATTRIBUTES (node->decl)) != NULL)
1011         {
1012           int old_overall_insns = overall_insns;
1013           htab_t cycles;
1014           if (dump_file)
1015             fprintf (dump_file,
1016                      "Leafifying %s\n", cgraph_node_name (node));
1017           cycles = htab_create (7, htab_hash_pointer, htab_eq_pointer, NULL);
1018           cgraph_find_cycles (node, cycles);
1019           cgraph_flatten_node (node, cycles);
1020           htab_delete (cycles);
1021           overall_insns = old_overall_insns;
1022           /* We don't need to consider always_inline functions inside the flattened
1023              function anymore.  */
1024           continue;
1025         }
1026
1027       if (!node->local.disregard_inline_limits)
1028         continue;
1029       if (dump_file)
1030         fprintf (dump_file,
1031                  "\nConsidering %s %i insns (always inline)\n",
1032                  cgraph_node_name (node), node->global.insns);
1033       old_insns = overall_insns;
1034       for (e = node->callers; e; e = next)
1035         {
1036           next = e->next_caller;
1037           if (!e->inline_failed)
1038             continue;
1039           if (cgraph_recursive_inlining_p (e->caller, e->callee,
1040                                            &e->inline_failed))
1041             continue;
1042           cgraph_mark_inline_edge (e, true);
1043           if (dump_file)
1044             fprintf (dump_file,
1045                      " Inlined into %s which now has %i insns.\n",
1046                      cgraph_node_name (e->caller),
1047                      e->caller->global.insns);
1048         }
1049       if (dump_file)
1050         fprintf (dump_file,
1051                  " Inlined for a net change of %+i insns.\n",
1052                  overall_insns - old_insns);
1053     }
1054
1055   if (!flag_really_no_inline)
1056     cgraph_decide_inlining_of_small_functions ();
1057
1058   if (!flag_really_no_inline
1059       && flag_inline_functions_called_once)
1060     {
1061       if (dump_file)
1062         fprintf (dump_file, "\nDeciding on functions called once:\n");
1063
1064       /* And finally decide what functions are called once.  */
1065
1066       for (i = nnodes - 1; i >= 0; i--)
1067         {
1068           node = order[i];
1069
1070           if (node->callers && !node->callers->next_caller && !node->needed
1071               && node->local.inlinable && node->callers->inline_failed
1072               && !DECL_EXTERNAL (node->decl) && !DECL_COMDAT (node->decl))
1073             {
1074               bool ok = true;
1075               struct cgraph_node *node1;
1076
1077               /* Verify that we won't duplicate the caller.  */
1078               for (node1 = node->callers->caller;
1079                    node1->callers && !node1->callers->inline_failed
1080                    && ok; node1 = node1->callers->caller)
1081                 if (node1->callers->next_caller || node1->needed)
1082                   ok = false;
1083               if (ok)
1084                 {
1085                   if (dump_file)
1086                     {
1087                       fprintf (dump_file,
1088                                "\nConsidering %s %i insns.\n",
1089                                cgraph_node_name (node), node->global.insns);
1090                       fprintf (dump_file,
1091                                " Called once from %s %i insns.\n",
1092                                cgraph_node_name (node->callers->caller),
1093                                node->callers->caller->global.insns);
1094                     }
1095
1096                   old_insns = overall_insns;
1097
1098                   if (cgraph_check_inline_limits (node->callers->caller, node,
1099                                                   NULL, false))
1100                     {
1101                       cgraph_mark_inline (node->callers);
1102                       if (dump_file)
1103                         fprintf (dump_file,
1104                                  " Inlined into %s which now has %i insns"
1105                                  " for a net change of %+i insns.\n",
1106                                  cgraph_node_name (node->callers->caller),
1107                                  node->callers->caller->global.insns,
1108                                  overall_insns - old_insns);
1109                     }
1110                   else
1111                     {
1112                       if (dump_file)
1113                         fprintf (dump_file,
1114                                  " Inline limit reached, not inlined.\n");
1115                     }
1116                 }
1117             }
1118         }
1119     }
1120
1121   cgraph_remove_unreachable_nodes (false, dump_file);
1122   cgraph_apply_inline_plan ();
1123   cgraph_remove_unreachable_nodes (false, dump_file);
1124
1125   if (dump_file)
1126     fprintf (dump_file,
1127              "\nInlined %i calls, eliminated %i functions, "
1128              "%i insns turned to %i insns.\n\n",
1129              ncalls_inlined, nfunctions_inlined, initial_insns,
1130              overall_insns);
1131   free (order);
1132   timevar_pop (TV_INLINE_HEURISTICS);
1133   return 0;
1134 }
1135
1136 /* Decide on the inlining.  We do so in the topological order to avoid
1137    expenses on updating data structures.  */
1138
1139 bool
1140 cgraph_decide_inlining_incrementally (struct cgraph_node *node, bool early)
1141 {
1142   struct cgraph_edge *e;
1143   bool inlined = false;
1144   const char *failed_reason;
1145
1146   /* First of all look for always inline functions.  */
1147   for (e = node->callees; e; e = e->next_callee)
1148     if (e->callee->local.disregard_inline_limits
1149         && e->inline_failed
1150         && !cgraph_recursive_inlining_p (node, e->callee, &e->inline_failed)
1151         /* ??? It is possible that renaming variable removed the function body
1152            in duplicate_decls. See gcc.c-torture/compile/20011119-2.c  */
1153         && (DECL_SAVED_TREE (e->callee->decl) || e->callee->inline_decl))
1154       {
1155         if (dump_file && early)
1156           {
1157             fprintf (dump_file, "  Early inlining %s",
1158                      cgraph_node_name (e->callee));
1159             fprintf (dump_file, " into %s\n", cgraph_node_name (node));
1160           }
1161         cgraph_mark_inline (e);
1162         inlined = true;
1163       }
1164
1165   /* Now do the automatic inlining.  */
1166   if (!flag_really_no_inline)
1167     for (e = node->callees; e; e = e->next_callee)
1168       if (e->callee->local.inlinable
1169           && e->inline_failed
1170           && !e->callee->local.disregard_inline_limits
1171           && !cgraph_recursive_inlining_p (node, e->callee, &e->inline_failed)
1172           && (!early
1173               || (cgraph_estimate_size_after_inlining (1, e->caller, e->callee)
1174                   <= e->caller->global.insns))
1175           && cgraph_check_inline_limits (node, e->callee, &e->inline_failed,
1176                                          false)
1177           && (DECL_SAVED_TREE (e->callee->decl) || e->callee->inline_decl))
1178         {
1179           if (cgraph_default_inline_p (e->callee, &failed_reason))
1180             {
1181               if (dump_file && early)
1182                 {
1183                   fprintf (dump_file, "  Early inlining %s",
1184                            cgraph_node_name (e->callee));
1185                   fprintf (dump_file, " into %s\n", cgraph_node_name (node));
1186                 }
1187               cgraph_mark_inline (e);
1188               inlined = true;
1189             }
1190           else if (!early)
1191             e->inline_failed = failed_reason;
1192         }
1193   if (inlined || (warn_inline && !early))
1194     {
1195       /* Initialize the default bitmap obstack.  */
1196       bitmap_obstack_initialize (NULL);
1197       push_cfun (DECL_STRUCT_FUNCTION (node->decl));
1198       tree_register_cfg_hooks ();
1199       current_function_decl = node->decl;
1200       optimize_inline_calls (current_function_decl, early);
1201       free_dominance_info (CDI_DOMINATORS);
1202       free_dominance_info (CDI_POST_DOMINATORS);
1203       node->local.self_insns = node->global.insns;
1204       current_function_decl = NULL;
1205       pop_cfun ();
1206     }
1207   return inlined;
1208 }
1209
1210 /* When inlining shall be performed.  */
1211 static bool
1212 cgraph_gate_inlining (void)
1213 {
1214   return flag_inline_trees /*&& 0*/;
1215 }
1216
1217 struct tree_opt_pass pass_ipa_inline =
1218 {
1219   "inline",                             /* name */
1220   cgraph_gate_inlining,                 /* gate */
1221   cgraph_decide_inlining,               /* execute */
1222   NULL,                                 /* sub */
1223   NULL,                                 /* next */
1224   0,                                    /* static_pass_number */
1225   TV_INTEGRATION,                       /* tv_id */
1226   0,                                    /* properties_required */
1227   PROP_cfg,                             /* properties_provided */
1228   0,                                    /* properties_destroyed */
1229   0,                                    /* todo_flags_start */
1230   TODO_dump_cgraph | TODO_dump_func,    /* todo_flags_finish */
1231   0                                     /* letter */
1232 };
1233
1234 /* Because inlining might remove no-longer reachable nodes, we need to
1235    keep the array visible to garbage collector to avoid reading collected
1236    out nodes.  */
1237 static int nnodes;
1238 static GTY ((length ("nnodes"))) struct cgraph_node **order;
1239
1240 /* Do inlining of small functions.  Doing so early helps profiling and other
1241    passes to be somewhat more effective and avoids some code duplication in
1242    later real inlining pass for testcases with very many function calls.  */
1243 static unsigned int
1244 cgraph_early_inlining (void)
1245 {
1246   struct cgraph_node *node;
1247   int i;
1248
1249   if (sorrycount || errorcount)
1250     return 0;
1251 #ifdef ENABLE_CHECKING
1252   for (node = cgraph_nodes; node; node = node->next)
1253     gcc_assert (!node->aux);
1254 #endif
1255
1256   order = ggc_alloc (sizeof (*order) * cgraph_n_nodes);
1257   nnodes = cgraph_postorder (order);
1258   for (i = nnodes - 1; i >= 0; i--)
1259     {
1260       node = order[i];
1261       if (node->analyzed && (node->needed || node->reachable))
1262         node->local.self_insns = node->global.insns
1263           = estimate_num_insns (node->decl);
1264     }
1265   for (i = nnodes - 1; i >= 0; i--)
1266     {
1267       node = order[i];
1268       if (node->analyzed && node->local.inlinable
1269           && (node->needed || node->reachable)
1270           && node->callers)
1271         {
1272           if (cgraph_decide_inlining_incrementally (node, true))
1273             ggc_collect ();
1274         }
1275     }
1276   cgraph_remove_unreachable_nodes (true, dump_file);
1277 #ifdef ENABLE_CHECKING
1278   for (node = cgraph_nodes; node; node = node->next)
1279     gcc_assert (!node->global.inlined_to);
1280 #endif
1281   ggc_free (order);
1282   order = NULL;
1283   nnodes = 0;
1284   return 0;
1285 }
1286
1287 /* When inlining shall be performed.  */
1288 static bool
1289 cgraph_gate_early_inlining (void)
1290 {
1291   return flag_inline_trees && flag_early_inlining;
1292 }
1293
1294 struct tree_opt_pass pass_early_ipa_inline =
1295 {
1296   "einline",                            /* name */
1297   cgraph_gate_early_inlining,           /* gate */
1298   cgraph_early_inlining,                /* execute */
1299   NULL,                                 /* sub */
1300   NULL,                                 /* next */
1301   0,                                    /* static_pass_number */
1302   TV_INTEGRATION,                       /* tv_id */
1303   0,                                    /* properties_required */
1304   PROP_cfg,                             /* properties_provided */
1305   0,                                    /* properties_destroyed */
1306   0,                                    /* todo_flags_start */
1307   TODO_dump_cgraph | TODO_dump_func,    /* todo_flags_finish */
1308   0                                     /* letter */
1309 };
1310
1311 #include "gt-ipa-inline.h"