gcc/ipa-inline.c

   1 /* Inlining decision heuristics.
   2    Copyright (C) 2003, 2004 Free Software Foundation, Inc.
   3    Contributed by Jan Hubicka
   4
   5 This file is part of GCC.
   6
   7 GCC is free software; you can redistribute it and/or modify it under
   8 the terms of the GNU General Public License as published by the Free
   9 Software Foundation; either version 2, or (at your option) any later
  10 version.
  11
  12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  14 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  15 for more details.
  16
  17 You should have received a copy of the GNU General Public License
  18 along with GCC; see the file COPYING.  If not, write to the Free
  19 Software Foundation, 51 Franklin Street, Fifth Floor, Boston, MA
  20 02110-1301, USA.  */
  21
  22 /*  Inlining decision heuristics
  23
  24     We separate inlining decisions from the inliner itself and store it
  25     inside callgraph as so called inline plan.  Refer to cgraph.c
  26     documentation about particular representation of inline plans in the
  27     callgraph.
  28
  29     There are three major parts of this file:
  30
  31     cgraph_mark_inline implementation
  32
  33       This function allows to mark given call inline and performs necessary
  34       modifications of cgraph (production of the clones and updating overall
  35       statistics)
  36
  37     inlining heuristics limits
  38
  39       These functions allow to check that particular inlining is allowed
  40       by the limits specified by user (allowed function growth, overall unit
  41       growth and so on).
  42
  43     inlining heuristics
  44
  45       This is implementation of IPA pass aiming to get as much of benefit
  46       from inlining obeying the limits checked above.
  47
  48       The implementation of particular heuristics is separated from
  49       the rest of code to make it easier to replace it with more complicated
  50       implementation in the future.  The rest of inlining code acts as a
  51       library aimed to modify the callgraph and verify that the parameters
  52       on code size growth fits.
  53
  54       To mark given call inline, use cgraph_mark_inline function, the
  55       verification is performed by cgraph_default_inline_p and
  56       cgraph_check_inline_limits.
  57
  58       The heuristics implements simple knapsack style algorithm ordering
  59       all functions by their "profitability" (estimated by code size growth)
  60       and inlining them in priority order.
  61
  62       cgraph_decide_inlining implements heuristics taking whole callgraph
  63       into account, while cgraph_decide_inlining_incrementally considers
  64       only one function at a time and is used in non-unit-at-a-time mode.  */
  65
  66 #include "config.h"
  67 #include "system.h"
  68 #include "coretypes.h"
  69 #include "tm.h"
  70 #include "tree.h"
  71 #include "tree-inline.h"
  72 #include "langhooks.h"
  73 #include "flags.h"
  74 #include "cgraph.h"
  75 #include "diagnostic.h"
  76 #include "timevar.h"
  77 #include "params.h"
  78 #include "fibheap.h"
  79 #include "intl.h"
  80 #include "tree-pass.h"
  81 #include "hashtab.h"
  82 #include "coverage.h"
  83 #include "ggc.h"
  84
  85 /* Statistics we collect about inlining algorithm.  */
  86 static int ncalls_inlined;
  87 static int nfunctions_inlined;
  88 static int initial_insns;
  89 static int overall_insns;
  90 static int max_insns;
  91 static gcov_type max_count;
  92
  93 /* Estimate size of the function after inlining WHAT into TO.  */
  94
  95 static int
  96 cgraph_estimate_size_after_inlining (int times, struct cgraph_node *to,
  97                                      struct cgraph_node *what)
  98 {
  99   int size;
 100   tree fndecl = what->decl, arg;
 101   int call_insns = PARAM_VALUE (PARAM_INLINE_CALL_COST);
 102
 103   for (arg = DECL_ARGUMENTS (fndecl); arg; arg = TREE_CHAIN (arg))
 104     call_insns += estimate_move_cost (TREE_TYPE (arg));
 105   size = (what->global.insns - call_insns) * times + to->global.insns;
 106   gcc_assert (size >= 0);
 107   return size;
 108 }
 109
 110 /* E is expected to be an edge being inlined.  Clone destination node of
 111    the edge and redirect it to the new clone.
 112    DUPLICATE is used for bookkeeping on whether we are actually creating new
 113    clones or re-using node originally representing out-of-line function call.
 114    */
 115 void
 116 cgraph_clone_inlined_nodes (struct cgraph_edge *e, bool duplicate, bool update_original)
 117 {
 118   struct cgraph_node *n;
 119
 120   /* We may eliminate the need for out-of-line copy to be output.  In that
 121      case just go ahead and re-use it.  */
 122   if (!e->callee->callers->next_caller
 123       && (!e->callee->needed || DECL_EXTERNAL (e->callee->decl))
 124       && duplicate
 125       && flag_unit_at_a_time)
 126     {
 127       gcc_assert (!e->callee->global.inlined_to);
 128       if (!DECL_EXTERNAL (e->callee->decl))
 129         overall_insns -= e->callee->global.insns, nfunctions_inlined++;
 130       duplicate = 0;
 131     }
 132    else if (duplicate)
 133     {
 134       n = cgraph_clone_node (e->callee, e->count, e->loop_nest, update_original);
 135       cgraph_redirect_edge_callee (e, n);
 136     }
 137
 138   if (e->caller->global.inlined_to)
 139     e->callee->global.inlined_to = e->caller->global.inlined_to;
 140   else
 141     e->callee->global.inlined_to = e->caller;
 142
 143   /* Recursively clone all bodies.  */
 144   for (e = e->callee->callees; e; e = e->next_callee)
 145     if (!e->inline_failed)
 146       cgraph_clone_inlined_nodes (e, duplicate, update_original);
 147 }
 148
 149 /* Mark edge E as inlined and update callgraph accordingly.
 150    UPDATE_ORIGINAL specify whether profile of original function should be
 151    updated. */
 152
 153 void
 154 cgraph_mark_inline_edge (struct cgraph_edge *e, bool update_original)
 155 {
 156   int old_insns = 0, new_insns = 0;
 157   struct cgraph_node *to = NULL, *what;
 158
 159   if (e->callee->inline_decl)
 160     cgraph_redirect_edge_callee (e, cgraph_node (e->callee->inline_decl));
 161
 162   gcc_assert (e->inline_failed);
 163   e->inline_failed = NULL;
 164
 165   if (!e->callee->global.inlined && flag_unit_at_a_time)
 166     DECL_POSSIBLY_INLINED (e->callee->decl) = true;
 167   e->callee->global.inlined = true;
 168
 169   cgraph_clone_inlined_nodes (e, true, update_original);
 170
 171   what = e->callee;
 172
 173   /* Now update size of caller and all functions caller is inlined into.  */
 174   for (;e && !e->inline_failed; e = e->caller->callers)
 175     {
 176       old_insns = e->caller->global.insns;
 177       new_insns = cgraph_estimate_size_after_inlining (1, e->caller,
 178                                                        what);
 179       gcc_assert (new_insns >= 0);
 180       to = e->caller;
 181       to->global.insns = new_insns;
 182     }
 183   gcc_assert (what->global.inlined_to == to);
 184   if (new_insns > old_insns)
 185     overall_insns += new_insns - old_insns;
 186   ncalls_inlined++;
 187 }
 188
 189 /* Mark all calls of EDGE->CALLEE inlined into EDGE->CALLER.
 190    Return following unredirected edge in the list of callers
 191    of EDGE->CALLEE  */
 192
 193 static struct cgraph_edge *
 194 cgraph_mark_inline (struct cgraph_edge *edge)
 195 {
 196   struct cgraph_node *to = edge->caller;
 197   struct cgraph_node *what = edge->callee;
 198   struct cgraph_edge *e, *next;
 199   int times = 0;
 200
 201   /* Look for all calls, mark them inline and clone recursively
 202      all inlined functions.  */
 203   for (e = what->callers; e; e = next)
 204     {
 205       next = e->next_caller;
 206       if (e->caller == to && e->inline_failed)
 207         {
 208           cgraph_mark_inline_edge (e, true);
 209           if (e == edge)
 210             edge = next;
 211           times++;
 212         }
 213     }
 214   gcc_assert (times);
 215   return edge;
 216 }
 217
 218 /* Estimate the growth caused by inlining NODE into all callees.  */
 219
 220 static int
 221 cgraph_estimate_growth (struct cgraph_node *node)
 222 {
 223   int growth = 0;
 224   struct cgraph_edge *e;
 225   if (node->global.estimated_growth != INT_MIN)
 226     return node->global.estimated_growth;
 227
 228   for (e = node->callers; e; e = e->next_caller)
 229     if (e->inline_failed)
 230       growth += (cgraph_estimate_size_after_inlining (1, e->caller, node)
 231                  - e->caller->global.insns);
 232
 233   /* ??? Wrong for self recursive functions or cases where we decide to not
 234      inline for different reasons, but it is not big deal as in that case
 235      we will keep the body around, but we will also avoid some inlining.  */
 236   if (!node->needed && !DECL_EXTERNAL (node->decl))
 237     growth -= node->global.insns;
 238
 239   node->global.estimated_growth = growth;
 240   return growth;
 241 }
 242
 243 /* Return false when inlining WHAT into TO is not good idea
 244    as it would cause too large growth of function bodies.  */
 245
 246 static bool
 247 cgraph_check_inline_limits (struct cgraph_node *to, struct cgraph_node *what,
 248                             const char **reason)
 249 {
 250   int times = 0;
 251   struct cgraph_edge *e;
 252   int newsize;
 253   int limit;
 254
 255   if (to->global.inlined_to)
 256     to = to->global.inlined_to;
 257
 258   for (e = to->callees; e; e = e->next_callee)
 259     if (e->callee == what)
 260       times++;
 261
 262   /* When inlining large function body called once into small function,
 263      take the inlined function as base for limiting the growth.  */
 264   if (to->local.self_insns > what->local.self_insns)
 265     limit = to->local.self_insns;
 266   else
 267     limit = what->local.self_insns;
 268
 269   limit += limit * PARAM_VALUE (PARAM_LARGE_FUNCTION_GROWTH) / 100;
 270
 271   newsize = cgraph_estimate_size_after_inlining (times, to, what);
 272   if (newsize > PARAM_VALUE (PARAM_LARGE_FUNCTION_INSNS)
 273       && newsize > limit)
 274     {
 275       if (reason)
 276         *reason = N_("--param large-function-growth limit reached");
 277       return false;
 278     }
 279   return true;
 280 }
 281
 282 /* Return true when function N is small enough to be inlined.  */
 283
 284 bool
 285 cgraph_default_inline_p (struct cgraph_node *n, const char **reason)
 286 {
 287   tree decl = n->decl;
 288
 289   if (n->inline_decl)
 290     decl = n->inline_decl;
 291   if (!DECL_INLINE (decl))
 292     {
 293       if (reason)
 294         *reason = N_("function not inlinable");
 295       return false;
 296     }
 297
 298   if (!DECL_STRUCT_FUNCTION (decl)->cfg)
 299     {
 300       if (reason)
 301         *reason = N_("function body not available");
 302       return false;
 303     }
 304
 305   if (DECL_DECLARED_INLINE_P (decl))
 306     {
 307       if (n->global.insns >= MAX_INLINE_INSNS_SINGLE)
 308         {
 309           if (reason)
 310             *reason = N_("--param max-inline-insns-single limit reached");
 311           return false;
 312         }
 313     }
 314   else
 315     {
 316       if (n->global.insns >= MAX_INLINE_INSNS_AUTO)
 317         {
 318           if (reason)
 319             *reason = N_("--param max-inline-insns-auto limit reached");
 320           return false;
 321         }
 322     }
 323
 324   return true;
 325 }
 326
 327 /* Return true when inlining WHAT would create recursive inlining.
 328    We call recursive inlining all cases where same function appears more than
 329    once in the single recursion nest path in the inline graph.  */
 330
 331 static bool
 332 cgraph_recursive_inlining_p (struct cgraph_node *to,
 333                              struct cgraph_node *what,
 334                              const char **reason)
 335 {
 336   bool recursive;
 337   if (to->global.inlined_to)
 338     recursive = what->decl == to->global.inlined_to->decl;
 339   else
 340     recursive = what->decl == to->decl;
 341   /* Marking recursive function inline has sane semantic and thus we should
 342      not warn on it.  */
 343   if (recursive && reason)
 344     *reason = (what->local.disregard_inline_limits
 345                ? N_("recursive inlining") : "");
 346   return recursive;
 347 }
 348
 349 /* Return true if the call can be hot.  */
 350 static bool
 351 cgraph_maybe_hot_edge_p (struct cgraph_edge *edge)
 352 {
 353   if (profile_info && flag_branch_probabilities
 354       && (edge->count
 355           <= profile_info->sum_max / PARAM_VALUE (HOT_BB_COUNT_FRACTION)))
 356     return false;
 357   return true;
 358 }
 359
 360 /* A cost model driving the inlining heuristics in a way so the edges with
 361    smallest badness are inlined first.  After each inlining is performed
 362    the costs of all caller edges of nodes affected are recomputed so the
 363    metrics may accurately depend on values such as number of inlinable callers
 364    of the function or function body size.
 365
 366    With profiling we use number of executions of each edge to drive the cost.
 367    We also should distinguish hot and cold calls where the cold calls are
 368    inlined into only when code size is overall improved.
 369    */
 370
 371 static int
 372 cgraph_edge_badness (struct cgraph_edge *edge)
 373 {
 374   if (max_count)
 375     {
 376       int growth =
 377         cgraph_estimate_size_after_inlining (1, edge->caller, edge->callee);
 378       growth -= edge->caller->global.insns;
 379
 380       /* Always prefer inlining saving code size.  */
 381       if (growth <= 0)
 382         return INT_MIN - growth;
 383       return ((int)((double)edge->count * INT_MIN / max_count)) / growth;
 384     }
 385   else
 386   {
 387     int nest = MIN (edge->loop_nest, 8);
 388     int badness = cgraph_estimate_growth (edge->callee) * 256;
 389
 390     /* Decrease badness if call is nested.  */
 391     if (badness > 0)
 392       badness >>= nest;
 393     else
 394       badness <<= nest;
 395
 396     /* Make recursive inlining happen always after other inlining is done.  */
 397     if (cgraph_recursive_inlining_p (edge->caller, edge->callee, NULL))
 398       return badness + 1;
 399     else
 400       return badness;
 401   }
 402 }
 403
 404 /* Recompute heap nodes for each of caller edge.  */
 405
 406 static void
 407 update_caller_keys (fibheap_t heap, struct cgraph_node *node,
 408                     bitmap updated_nodes)
 409 {
 410   struct cgraph_edge *edge;
 411
 412   if (!node->local.inlinable || node->local.disregard_inline_limits
 413       || node->global.inlined_to)
 414     return;
 415   if (bitmap_bit_p (updated_nodes, node->uid))
 416     return;
 417   bitmap_set_bit (updated_nodes, node->uid);
 418   node->global.estimated_growth = INT_MIN;
 419
 420   for (edge = node->callers; edge; edge = edge->next_caller)
 421     if (edge->inline_failed)
 422       {
 423         int badness = cgraph_edge_badness (edge);
 424         if (edge->aux)
 425           {
 426             fibnode_t n = edge->aux;
 427             gcc_assert (n->data == edge);
 428             if (n->key == badness)
 429               continue;
 430
 431             /* fibheap_replace_key only increase the keys.  */
 432             if (fibheap_replace_key (heap, n, badness))
 433               continue;
 434             fibheap_delete_node (heap, edge->aux);
 435           }
 436         edge->aux = fibheap_insert (heap, badness, edge);
 437       }
 438 }
 439
 440 /* Recompute heap nodes for each of caller edges of each of callees.  */
 441
 442 static void
 443 update_callee_keys (fibheap_t heap, struct cgraph_node *node,
 444                     bitmap updated_nodes)
 445 {
 446   struct cgraph_edge *e;
 447   node->global.estimated_growth = INT_MIN;
 448
 449   for (e = node->callees; e; e = e->next_callee)
 450     if (e->inline_failed)
 451       update_caller_keys (heap, e->callee, updated_nodes);
 452     else if (!e->inline_failed)
 453       update_callee_keys (heap, e->callee, updated_nodes);
 454 }
 455
 456 /* Enqueue all recursive calls from NODE into priority queue depending on
 457    how likely we want to recursively inline the call.  */
 458
 459 static void
 460 lookup_recursive_calls (struct cgraph_node *node, struct cgraph_node *where,
 461                         fibheap_t heap)
 462 {
 463   static int priority;
 464   struct cgraph_edge *e;
 465   for (e = where->callees; e; e = e->next_callee)
 466     if (e->callee == node)
 467       {
 468         /* When profile feedback is available, prioritize by expected number
 469            of calls.  Without profile feedback we maintain simple queue
 470            to order candidates via recursive depths.  */
 471         fibheap_insert (heap,
 472                         !max_count ? priority++
 473                         : -(e->count / ((max_count + (1<<24) - 1) / (1<<24))),
 474                         e);
 475       }
 476   for (e = where->callees; e; e = e->next_callee)
 477     if (!e->inline_failed)
 478       lookup_recursive_calls (node, e->callee, heap);
 479 }
 480
 481 /* Find callgraph nodes closing a circle in the graph.  The
 482    resulting hashtab can be used to avoid walking the circles.
 483    Uses the cgraph nodes ->aux field which needs to be zero
 484    before and will be zero after operation.  */
 485
 486 static void
 487 cgraph_find_cycles (struct cgraph_node *node, htab_t cycles)
 488 {
 489   struct cgraph_edge *e;
 490
 491   if (node->aux)
 492     {
 493       void **slot;
 494       slot = htab_find_slot (cycles, node, INSERT);
 495       if (!*slot)
 496         {
 497           if (dump_file)
 498             fprintf (dump_file, "Cycle contains %s\n", cgraph_node_name (node));
 499           *slot = node;
 500         }
 501       return;
 502     }
 503
 504   node->aux = node;
 505   for (e = node->callees; e; e = e->next_callee)
 506     cgraph_find_cycles (e->callee, cycles);
 507   node->aux = 0;
 508 }
 509
 510
 511 static void
 512 cgraph_apply_inline_plan (void)
 513 {
 514   struct cgraph_node *node;
 515   struct cgraph_node **order =
 516     xcalloc (cgraph_n_nodes, sizeof (struct cgraph_node *));
 517   int order_pos = 0, new_order_pos = 0;
 518   int i;
 519
 520   timevar_push (TV_INTEGRATION);
 521   order_pos = cgraph_postorder (order);
 522   gcc_assert (order_pos == cgraph_n_nodes);
 523
 524   /* Garbage collector may remove inline clones we eliminate during
 525      optimization.  So we must be sure to not reference them.  */
 526   for (i = 0; i < order_pos; i++)
 527     if (!order[i]->global.inlined_to)
 528       order[new_order_pos++] = order[i];
 529
 530   /* Initialize the default bitmap obstack.  */
 531   bitmap_obstack_initialize (NULL);
 532
 533
 534   for (i = 0; i < new_order_pos; i++)
 535     {
 536       struct cgraph_edge *e;
 537
 538       node = order[i];
 539       for (e = node->callees; e; e = e->next_callee)
 540         if (!e->inline_failed || warn_inline)
 541           break;
 542       if (e)
 543         {
 544           if (cgraph_preserve_function_body_p (node->decl, true))
 545             save_inline_function_body (node);
 546           push_cfun (DECL_STRUCT_FUNCTION (node->decl));
 547           tree_register_cfg_hooks ();
 548           current_function_decl = node->decl;
 549           optimize_inline_calls (node->decl, false);
 550           free_dominance_info (CDI_DOMINATORS);
 551           free_dominance_info (CDI_POST_DOMINATORS);
 552           node->local.self_insns = node->global.insns;
 553           pop_cfun ();
 554           ggc_collect ();
 555         }
 556     }
 557   free (order);
 558   timevar_pop (TV_INTEGRATION);
 559 }
 560
 561 /* Leafify the cgraph node.  We have to be careful in recursing
 562    as to not run endlessly in circles of the callgraph.
 563    We do so by using a hashtab of cycle entering nodes as generated
 564    by cgraph_find_cycles.  */
 565
 566 static void
 567 cgraph_flatten_node (struct cgraph_node *node, htab_t cycles)
 568 {
 569   struct cgraph_edge *e;
 570
 571   for (e = node->callees; e; e = e->next_callee)
 572     {
 573       /* Inline call, if possible, and recurse.  Be sure we are not
 574          entering callgraph circles here.  */
 575       if (e->inline_failed
 576           && e->callee->local.inlinable
 577           && !cgraph_recursive_inlining_p (node, e->callee,
 578                                            &e->inline_failed)
 579           && !htab_find (cycles, e->callee))
 580         {
 581           if (dump_file)
 582             fprintf (dump_file, " inlining %s", cgraph_node_name (e->callee));
 583           cgraph_mark_inline_edge (e, true);
 584           cgraph_flatten_node (e->callee, cycles);
 585         }
 586       else if (dump_file)
 587         fprintf (dump_file, " !inlining %s", cgraph_node_name (e->callee));
 588     }
 589 }
 590
 591 /* Decide on recursive inlining: in the case function has recursive calls,
 592    inline until body size reaches given argument.  */
 593
 594 static bool
 595 cgraph_decide_recursive_inlining (struct cgraph_node *node)
 596 {
 597   int limit = PARAM_VALUE (PARAM_MAX_INLINE_INSNS_RECURSIVE_AUTO);
 598   int max_depth = PARAM_VALUE (PARAM_MAX_INLINE_RECURSIVE_DEPTH_AUTO);
 599   int probability = PARAM_VALUE (PARAM_MIN_INLINE_RECURSIVE_PROBABILITY);
 600   fibheap_t heap;
 601   struct cgraph_edge *e;
 602   struct cgraph_node *master_clone;
 603   int depth = 0;
 604   int n = 0;
 605
 606   if (DECL_DECLARED_INLINE_P (node->decl))
 607     {
 608       limit = PARAM_VALUE (PARAM_MAX_INLINE_INSNS_RECURSIVE);
 609       max_depth = PARAM_VALUE (PARAM_MAX_INLINE_RECURSIVE_DEPTH);
 610     }
 611
 612   /* Make sure that function is small enough to be considered for inlining.  */
 613   if (!max_depth
 614       || cgraph_estimate_size_after_inlining (1, node, node)  >= limit)
 615     return false;
 616   heap = fibheap_new ();
 617   lookup_recursive_calls (node, node, heap);
 618   if (fibheap_empty (heap))
 619     {
 620       fibheap_delete (heap);
 621       return false;
 622     }
 623
 624   if (dump_file)
 625     fprintf (dump_file,
 626              "  Performing recursive inlining on %s\n",
 627              cgraph_node_name (node));
 628
 629   /* We need original clone to copy around.  */
 630   master_clone = cgraph_clone_node (node, node->count, 1, false);
 631   master_clone->needed = true;
 632   for (e = master_clone->callees; e; e = e->next_callee)
 633     if (!e->inline_failed)
 634       cgraph_clone_inlined_nodes (e, true, false);
 635
 636   /* Do the inlining and update list of recursive call during process.  */
 637   while (!fibheap_empty (heap)
 638          && (cgraph_estimate_size_after_inlining (1, node, master_clone)
 639              <= limit))
 640     {
 641       struct cgraph_edge *curr = fibheap_extract_min (heap);
 642       struct cgraph_node *cnode;
 643
 644       depth = 1;
 645       for (cnode = curr->caller;
 646            cnode->global.inlined_to; cnode = cnode->callers->caller)
 647         if (node->decl == curr->callee->decl)
 648           depth++;
 649       if (depth > max_depth)
 650         {
 651           if (dump_file)
 652             fprintf (dump_file,
 653                      "   maxmal depth reached\n");
 654           continue;
 655         }
 656
 657       if (max_count)
 658         {
 659           if (!cgraph_maybe_hot_edge_p (curr))
 660             {
 661               if (dump_file)
 662                 fprintf (dump_file, "   Not inlining cold call\n");
 663               continue;
 664             }
 665           if (curr->count * 100 / node->count < probability)
 666             {
 667               if (dump_file)
 668                 fprintf (dump_file,
 669                          "   Probability of edge is too small\n");
 670               continue;
 671             }
 672         }
 673
 674       if (dump_file)
 675         {
 676           fprintf (dump_file,
 677                    "   Inlining call of depth %i", depth);
 678           if (node->count)
 679             {
 680               fprintf (dump_file, " called approx. %.2f times per call",
 681                        (double)curr->count / node->count);
 682             }
 683           fprintf (dump_file, "\n");
 684         }
 685       cgraph_redirect_edge_callee (curr, master_clone);
 686       cgraph_mark_inline_edge (curr, false);
 687       lookup_recursive_calls (node, curr->callee, heap);
 688       n++;
 689     }
 690   if (!fibheap_empty (heap) && dump_file)
 691     fprintf (dump_file, "    Recursive inlining growth limit met.\n");
 692
 693   fibheap_delete (heap);
 694   if (dump_file)
 695     fprintf (dump_file,
 696              "\n   Inlined %i times, body grown from %i to %i insns\n", n,
 697              master_clone->global.insns, node->global.insns);
 698
 699   /* Remove master clone we used for inlining.  We rely that clones inlined
 700      into master clone gets queued just before master clone so we don't
 701      need recursion.  */
 702   for (node = cgraph_nodes; node != master_clone;
 703        node = node->next)
 704     if (node->global.inlined_to == master_clone)
 705       cgraph_remove_node (node);
 706   cgraph_remove_node (master_clone);
 707   /* FIXME: Recursive inlining actually reduces number of calls of the
 708      function.  At this place we should probably walk the function and
 709      inline clones and compensate the counts accordingly.  This probably
 710      doesn't matter much in practice.  */
 711   return n > 0;
 712 }
 713
 714 /* Set inline_failed for all callers of given function to REASON.  */
 715
 716 static void
 717 cgraph_set_inline_failed (struct cgraph_node *node, const char *reason)
 718 {
 719   struct cgraph_edge *e;
 720
 721   if (dump_file)
 722     fprintf (dump_file, "Inlining failed: %s\n", reason);
 723   for (e = node->callers; e; e = e->next_caller)
 724     if (e->inline_failed)
 725       e->inline_failed = reason;
 726 }
 727
 728 /* We use greedy algorithm for inlining of small functions:
 729    All inline candidates are put into prioritized heap based on estimated
 730    growth of the overall number of instructions and then update the estimates.
 731
 732    INLINED and INLINED_CALEES are just pointers to arrays large enough
 733    to be passed to cgraph_inlined_into and cgraph_inlined_callees.  */
 734
 735 static void
 736 cgraph_decide_inlining_of_small_functions (void)
 737 {
 738   struct cgraph_node *node;
 739   struct cgraph_edge *edge;
 740   const char *failed_reason;
 741   fibheap_t heap = fibheap_new ();
 742   bitmap updated_nodes = BITMAP_ALLOC (NULL);
 743
 744   if (dump_file)
 745     fprintf (dump_file, "\nDeciding on smaller functions:\n");
 746
 747   /* Put all inline candidates into the heap.  */
 748
 749   for (node = cgraph_nodes; node; node = node->next)
 750     {
 751       if (!node->local.inlinable || !node->callers
 752           || node->local.disregard_inline_limits)
 753         continue;
 754       if (dump_file)
 755         fprintf (dump_file, "Considering inline candidate %s.\n", cgraph_node_name (node));
 756
 757       node->global.estimated_growth = INT_MIN;
 758       if (!cgraph_default_inline_p (node, &failed_reason))
 759         {
 760           cgraph_set_inline_failed (node, failed_reason);
 761           continue;
 762         }
 763
 764       for (edge = node->callers; edge; edge = edge->next_caller)
 765         if (edge->inline_failed)
 766           {
 767             gcc_assert (!edge->aux);
 768             edge->aux = fibheap_insert (heap, cgraph_edge_badness (edge), edge);
 769           }
 770     }
 771   while (overall_insns <= max_insns && (edge = fibheap_extract_min (heap)))
 772     {
 773       int old_insns = overall_insns;
 774       struct cgraph_node *where;
 775       int growth =
 776         cgraph_estimate_size_after_inlining (1, edge->caller, edge->callee);
 777
 778       growth -= edge->caller->global.insns;
 779
 780       if (dump_file)
 781         {
 782           fprintf (dump_file,
 783                    "\nConsidering %s with %i insns\n",
 784                    cgraph_node_name (edge->callee),
 785                    edge->callee->global.insns);
 786           fprintf (dump_file,
 787                    " to be inlined into %s\n"
 788                    " Estimated growth after inlined into all callees is %+i insns.\n"
 789                    " Estimated badness is %i.\n",
 790                    cgraph_node_name (edge->caller),
 791                    cgraph_estimate_growth (edge->callee),
 792                    cgraph_edge_badness (edge));
 793           if (edge->count)
 794             fprintf (dump_file," Called "HOST_WIDEST_INT_PRINT_DEC"x\n", edge->count);
 795         }
 796       gcc_assert (edge->aux);
 797       edge->aux = NULL;
 798       if (!edge->inline_failed)
 799         continue;
 800
 801       /* When not having profile info ready we don't weight by any way the
 802          position of call in procedure itself.  This means if call of
 803          function A from function B seems profitable to inline, the recursive
 804          call of function A in inline copy of A in B will look profitable too
 805          and we end up inlining until reaching maximal function growth.  This
 806          is not good idea so prohibit the recursive inlining.
 807
 808          ??? When the frequencies are taken into account we might not need this
 809          restriction.   */
 810       if (!max_count)
 811         {
 812           where = edge->caller;
 813           while (where->global.inlined_to)
 814             {
 815               if (where->decl == edge->callee->decl)
 816                 break;
 817               where = where->callers->caller;
 818             }
 819           if (where->global.inlined_to)
 820             {
 821               edge->inline_failed
 822                 = (edge->callee->local.disregard_inline_limits ? N_("recursive inlining") : "");
 823               if (dump_file)
 824                 fprintf (dump_file, " inline_failed:Recursive inlining performed only for function itself.\n");
 825               continue;
 826             }
 827         }
 828
 829       if (!cgraph_maybe_hot_edge_p (edge) && growth > 0)
 830         {
 831           if (!cgraph_recursive_inlining_p (edge->caller, edge->callee,
 832                                             &edge->inline_failed))
 833             {
 834               edge->inline_failed =
 835                 N_("call is unlikely");
 836               if (dump_file)
 837                 fprintf (dump_file, " inline_failed:%s.\n", edge->inline_failed);
 838             }
 839           continue;
 840         }
 841       if (!cgraph_default_inline_p (edge->callee, &edge->inline_failed))
 842         {
 843           if (!cgraph_recursive_inlining_p (edge->caller, edge->callee,
 844                                             &edge->inline_failed))
 845             {
 846               if (dump_file)
 847                 fprintf (dump_file, " inline_failed:%s.\n", edge->inline_failed);
 848             }
 849           continue;
 850         }
 851       if (cgraph_recursive_inlining_p (edge->caller, edge->callee,
 852                                        &edge->inline_failed))
 853         {
 854           where = edge->caller;
 855           if (where->global.inlined_to)
 856             where = where->global.inlined_to;
 857           if (!cgraph_decide_recursive_inlining (where))
 858             continue;
 859           update_callee_keys (heap, where, updated_nodes);
 860         }
 861       else
 862         {
 863           struct cgraph_node *callee;
 864           if (!cgraph_check_inline_limits (edge->caller, edge->callee,
 865                                            &edge->inline_failed))
 866             {
 867               if (dump_file)
 868                 fprintf (dump_file, " Not inlining into %s:%s.\n",
 869                          cgraph_node_name (edge->caller), edge->inline_failed);
 870               continue;
 871             }
 872           callee = edge->callee;
 873           cgraph_mark_inline_edge (edge, true);
 874           update_callee_keys (heap, callee, updated_nodes);
 875         }
 876       where = edge->caller;
 877       if (where->global.inlined_to)
 878         where = where->global.inlined_to;
 879
 880       /* Our profitability metric can depend on local properties
 881          such as number of inlinable calls and size of the function body.
 882          After inlining these properties might change for the function we
 883          inlined into (since it's body size changed) and for the functions
 884          called by function we inlined (since number of it inlinable callers
 885          might change).  */
 886       update_caller_keys (heap, where, updated_nodes);
 887       bitmap_clear (updated_nodes);
 888
 889       if (dump_file)
 890         {
 891           fprintf (dump_file,
 892                    " Inlined into %s which now has %i insns,"
 893                    "net change of %+i insns.\n",
 894                    cgraph_node_name (edge->caller),
 895                    edge->caller->global.insns,
 896                    overall_insns - old_insns);
 897         }
 898     }
 899   while ((edge = fibheap_extract_min (heap)) != NULL)
 900     {
 901       gcc_assert (edge->aux);
 902       edge->aux = NULL;
 903       if (!edge->callee->local.disregard_inline_limits && edge->inline_failed
 904           && !cgraph_recursive_inlining_p (edge->caller, edge->callee,
 905                                            &edge->inline_failed))
 906         edge->inline_failed = N_("--param inline-unit-growth limit reached");
 907     }
 908   fibheap_delete (heap);
 909   BITMAP_FREE (updated_nodes);
 910 }
 911
 912 /* Decide on the inlining.  We do so in the topological order to avoid
 913    expenses on updating data structures.  */
 914
 915 static void
 916 cgraph_decide_inlining (void)
 917 {
 918   struct cgraph_node *node;
 919   int nnodes;
 920   struct cgraph_node **order =
 921     xcalloc (cgraph_n_nodes, sizeof (struct cgraph_node *));
 922   int old_insns = 0;
 923   int i;
 924
 925   timevar_push (TV_INLINE_HEURISTICS);
 926   max_count = 0;
 927   for (node = cgraph_nodes; node; node = node->next)
 928     {
 929       struct cgraph_edge *e;
 930       initial_insns += node->local.self_insns;
 931       for (e = node->callees; e; e = e->next_callee)
 932         if (max_count < e->count)
 933           max_count = e->count;
 934     }
 935   overall_insns = initial_insns;
 936   gcc_assert (!max_count || (profile_info && flag_branch_probabilities));
 937
 938   max_insns = overall_insns;
 939   if (max_insns < PARAM_VALUE (PARAM_LARGE_UNIT_INSNS))
 940     max_insns = PARAM_VALUE (PARAM_LARGE_UNIT_INSNS);
 941
 942   max_insns = ((HOST_WIDEST_INT) max_insns
 943                * (100 + PARAM_VALUE (PARAM_INLINE_UNIT_GROWTH)) / 100);
 944
 945   nnodes = cgraph_postorder (order);
 946
 947   if (dump_file)
 948     fprintf (dump_file,
 949              "\nDeciding on inlining.  Starting with %i insns.\n",
 950              initial_insns);
 951
 952   for (node = cgraph_nodes; node; node = node->next)
 953     node->aux = 0;
 954
 955   if (dump_file)
 956     fprintf (dump_file, "\nInlining always_inline functions:\n");
 957
 958   /* In the first pass mark all always_inline edges.  Do this with a priority
 959      so none of our later choices will make this impossible.  */
 960   for (i = nnodes - 1; i >= 0; i--)
 961     {
 962       struct cgraph_edge *e, *next;
 963
 964       node = order[i];
 965
 966       /* Handle nodes to be flattened, but don't update overall unit size.  */
 967       if (lookup_attribute ("flatten", DECL_ATTRIBUTES (node->decl)) != NULL)
 968         {
 969           int old_overall_insns = overall_insns;
 970           htab_t cycles;
 971           if (dump_file)
 972             fprintf (dump_file,
 973                      "Leafifying %s\n", cgraph_node_name (node));
 974           cycles = htab_create (7, htab_hash_pointer, htab_eq_pointer, NULL);
 975           cgraph_find_cycles (node, cycles);
 976           cgraph_flatten_node (node, cycles);
 977           htab_delete (cycles);
 978           overall_insns = old_overall_insns;
 979           /* We don't need to consider always_inline functions inside the flattened
 980              function anymore.  */
 981           continue;
 982         }
 983
 984       if (!node->local.disregard_inline_limits)
 985         continue;
 986       if (dump_file)
 987         fprintf (dump_file,
 988                  "\nConsidering %s %i insns (always inline)\n",
 989                  cgraph_node_name (node), node->global.insns);
 990       old_insns = overall_insns;
 991       for (e = node->callers; e; e = next)
 992         {
 993           next = e->next_caller;
 994           if (!e->inline_failed)
 995             continue;
 996           if (cgraph_recursive_inlining_p (e->caller, e->callee,
 997                                            &e->inline_failed))
 998             continue;
 999           cgraph_mark_inline_edge (e, true);
1000           if (dump_file)
1001             fprintf (dump_file,
1002                      " Inlined into %s which now has %i insns.\n",
1003                      cgraph_node_name (e->caller),
1004                      e->caller->global.insns);
1005         }
1006       if (dump_file)
1007         fprintf (dump_file,
1008                  " Inlined for a net change of %+i insns.\n",
1009                  overall_insns - old_insns);
1010     }
1011
1012   if (!flag_really_no_inline)
1013     cgraph_decide_inlining_of_small_functions ();
1014
1015   if (!flag_really_no_inline
1016       && flag_inline_functions_called_once)
1017     {
1018       if (dump_file)
1019         fprintf (dump_file, "\nDeciding on functions called once:\n");
1020
1021       /* And finally decide what functions are called once.  */
1022
1023       for (i = nnodes - 1; i >= 0; i--)
1024         {
1025           node = order[i];
1026
1027           if (node->callers && !node->callers->next_caller && !node->needed
1028               && node->local.inlinable && node->callers->inline_failed
1029               && !DECL_EXTERNAL (node->decl) && !DECL_COMDAT (node->decl))
1030             {
1031               bool ok = true;
1032               struct cgraph_node *node1;
1033
1034               /* Verify that we won't duplicate the caller.  */
1035               for (node1 = node->callers->caller;
1036                    node1->callers && !node1->callers->inline_failed
1037                    && ok; node1 = node1->callers->caller)
1038                 if (node1->callers->next_caller || node1->needed)
1039                   ok = false;
1040               if (ok)
1041                 {
1042                   if (dump_file)
1043                     {
1044                       fprintf (dump_file,
1045                                "\nConsidering %s %i insns.\n",
1046                                cgraph_node_name (node), node->global.insns);
1047                       fprintf (dump_file,
1048                                " Called once from %s %i insns.\n",
1049                                cgraph_node_name (node->callers->caller),
1050                                node->callers->caller->global.insns);
1051                     }
1052
1053                   old_insns = overall_insns;
1054
1055                   if (cgraph_check_inline_limits (node->callers->caller, node,
1056                                                   NULL))
1057                     {
1058                       cgraph_mark_inline (node->callers);
1059                       if (dump_file)
1060                         fprintf (dump_file,
1061                                  " Inlined into %s which now has %i insns"
1062                                  " for a net change of %+i insns.\n",
1063                                  cgraph_node_name (node->callers->caller),
1064                                  node->callers->caller->global.insns,
1065                                  overall_insns - old_insns);
1066                     }
1067                   else
1068                     {
1069                       if (dump_file)
1070                         fprintf (dump_file,
1071                                  " Inline limit reached, not inlined.\n");
1072                     }
1073                 }
1074             }
1075         }
1076     }
1077
1078   cgraph_remove_unreachable_nodes (false, dump_file);
1079   cgraph_apply_inline_plan ();
1080   cgraph_remove_unreachable_nodes (false, dump_file);
1081
1082   if (dump_file)
1083     fprintf (dump_file,
1084              "\nInlined %i calls, eliminated %i functions, "
1085              "%i insns turned to %i insns.\n\n",
1086              ncalls_inlined, nfunctions_inlined, initial_insns,
1087              overall_insns);
1088   free (order);
1089   timevar_pop (TV_INLINE_HEURISTICS);
1090 }
1091
1092 /* Decide on the inlining.  We do so in the topological order to avoid
1093    expenses on updating data structures.  */
1094
1095 bool
1096 cgraph_decide_inlining_incrementally (struct cgraph_node *node, bool early)
1097 {
1098   struct cgraph_edge *e;
1099   bool inlined = false;
1100   const char *failed_reason;
1101
1102   /* First of all look for always inline functions.  */
1103   for (e = node->callees; e; e = e->next_callee)
1104     if (e->callee->local.disregard_inline_limits
1105         && e->inline_failed
1106         && !cgraph_recursive_inlining_p (node, e->callee, &e->inline_failed)
1107         /* ??? It is possible that renaming variable removed the function body
1108            in duplicate_decls. See gcc.c-torture/compile/20011119-2.c  */
1109         && (DECL_SAVED_TREE (e->callee->decl) || e->callee->inline_decl))
1110       {
1111         if (dump_file && early)
1112           {
1113             fprintf (dump_file, "  Early inlining %s",
1114                      cgraph_node_name (e->callee));
1115             fprintf (dump_file, " into %s\n", cgraph_node_name (node));
1116           }
1117         cgraph_mark_inline (e);
1118         inlined = true;
1119       }
1120
1121   /* Now do the automatic inlining.  */
1122   if (!flag_really_no_inline)
1123     for (e = node->callees; e; e = e->next_callee)
1124       if (e->callee->local.inlinable
1125           && e->inline_failed
1126           && !e->callee->local.disregard_inline_limits
1127           && !cgraph_recursive_inlining_p (node, e->callee, &e->inline_failed)
1128           && (!early
1129               || (cgraph_estimate_size_after_inlining (1, e->caller, node)
1130                   <= e->caller->global.insns))
1131           && cgraph_check_inline_limits (node, e->callee, &e->inline_failed)
1132           && (DECL_SAVED_TREE (e->callee->decl) || e->callee->inline_decl))
1133         {
1134           if (cgraph_default_inline_p (e->callee, &failed_reason))
1135             {
1136               if (dump_file && early)
1137                 {
1138                   fprintf (dump_file, "  Early inlining %s",
1139                            cgraph_node_name (e->callee));
1140                   fprintf (dump_file, " into %s\n", cgraph_node_name (node));
1141                 }
1142               cgraph_mark_inline (e);
1143               inlined = true;
1144             }
1145           else if (!early)
1146             e->inline_failed = failed_reason;
1147         }
1148   if (inlined || (warn_inline && !early))
1149     {
1150       /* Initialize the default bitmap obstack.  */
1151       bitmap_obstack_initialize (NULL);
1152       push_cfun (DECL_STRUCT_FUNCTION (node->decl));
1153       tree_register_cfg_hooks ();
1154       current_function_decl = node->decl;
1155       optimize_inline_calls (current_function_decl, early);
1156       free_dominance_info (CDI_DOMINATORS);
1157       free_dominance_info (CDI_POST_DOMINATORS);
1158       node->local.self_insns = node->global.insns;
1159       current_function_decl = NULL;
1160       pop_cfun ();
1161     }
1162   return inlined;
1163 }
1164
1165 /* When inlining shall be performed.  */
1166 static bool
1167 cgraph_gate_inlining (void)
1168 {
1169   return flag_inline_trees /*&& 0*/;
1170 }
1171
1172 struct tree_opt_pass pass_ipa_inline =
1173 {
1174   "inline",                             /* name */
1175   cgraph_gate_inlining,                 /* gate */
1176   cgraph_decide_inlining,               /* execute */
1177   NULL,                                 /* sub */
1178   NULL,                                 /* next */
1179   0,                                    /* static_pass_number */
1180   TV_INTEGRATION,                       /* tv_id */
1181   0,                                    /* properties_required */
1182   PROP_cfg,                             /* properties_provided */
1183   0,                                    /* properties_destroyed */
1184   0,                                    /* todo_flags_start */
1185   TODO_dump_cgraph | TODO_dump_func,    /* todo_flags_finish */
1186   0                                     /* letter */
1187 };
1188
1189 /* Do inlining of small functions.  Doing so early helps profiling and other
1190    passes to be somewhat more effective and avoids some code duplication in
1191    later real inlining pass for testcases with very many function calls.  */
1192 static void
1193 cgraph_early_inlining (void)
1194 {
1195   struct cgraph_node *node;
1196   int nnodes;
1197   struct cgraph_node **order =
1198     xcalloc (cgraph_n_nodes, sizeof (struct cgraph_node *));
1199   int i;
1200
1201   if (sorrycount || errorcount)
1202     return;
1203 #ifdef ENABLE_CHECKING
1204   for (node = cgraph_nodes; node; node = node->next)
1205     gcc_assert (!node->aux);
1206 #endif
1207
1208   nnodes = cgraph_postorder (order);
1209   for (i = nnodes - 1; i >= 0; i--)
1210     {
1211       node = order[i];
1212       if (node->analyzed && node->local.inlinable
1213           && (node->needed || node->reachable)
1214           && node->callers)
1215         cgraph_decide_inlining_incrementally (node, true);
1216     }
1217   cgraph_remove_unreachable_nodes (true, dump_file);
1218 #ifdef ENABLE_CHECKING
1219   for (node = cgraph_nodes; node; node = node->next)
1220     gcc_assert (!node->global.inlined_to);
1221 #endif
1222   free (order);
1223 }
1224
1225 /* When inlining shall be performed.  */
1226 static bool
1227 cgraph_gate_early_inlining (void)
1228 {
1229   return flag_inline_trees && flag_early_inlining;
1230 }
1231
1232 struct tree_opt_pass pass_early_ipa_inline =
1233 {
1234   "einline",                            /* name */
1235   cgraph_gate_early_inlining,           /* gate */
1236   cgraph_early_inlining,                /* execute */
1237   NULL,                                 /* sub */
1238   NULL,                                 /* next */
1239   0,                                    /* static_pass_number */
1240   TV_INTEGRATION,                       /* tv_id */
1241   0,                                    /* properties_required */
1242   PROP_cfg,                             /* properties_provided */
1243   0,                                    /* properties_destroyed */
1244   0,                                    /* todo_flags_start */
1245   TODO_dump_cgraph | TODO_dump_func,    /* todo_flags_finish */
1246   0                                     /* letter */
1247 };