gcc/ipa-inline-analysis.c

   1 /* Inlining decision heuristics.
   2    Copyright (C) 2003-2015 Free Software Foundation, Inc.
   3    Contributed by Jan Hubicka
   4
   5 This file is part of GCC.
   6
   7 GCC is free software; you can redistribute it and/or modify it under
   8 the terms of the GNU General Public License as published by the Free
   9 Software Foundation; either version 3, or (at your option) any later
  10 version.
  11
  12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  14 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  15 for more details.
  16
  17 You should have received a copy of the GNU General Public License
  18 along with GCC; see the file COPYING3.  If not see
  19 <http://www.gnu.org/licenses/>.  */
  20
  21 /* Analysis used by the inliner and other passes limiting code size growth.
  22
  23    We estimate for each function
  24      - function body size
  25      - average function execution time
  26      - inlining size benefit (that is how much of function body size
  27        and its call sequence is expected to disappear by inlining)
  28      - inlining time benefit
  29      - function frame size
  30    For each call
  31      - call statement size and time
  32
  33    inlinie_summary datastructures store above information locally (i.e.
  34    parameters of the function itself) and globally (i.e. parameters of
  35    the function created by applying all the inline decisions already
  36    present in the callgraph).
  37
  38    We provide accestor to the inline_summary datastructure and
  39    basic logic updating the parameters when inlining is performed.
  40
  41    The summaries are context sensitive.  Context means
  42      1) partial assignment of known constant values of operands
  43      2) whether function is inlined into the call or not.
  44    It is easy to add more variants.  To represent function size and time
  45    that depends on context (i.e. it is known to be optimized away when
  46    context is known either by inlining or from IP-CP and clonning),
  47    we use predicates. Predicates are logical formulas in
  48    conjunctive-disjunctive form consisting of clauses. Clauses are bitmaps
  49    specifying what conditions must be true. Conditions are simple test
  50    of the form described above.
  51
  52    In order to make predicate (possibly) true, all of its clauses must
  53    be (possibly) true. To make clause (possibly) true, one of conditions
  54    it mentions must be (possibly) true.  There are fixed bounds on
  55    number of clauses and conditions and all the manipulation functions
  56    are conservative in positive direction. I.e. we may lose precision
  57    by thinking that predicate may be true even when it is not.
  58
  59    estimate_edge_size and estimate_edge_growth can be used to query
  60    function size/time in the given context.  inline_merge_summary merges
  61    properties of caller and callee after inlining.
  62
  63    Finally pass_inline_parameters is exported.  This is used to drive
  64    computation of function parameters used by the early inliner. IPA
  65    inlined performs analysis via its analyze_function method. */
  66
  67 #include "config.h"
  68 #include "system.h"
  69 #include "coretypes.h"
  70 #include "backend.h"
  71 #include "tree.h"
  72 #include "gimple.h"
  73 #include "alloc-pool.h"
  74 #include "tree-pass.h"
  75 #include "ssa.h"
  76 #include "tree-streamer.h"
  77 #include "cgraph.h"
  78 #include "diagnostic.h"
  79 #include "fold-const.h"
  80 #include "print-tree.h"
  81 #include "tree-inline.h"
  82 #include "gimple-pretty-print.h"
  83 #include "params.h"
  84 #include "cfganal.h"
  85 #include "gimple-iterator.h"
  86 #include "tree-cfg.h"
  87 #include "tree-ssa-loop-niter.h"
  88 #include "tree-ssa-loop.h"
  89 #include "symbol-summary.h"
  90 #include "ipa-prop.h"
  91 #include "ipa-inline.h"
  92 #include "cfgloop.h"
  93 #include "tree-scalar-evolution.h"
  94 #include "ipa-utils.h"
  95 #include "cilk.h"
  96 #include "cfgexpand.h"
  97
  98 /* Estimate runtime of function can easilly run into huge numbers with many
  99    nested loops.  Be sure we can compute time * INLINE_SIZE_SCALE * 2 in an
 100    integer.  For anything larger we use gcov_type.  */
 101 #define MAX_TIME 500000
 102
 103 /* Number of bits in integer, but we really want to be stable across different
 104    hosts.  */
 105 #define NUM_CONDITIONS 32
 106
 107 enum predicate_conditions
 108 {
 109   predicate_false_condition = 0,
 110   predicate_not_inlined_condition = 1,
 111   predicate_first_dynamic_condition = 2
 112 };
 113
 114 /* Special condition code we use to represent test that operand is compile time
 115    constant.  */
 116 #define IS_NOT_CONSTANT ERROR_MARK
 117 /* Special condition code we use to represent test that operand is not changed
 118    across invocation of the function.  When operand IS_NOT_CONSTANT it is always
 119    CHANGED, however i.e. loop invariants can be NOT_CHANGED given percentage
 120    of executions even when they are not compile time constants.  */
 121 #define CHANGED IDENTIFIER_NODE
 122
 123 /* Holders of ipa cgraph hooks: */
 124 static struct cgraph_2edge_hook_list *edge_duplication_hook_holder;
 125 static struct cgraph_edge_hook_list *edge_removal_hook_holder;
 126 static void inline_edge_removal_hook (struct cgraph_edge *, void *);
 127 static void inline_edge_duplication_hook (struct cgraph_edge *,
 128                                           struct cgraph_edge *, void *);
 129
 130 /* VECtor holding inline summaries.
 131    In GGC memory because conditions might point to constant trees.  */
 132 function_summary <inline_summary *> *inline_summaries;
 133 vec<inline_edge_summary_t> inline_edge_summary_vec;
 134
 135 /* Cached node/edge growths.  */
 136 vec<edge_growth_cache_entry> edge_growth_cache;
 137
 138 /* Edge predicates goes here.  */
 139 static object_allocator<predicate> edge_predicate_pool ("edge predicates");
 140
 141 /* Return true predicate (tautology).
 142    We represent it by empty list of clauses.  */
 143
 144 static inline struct predicate
 145 true_predicate (void)
 146 {
 147   struct predicate p;
 148   p.clause[0] = 0;
 149   return p;
 150 }
 151
 152
 153 /* Return predicate testing single condition number COND.  */
 154
 155 static inline struct predicate
 156 single_cond_predicate (int cond)
 157 {
 158   struct predicate p;
 159   p.clause[0] = 1 << cond;
 160   p.clause[1] = 0;
 161   return p;
 162 }
 163
 164
 165 /* Return false predicate.  First clause require false condition.  */
 166
 167 static inline struct predicate
 168 false_predicate (void)
 169 {
 170   return single_cond_predicate (predicate_false_condition);
 171 }
 172
 173
 174 /* Return true if P is (true).  */
 175
 176 static inline bool
 177 true_predicate_p (struct predicate *p)
 178 {
 179   return !p->clause[0];
 180 }
 181
 182
 183 /* Return true if P is (false).  */
 184
 185 static inline bool
 186 false_predicate_p (struct predicate *p)
 187 {
 188   if (p->clause[0] == (1 << predicate_false_condition))
 189     {
 190       gcc_checking_assert (!p->clause[1]
 191                            && p->clause[0] == 1 << predicate_false_condition);
 192       return true;
 193     }
 194   return false;
 195 }
 196
 197
 198 /* Return predicate that is set true when function is not inlined.  */
 199
 200 static inline struct predicate
 201 not_inlined_predicate (void)
 202 {
 203   return single_cond_predicate (predicate_not_inlined_condition);
 204 }
 205
 206 /* Simple description of whether a memory load or a condition refers to a load
 207    from an aggregate and if so, how and where from in the aggregate.
 208    Individual fields have the same meaning like fields with the same name in
 209    struct condition.  */
 210
 211 struct agg_position_info
 212 {
 213   HOST_WIDE_INT offset;
 214   bool agg_contents;
 215   bool by_ref;
 216 };
 217
 218 /* Add condition to condition list CONDS.  AGGPOS describes whether the used
 219    oprand is loaded from an aggregate and where in the aggregate it is.  It can
 220    be NULL, which means this not a load from an aggregate.  */
 221
 222 static struct predicate
 223 add_condition (struct inline_summary *summary, int operand_num,
 224                struct agg_position_info *aggpos,
 225                enum tree_code code, tree val)
 226 {
 227   int i;
 228   struct condition *c;
 229   struct condition new_cond;
 230   HOST_WIDE_INT offset;
 231   bool agg_contents, by_ref;
 232
 233   if (aggpos)
 234     {
 235       offset = aggpos->offset;
 236       agg_contents = aggpos->agg_contents;
 237       by_ref = aggpos->by_ref;
 238     }
 239   else
 240     {
 241       offset = 0;
 242       agg_contents = false;
 243       by_ref = false;
 244     }
 245
 246   gcc_checking_assert (operand_num >= 0);
 247   for (i = 0; vec_safe_iterate (summary->conds, i, &c); i++)
 248     {
 249       if (c->operand_num == operand_num
 250           && c->code == code
 251           && c->val == val
 252           && c->agg_contents == agg_contents
 253           && (!agg_contents || (c->offset == offset && c->by_ref == by_ref)))
 254         return single_cond_predicate (i + predicate_first_dynamic_condition);
 255     }
 256   /* Too many conditions.  Give up and return constant true.  */
 257   if (i == NUM_CONDITIONS - predicate_first_dynamic_condition)
 258     return true_predicate ();
 259
 260   new_cond.operand_num = operand_num;
 261   new_cond.code = code;
 262   new_cond.val = val;
 263   new_cond.agg_contents = agg_contents;
 264   new_cond.by_ref = by_ref;
 265   new_cond.offset = offset;
 266   vec_safe_push (summary->conds, new_cond);
 267   return single_cond_predicate (i + predicate_first_dynamic_condition);
 268 }
 269
 270
 271 /* Add clause CLAUSE into the predicate P.  */
 272
 273 static inline void
 274 add_clause (conditions conditions, struct predicate *p, clause_t clause)
 275 {
 276   int i;
 277   int i2;
 278   int insert_here = -1;
 279   int c1, c2;
 280
 281   /* True clause.  */
 282   if (!clause)
 283     return;
 284
 285   /* False clause makes the whole predicate false.  Kill the other variants.  */
 286   if (clause == (1 << predicate_false_condition))
 287     {
 288       p->clause[0] = (1 << predicate_false_condition);
 289       p->clause[1] = 0;
 290       return;
 291     }
 292   if (false_predicate_p (p))
 293     return;
 294
 295   /* No one should be silly enough to add false into nontrivial clauses.  */
 296   gcc_checking_assert (!(clause & (1 << predicate_false_condition)));
 297
 298   /* Look where to insert the clause.  At the same time prune out
 299      clauses of P that are implied by the new clause and thus
 300      redundant.  */
 301   for (i = 0, i2 = 0; i <= MAX_CLAUSES; i++)
 302     {
 303       p->clause[i2] = p->clause[i];
 304
 305       if (!p->clause[i])
 306         break;
 307
 308       /* If p->clause[i] implies clause, there is nothing to add.  */
 309       if ((p->clause[i] & clause) == p->clause[i])
 310         {
 311           /* We had nothing to add, none of clauses should've become
 312              redundant.  */
 313           gcc_checking_assert (i == i2);
 314           return;
 315         }
 316
 317       if (p->clause[i] < clause && insert_here < 0)
 318         insert_here = i2;
 319
 320       /* If clause implies p->clause[i], then p->clause[i] becomes redundant.
 321          Otherwise the p->clause[i] has to stay.  */
 322       if ((p->clause[i] & clause) != clause)
 323         i2++;
 324     }
 325
 326   /* Look for clauses that are obviously true.  I.e.
 327      op0 == 5 || op0 != 5.  */
 328   for (c1 = predicate_first_dynamic_condition; c1 < NUM_CONDITIONS; c1++)
 329     {
 330       condition *cc1;
 331       if (!(clause & (1 << c1)))
 332         continue;
 333       cc1 = &(*conditions)[c1 - predicate_first_dynamic_condition];
 334       /* We have no way to represent !CHANGED and !IS_NOT_CONSTANT
 335          and thus there is no point for looking for them.  */
 336       if (cc1->code == CHANGED || cc1->code == IS_NOT_CONSTANT)
 337         continue;
 338       for (c2 = c1 + 1; c2 < NUM_CONDITIONS; c2++)
 339         if (clause & (1 << c2))
 340           {
 341             condition *cc1 =
 342               &(*conditions)[c1 - predicate_first_dynamic_condition];
 343             condition *cc2 =
 344               &(*conditions)[c2 - predicate_first_dynamic_condition];
 345             if (cc1->operand_num == cc2->operand_num
 346                 && cc1->val == cc2->val
 347                 && cc2->code != IS_NOT_CONSTANT
 348                 && cc2->code != CHANGED
 349                 && cc1->code == invert_tree_comparison (cc2->code,
 350                                                         HONOR_NANS (cc1->val)))
 351               return;
 352           }
 353     }
 354
 355
 356   /* We run out of variants.  Be conservative in positive direction.  */
 357   if (i2 == MAX_CLAUSES)
 358     return;
 359   /* Keep clauses in decreasing order. This makes equivalence testing easy.  */
 360   p->clause[i2 + 1] = 0;
 361   if (insert_here >= 0)
 362     for (; i2 > insert_here; i2--)
 363       p->clause[i2] = p->clause[i2 - 1];
 364   else
 365     insert_here = i2;
 366   p->clause[insert_here] = clause;
 367 }
 368
 369
 370 /* Return P & P2.  */
 371
 372 static struct predicate
 373 and_predicates (conditions conditions,
 374                 struct predicate *p, struct predicate *p2)
 375 {
 376   struct predicate out = *p;
 377   int i;
 378
 379   /* Avoid busy work.  */
 380   if (false_predicate_p (p2) || true_predicate_p (p))
 381     return *p2;
 382   if (false_predicate_p (p) || true_predicate_p (p2))
 383     return *p;
 384
 385   /* See how far predicates match.  */
 386   for (i = 0; p->clause[i] && p->clause[i] == p2->clause[i]; i++)
 387     {
 388       gcc_checking_assert (i < MAX_CLAUSES);
 389     }
 390
 391   /* Combine the predicates rest.  */
 392   for (; p2->clause[i]; i++)
 393     {
 394       gcc_checking_assert (i < MAX_CLAUSES);
 395       add_clause (conditions, &out, p2->clause[i]);
 396     }
 397   return out;
 398 }
 399
 400
 401 /* Return true if predicates are obviously equal.  */
 402
 403 static inline bool
 404 predicates_equal_p (struct predicate *p, struct predicate *p2)
 405 {
 406   int i;
 407   for (i = 0; p->clause[i]; i++)
 408     {
 409       gcc_checking_assert (i < MAX_CLAUSES);
 410       gcc_checking_assert (p->clause[i] > p->clause[i + 1]);
 411       gcc_checking_assert (!p2->clause[i]
 412                            || p2->clause[i] > p2->clause[i + 1]);
 413       if (p->clause[i] != p2->clause[i])
 414         return false;
 415     }
 416   return !p2->clause[i];
 417 }
 418
 419
 420 /* Return P | P2.  */
 421
 422 static struct predicate
 423 or_predicates (conditions conditions,
 424                struct predicate *p, struct predicate *p2)
 425 {
 426   struct predicate out = true_predicate ();
 427   int i, j;
 428
 429   /* Avoid busy work.  */
 430   if (false_predicate_p (p2) || true_predicate_p (p))
 431     return *p;
 432   if (false_predicate_p (p) || true_predicate_p (p2))
 433     return *p2;
 434   if (predicates_equal_p (p, p2))
 435     return *p;
 436
 437   /* OK, combine the predicates.  */
 438   for (i = 0; p->clause[i]; i++)
 439     for (j = 0; p2->clause[j]; j++)
 440       {
 441         gcc_checking_assert (i < MAX_CLAUSES && j < MAX_CLAUSES);
 442         add_clause (conditions, &out, p->clause[i] | p2->clause[j]);
 443       }
 444   return out;
 445 }
 446
 447
 448 /* Having partial truth assignment in POSSIBLE_TRUTHS, return false
 449    if predicate P is known to be false.  */
 450
 451 static bool
 452 evaluate_predicate (struct predicate *p, clause_t possible_truths)
 453 {
 454   int i;
 455
 456   /* True remains true.  */
 457   if (true_predicate_p (p))
 458     return true;
 459
 460   gcc_assert (!(possible_truths & (1 << predicate_false_condition)));
 461
 462   /* See if we can find clause we can disprove.  */
 463   for (i = 0; p->clause[i]; i++)
 464     {
 465       gcc_checking_assert (i < MAX_CLAUSES);
 466       if (!(p->clause[i] & possible_truths))
 467         return false;
 468     }
 469   return true;
 470 }
 471
 472 /* Return the probability in range 0...REG_BR_PROB_BASE that the predicated
 473    instruction will be recomputed per invocation of the inlined call.  */
 474
 475 static int
 476 predicate_probability (conditions conds,
 477                        struct predicate *p, clause_t possible_truths,
 478                        vec<inline_param_summary> inline_param_summary)
 479 {
 480   int i;
 481   int combined_prob = REG_BR_PROB_BASE;
 482
 483   /* True remains true.  */
 484   if (true_predicate_p (p))
 485     return REG_BR_PROB_BASE;
 486
 487   if (false_predicate_p (p))
 488     return 0;
 489
 490   gcc_assert (!(possible_truths & (1 << predicate_false_condition)));
 491
 492   /* See if we can find clause we can disprove.  */
 493   for (i = 0; p->clause[i]; i++)
 494     {
 495       gcc_checking_assert (i < MAX_CLAUSES);
 496       if (!(p->clause[i] & possible_truths))
 497         return 0;
 498       else
 499         {
 500           int this_prob = 0;
 501           int i2;
 502           if (!inline_param_summary.exists ())
 503             return REG_BR_PROB_BASE;
 504           for (i2 = 0; i2 < NUM_CONDITIONS; i2++)
 505             if ((p->clause[i] & possible_truths) & (1 << i2))
 506               {
 507                 if (i2 >= predicate_first_dynamic_condition)
 508                   {
 509                     condition *c =
 510                       &(*conds)[i2 - predicate_first_dynamic_condition];
 511                     if (c->code == CHANGED
 512                         && (c->operand_num <
 513                             (int) inline_param_summary.length ()))
 514                       {
 515                         int iprob =
 516                           inline_param_summary[c->operand_num].change_prob;
 517                         this_prob = MAX (this_prob, iprob);
 518                       }
 519                     else
 520                       this_prob = REG_BR_PROB_BASE;
 521                   }
 522                 else
 523                   this_prob = REG_BR_PROB_BASE;
 524               }
 525           combined_prob = MIN (this_prob, combined_prob);
 526           if (!combined_prob)
 527             return 0;
 528         }
 529     }
 530   return combined_prob;
 531 }
 532
 533
 534 /* Dump conditional COND.  */
 535
 536 static void
 537 dump_condition (FILE *f, conditions conditions, int cond)
 538 {
 539   condition *c;
 540   if (cond == predicate_false_condition)
 541     fprintf (f, "false");
 542   else if (cond == predicate_not_inlined_condition)
 543     fprintf (f, "not inlined");
 544   else
 545     {
 546       c = &(*conditions)[cond - predicate_first_dynamic_condition];
 547       fprintf (f, "op%i", c->operand_num);
 548       if (c->agg_contents)
 549         fprintf (f, "[%soffset: " HOST_WIDE_INT_PRINT_DEC "]",
 550                  c->by_ref ? "ref " : "", c->offset);
 551       if (c->code == IS_NOT_CONSTANT)
 552         {
 553           fprintf (f, " not constant");
 554           return;
 555         }
 556       if (c->code == CHANGED)
 557         {
 558           fprintf (f, " changed");
 559           return;
 560         }
 561       fprintf (f, " %s ", op_symbol_code (c->code));
 562       print_generic_expr (f, c->val, 1);
 563     }
 564 }
 565
 566
 567 /* Dump clause CLAUSE.  */
 568
 569 static void
 570 dump_clause (FILE *f, conditions conds, clause_t clause)
 571 {
 572   int i;
 573   bool found = false;
 574   fprintf (f, "(");
 575   if (!clause)
 576     fprintf (f, "true");
 577   for (i = 0; i < NUM_CONDITIONS; i++)
 578     if (clause & (1 << i))
 579       {
 580         if (found)
 581           fprintf (f, " || ");
 582         found = true;
 583         dump_condition (f, conds, i);
 584       }
 585   fprintf (f, ")");
 586 }
 587
 588
 589 /* Dump predicate PREDICATE.  */
 590
 591 static void
 592 dump_predicate (FILE *f, conditions conds, struct predicate *pred)
 593 {
 594   int i;
 595   if (true_predicate_p (pred))
 596     dump_clause (f, conds, 0);
 597   else
 598     for (i = 0; pred->clause[i]; i++)
 599       {
 600         if (i)
 601           fprintf (f, " && ");
 602         dump_clause (f, conds, pred->clause[i]);
 603       }
 604   fprintf (f, "\n");
 605 }
 606
 607
 608 /* Dump inline hints.  */
 609 void
 610 dump_inline_hints (FILE *f, inline_hints hints)
 611 {
 612   if (!hints)
 613     return;
 614   fprintf (f, "inline hints:");
 615   if (hints & INLINE_HINT_indirect_call)
 616     {
 617       hints &= ~INLINE_HINT_indirect_call;
 618       fprintf (f, " indirect_call");
 619     }
 620   if (hints & INLINE_HINT_loop_iterations)
 621     {
 622       hints &= ~INLINE_HINT_loop_iterations;
 623       fprintf (f, " loop_iterations");
 624     }
 625   if (hints & INLINE_HINT_loop_stride)
 626     {
 627       hints &= ~INLINE_HINT_loop_stride;
 628       fprintf (f, " loop_stride");
 629     }
 630   if (hints & INLINE_HINT_same_scc)
 631     {
 632       hints &= ~INLINE_HINT_same_scc;
 633       fprintf (f, " same_scc");
 634     }
 635   if (hints & INLINE_HINT_in_scc)
 636     {
 637       hints &= ~INLINE_HINT_in_scc;
 638       fprintf (f, " in_scc");
 639     }
 640   if (hints & INLINE_HINT_cross_module)
 641     {
 642       hints &= ~INLINE_HINT_cross_module;
 643       fprintf (f, " cross_module");
 644     }
 645   if (hints & INLINE_HINT_declared_inline)
 646     {
 647       hints &= ~INLINE_HINT_declared_inline;
 648       fprintf (f, " declared_inline");
 649     }
 650   if (hints & INLINE_HINT_array_index)
 651     {
 652       hints &= ~INLINE_HINT_array_index;
 653       fprintf (f, " array_index");
 654     }
 655   if (hints & INLINE_HINT_known_hot)
 656     {
 657       hints &= ~INLINE_HINT_known_hot;
 658       fprintf (f, " known_hot");
 659     }
 660   gcc_assert (!hints);
 661 }
 662
 663
 664 /* Record SIZE and TIME under condition PRED into the inline summary.  */
 665
 666 static void
 667 account_size_time (struct inline_summary *summary, int size, int time,
 668                    struct predicate *pred)
 669 {
 670   size_time_entry *e;
 671   bool found = false;
 672   int i;
 673
 674   if (false_predicate_p (pred))
 675     return;
 676
 677   /* We need to create initial empty unconitional clause, but otherwie
 678      we don't need to account empty times and sizes.  */
 679   if (!size && !time && summary->entry)
 680     return;
 681
 682   /* Watch overflow that might result from insane profiles.  */
 683   if (time > MAX_TIME * INLINE_TIME_SCALE)
 684     time = MAX_TIME * INLINE_TIME_SCALE;
 685   gcc_assert (time >= 0);
 686
 687   for (i = 0; vec_safe_iterate (summary->entry, i, &e); i++)
 688     if (predicates_equal_p (&e->predicate, pred))
 689       {
 690         found = true;
 691         break;
 692       }
 693   if (i == 256)
 694     {
 695       i = 0;
 696       found = true;
 697       e = &(*summary->entry)[0];
 698       gcc_assert (!e->predicate.clause[0]);
 699       if (dump_file && (dump_flags & TDF_DETAILS))
 700         fprintf (dump_file,
 701                  "\t\tReached limit on number of entries, "
 702                  "ignoring the predicate.");
 703     }
 704   if (dump_file && (dump_flags & TDF_DETAILS) && (time || size))
 705     {
 706       fprintf (dump_file,
 707                "\t\tAccounting size:%3.2f, time:%3.2f on %spredicate:",
 708                ((double) size) / INLINE_SIZE_SCALE,
 709                ((double) time) / INLINE_TIME_SCALE, found ? "" : "new ");
 710       dump_predicate (dump_file, summary->conds, pred);
 711     }
 712   if (!found)
 713     {
 714       struct size_time_entry new_entry;
 715       new_entry.size = size;
 716       new_entry.time = time;
 717       new_entry.predicate = *pred;
 718       vec_safe_push (summary->entry, new_entry);
 719     }
 720   else
 721     {
 722       e->size += size;
 723       e->time += time;
 724       if (e->time > MAX_TIME * INLINE_TIME_SCALE)
 725         e->time = MAX_TIME * INLINE_TIME_SCALE;
 726     }
 727 }
 728
 729 /* We proved E to be unreachable, redirect it to __bultin_unreachable.  */
 730
 731 static struct cgraph_edge *
 732 redirect_to_unreachable (struct cgraph_edge *e)
 733 {
 734   struct cgraph_node *callee = !e->inline_failed ? e->callee : NULL;
 735   struct cgraph_node *target = cgraph_node::get_create
 736                       (builtin_decl_implicit (BUILT_IN_UNREACHABLE));
 737
 738   if (e->speculative)
 739     e = e->resolve_speculation (target->decl);
 740   else if (!e->callee)
 741     e->make_direct (target);
 742   else
 743     e->redirect_callee (target);
 744   struct inline_edge_summary *es = inline_edge_summary (e);
 745   e->inline_failed = CIF_UNREACHABLE;
 746   e->frequency = 0;
 747   e->count = 0;
 748   es->call_stmt_size = 0;
 749   es->call_stmt_time = 0;
 750   if (callee)
 751     callee->remove_symbol_and_inline_clones ();
 752   return e;
 753 }
 754
 755 /* Set predicate for edge E.  */
 756
 757 static void
 758 edge_set_predicate (struct cgraph_edge *e, struct predicate *predicate)
 759 {
 760   /* If the edge is determined to be never executed, redirect it
 761      to BUILTIN_UNREACHABLE to save inliner from inlining into it.  */
 762   if (predicate && false_predicate_p (predicate)
 763       /* When handling speculative edges, we need to do the redirection
 764          just once.  Do it always on the direct edge, so we do not
 765          attempt to resolve speculation while duplicating the edge.  */
 766       && (!e->speculative || e->callee))
 767     e = redirect_to_unreachable (e);
 768
 769   struct inline_edge_summary *es = inline_edge_summary (e);
 770   if (predicate && !true_predicate_p (predicate))
 771     {
 772       if (!es->predicate)
 773         es->predicate = edge_predicate_pool.allocate ();
 774       *es->predicate = *predicate;
 775     }
 776   else
 777     {
 778       if (es->predicate)
 779         edge_predicate_pool.remove (es->predicate);
 780       es->predicate = NULL;
 781     }
 782 }
 783
 784 /* Set predicate for hint *P.  */
 785
 786 static void
 787 set_hint_predicate (struct predicate **p, struct predicate new_predicate)
 788 {
 789   if (false_predicate_p (&new_predicate) || true_predicate_p (&new_predicate))
 790     {
 791       if (*p)
 792         edge_predicate_pool.remove (*p);
 793       *p = NULL;
 794     }
 795   else
 796     {
 797       if (!*p)
 798         *p = edge_predicate_pool.allocate ();
 799       **p = new_predicate;
 800     }
 801 }
 802
 803
 804 /* KNOWN_VALS is partial mapping of parameters of NODE to constant values.
 805    KNOWN_AGGS is a vector of aggreggate jump functions for each parameter.
 806    Return clause of possible truths. When INLINE_P is true, assume that we are
 807    inlining.
 808
 809    ERROR_MARK means compile time invariant.  */
 810
 811 static clause_t
 812 evaluate_conditions_for_known_args (struct cgraph_node *node,
 813                                     bool inline_p,
 814                                     vec<tree> known_vals,
 815                                     vec<ipa_agg_jump_function_p>
 816                                     known_aggs)
 817 {
 818   clause_t clause = inline_p ? 0 : 1 << predicate_not_inlined_condition;
 819   struct inline_summary *info = inline_summaries->get (node);
 820   int i;
 821   struct condition *c;
 822
 823   for (i = 0; vec_safe_iterate (info->conds, i, &c); i++)
 824     {
 825       tree val;
 826       tree res;
 827
 828       /* We allow call stmt to have fewer arguments than the callee function
 829          (especially for K&R style programs).  So bound check here (we assume
 830          known_aggs vector, if non-NULL, has the same length as
 831          known_vals).  */
 832       gcc_checking_assert (!known_aggs.exists ()
 833                            || (known_vals.length () == known_aggs.length ()));
 834       if (c->operand_num >= (int) known_vals.length ())
 835         {
 836           clause |= 1 << (i + predicate_first_dynamic_condition);
 837           continue;
 838         }
 839
 840       if (c->agg_contents)
 841         {
 842           struct ipa_agg_jump_function *agg;
 843
 844           if (c->code == CHANGED
 845               && !c->by_ref
 846               && (known_vals[c->operand_num] == error_mark_node))
 847             continue;
 848
 849           if (known_aggs.exists ())
 850             {
 851               agg = known_aggs[c->operand_num];
 852               val = ipa_find_agg_cst_for_param (agg, c->offset, c->by_ref);
 853             }
 854           else
 855             val = NULL_TREE;
 856         }
 857       else
 858         {
 859           val = known_vals[c->operand_num];
 860           if (val == error_mark_node && c->code != CHANGED)
 861             val = NULL_TREE;
 862         }
 863
 864       if (!val)
 865         {
 866           clause |= 1 << (i + predicate_first_dynamic_condition);
 867           continue;
 868         }
 869       if (c->code == IS_NOT_CONSTANT || c->code == CHANGED)
 870         continue;
 871
 872       if (operand_equal_p (TYPE_SIZE (TREE_TYPE (c->val)),
 873                            TYPE_SIZE (TREE_TYPE (val)), 0))
 874         {
 875           val = fold_unary (VIEW_CONVERT_EXPR, TREE_TYPE (c->val), val);
 876
 877           res = val
 878             ? fold_binary_to_constant (c->code, boolean_type_node, val, c->val)
 879             : NULL;
 880
 881           if (res && integer_zerop (res))
 882             continue;
 883         }
 884       clause |= 1 << (i + predicate_first_dynamic_condition);
 885     }
 886   return clause;
 887 }
 888
 889
 890 /* Work out what conditions might be true at invocation of E.  */
 891
 892 static void
 893 evaluate_properties_for_edge (struct cgraph_edge *e, bool inline_p,
 894                               clause_t *clause_ptr,
 895                               vec<tree> *known_vals_ptr,
 896                               vec<ipa_polymorphic_call_context>
 897                               *known_contexts_ptr,
 898                               vec<ipa_agg_jump_function_p> *known_aggs_ptr)
 899 {
 900   struct cgraph_node *callee = e->callee->ultimate_alias_target ();
 901   struct inline_summary *info = inline_summaries->get (callee);
 902   vec<tree> known_vals = vNULL;
 903   vec<ipa_agg_jump_function_p> known_aggs = vNULL;
 904
 905   if (clause_ptr)
 906     *clause_ptr = inline_p ? 0 : 1 << predicate_not_inlined_condition;
 907   if (known_vals_ptr)
 908     known_vals_ptr->create (0);
 909   if (known_contexts_ptr)
 910     known_contexts_ptr->create (0);
 911
 912   if (ipa_node_params_sum
 913       && !e->call_stmt_cannot_inline_p
 914       && ((clause_ptr && info->conds) || known_vals_ptr || known_contexts_ptr))
 915     {
 916       struct ipa_node_params *parms_info;
 917       struct ipa_edge_args *args = IPA_EDGE_REF (e);
 918       struct inline_edge_summary *es = inline_edge_summary (e);
 919       int i, count = ipa_get_cs_argument_count (args);
 920
 921       if (e->caller->global.inlined_to)
 922         parms_info = IPA_NODE_REF (e->caller->global.inlined_to);
 923       else
 924         parms_info = IPA_NODE_REF (e->caller);
 925
 926       if (count && (info->conds || known_vals_ptr))
 927         known_vals.safe_grow_cleared (count);
 928       if (count && (info->conds || known_aggs_ptr))
 929         known_aggs.safe_grow_cleared (count);
 930       if (count && known_contexts_ptr)
 931         known_contexts_ptr->safe_grow_cleared (count);
 932
 933       for (i = 0; i < count; i++)
 934         {
 935           struct ipa_jump_func *jf = ipa_get_ith_jump_func (args, i);
 936           tree cst = ipa_value_from_jfunc (parms_info, jf);
 937
 938           if (!cst && e->call_stmt
 939               && i < (int)gimple_call_num_args (e->call_stmt))
 940             {
 941               cst = gimple_call_arg (e->call_stmt, i);
 942               if (!is_gimple_min_invariant (cst))
 943                 cst = NULL;
 944             }
 945           if (cst)
 946             {
 947               gcc_checking_assert (TREE_CODE (cst) != TREE_BINFO);
 948               if (known_vals.exists ())
 949                 known_vals[i] = cst;
 950             }
 951           else if (inline_p && !es->param[i].change_prob)
 952             known_vals[i] = error_mark_node;
 953
 954           if (known_contexts_ptr)
 955             (*known_contexts_ptr)[i] = ipa_context_from_jfunc (parms_info, e,
 956                                                                i, jf);
 957           /* TODO: When IPA-CP starts propagating and merging aggregate jump
 958              functions, use its knowledge of the caller too, just like the
 959              scalar case above.  */
 960           known_aggs[i] = &jf->agg;
 961         }
 962     }
 963   else if (e->call_stmt && !e->call_stmt_cannot_inline_p
 964            && ((clause_ptr && info->conds) || known_vals_ptr))
 965     {
 966       int i, count = (int)gimple_call_num_args (e->call_stmt);
 967
 968       if (count && (info->conds || known_vals_ptr))
 969         known_vals.safe_grow_cleared (count);
 970       for (i = 0; i < count; i++)
 971         {
 972           tree cst = gimple_call_arg (e->call_stmt, i);
 973           if (!is_gimple_min_invariant (cst))
 974             cst = NULL;
 975           if (cst)
 976             known_vals[i] = cst;
 977         }
 978     }
 979
 980   if (clause_ptr)
 981     *clause_ptr = evaluate_conditions_for_known_args (callee, inline_p,
 982                                                       known_vals, known_aggs);
 983
 984   if (known_vals_ptr)
 985     *known_vals_ptr = known_vals;
 986   else
 987     known_vals.release ();
 988
 989   if (known_aggs_ptr)
 990     *known_aggs_ptr = known_aggs;
 991   else
 992     known_aggs.release ();
 993 }
 994
 995
 996 /* Allocate the inline summary vector or resize it to cover all cgraph nodes. */
 997
 998 static void
 999 inline_summary_alloc (void)
1000 {
1001   if (!edge_removal_hook_holder)
1002     edge_removal_hook_holder =
1003       symtab->add_edge_removal_hook (&inline_edge_removal_hook, NULL);
1004   if (!edge_duplication_hook_holder)
1005     edge_duplication_hook_holder =
1006       symtab->add_edge_duplication_hook (&inline_edge_duplication_hook, NULL);
1007
1008   if (!inline_summaries)
1009     inline_summaries = (inline_summary_t*) inline_summary_t::create_ggc (symtab);
1010
1011   if (inline_edge_summary_vec.length () <= (unsigned) symtab->edges_max_uid)
1012     inline_edge_summary_vec.safe_grow_cleared (symtab->edges_max_uid + 1);
1013 }
1014
1015 /* We are called multiple time for given function; clear
1016    data from previous run so they are not cumulated.  */
1017
1018 static void
1019 reset_inline_edge_summary (struct cgraph_edge *e)
1020 {
1021   if (e->uid < (int) inline_edge_summary_vec.length ())
1022     {
1023       struct inline_edge_summary *es = inline_edge_summary (e);
1024
1025       es->call_stmt_size = es->call_stmt_time = 0;
1026       if (es->predicate)
1027         edge_predicate_pool.remove (es->predicate);
1028       es->predicate = NULL;
1029       es->param.release ();
1030     }
1031 }
1032
1033 /* We are called multiple time for given function; clear
1034    data from previous run so they are not cumulated.  */
1035
1036 static void
1037 reset_inline_summary (struct cgraph_node *node,
1038                       inline_summary *info)
1039 {
1040   struct cgraph_edge *e;
1041
1042   info->self_size = info->self_time = 0;
1043   info->estimated_stack_size = 0;
1044   info->estimated_self_stack_size = 0;
1045   info->stack_frame_offset = 0;
1046   info->size = 0;
1047   info->time = 0;
1048   info->growth = 0;
1049   info->scc_no = 0;
1050   if (info->loop_iterations)
1051     {
1052       edge_predicate_pool.remove (info->loop_iterations);
1053       info->loop_iterations = NULL;
1054     }
1055   if (info->loop_stride)
1056     {
1057       edge_predicate_pool.remove (info->loop_stride);
1058       info->loop_stride = NULL;
1059     }
1060   if (info->array_index)
1061     {
1062       edge_predicate_pool.remove (info->array_index);
1063       info->array_index = NULL;
1064     }
1065   vec_free (info->conds);
1066   vec_free (info->entry);
1067   for (e = node->callees; e; e = e->next_callee)
1068     reset_inline_edge_summary (e);
1069   for (e = node->indirect_calls; e; e = e->next_callee)
1070     reset_inline_edge_summary (e);
1071 }
1072
1073 /* Hook that is called by cgraph.c when a node is removed.  */
1074
1075 void
1076 inline_summary_t::remove (cgraph_node *node, inline_summary *info)
1077 {
1078   reset_inline_summary (node, info);
1079 }
1080
1081 /* Remap predicate P of former function to be predicate of duplicated function.
1082    POSSIBLE_TRUTHS is clause of possible truths in the duplicated node,
1083    INFO is inline summary of the duplicated node.  */
1084
1085 static struct predicate
1086 remap_predicate_after_duplication (struct predicate *p,
1087                                    clause_t possible_truths,
1088                                    struct inline_summary *info)
1089 {
1090   struct predicate new_predicate = true_predicate ();
1091   int j;
1092   for (j = 0; p->clause[j]; j++)
1093     if (!(possible_truths & p->clause[j]))
1094       {
1095         new_predicate = false_predicate ();
1096         break;
1097       }
1098     else
1099       add_clause (info->conds, &new_predicate,
1100                   possible_truths & p->clause[j]);
1101   return new_predicate;
1102 }
1103
1104 /* Same as remap_predicate_after_duplication but handle hint predicate *P.
1105    Additionally care about allocating new memory slot for updated predicate
1106    and set it to NULL when it becomes true or false (and thus uninteresting).
1107  */
1108
1109 static void
1110 remap_hint_predicate_after_duplication (struct predicate **p,
1111                                         clause_t possible_truths,
1112                                         struct inline_summary *info)
1113 {
1114   struct predicate new_predicate;
1115
1116   if (!*p)
1117     return;
1118
1119   new_predicate = remap_predicate_after_duplication (*p,
1120                                                      possible_truths, info);
1121   /* We do not want to free previous predicate; it is used by node origin.  */
1122   *p = NULL;
1123   set_hint_predicate (p, new_predicate);
1124 }
1125
1126
1127 /* Hook that is called by cgraph.c when a node is duplicated.  */
1128 void
1129 inline_summary_t::duplicate (cgraph_node *src,
1130                              cgraph_node *dst,
1131                              inline_summary *,
1132                              inline_summary *info)
1133 {
1134   inline_summary_alloc ();
1135   memcpy (info, inline_summaries->get (src), sizeof (inline_summary));
1136   /* TODO: as an optimization, we may avoid copying conditions
1137      that are known to be false or true.  */
1138   info->conds = vec_safe_copy (info->conds);
1139
1140   /* When there are any replacements in the function body, see if we can figure
1141      out that something was optimized out.  */
1142   if (ipa_node_params_sum && dst->clone.tree_map)
1143     {
1144       vec<size_time_entry, va_gc> *entry = info->entry;
1145       /* Use SRC parm info since it may not be copied yet.  */
1146       struct ipa_node_params *parms_info = IPA_NODE_REF (src);
1147       vec<tree> known_vals = vNULL;
1148       int count = ipa_get_param_count (parms_info);
1149       int i, j;
1150       clause_t possible_truths;
1151       struct predicate true_pred = true_predicate ();
1152       size_time_entry *e;
1153       int optimized_out_size = 0;
1154       bool inlined_to_p = false;
1155       struct cgraph_edge *edge, *next;
1156
1157       info->entry = 0;
1158       known_vals.safe_grow_cleared (count);
1159       for (i = 0; i < count; i++)
1160         {
1161           struct ipa_replace_map *r;
1162
1163           for (j = 0; vec_safe_iterate (dst->clone.tree_map, j, &r); j++)
1164             {
1165               if (((!r->old_tree && r->parm_num == i)
1166                    || (r->old_tree && r->old_tree == ipa_get_param (parms_info, i)))
1167                    && r->replace_p && !r->ref_p)
1168                 {
1169                   known_vals[i] = r->new_tree;
1170                   break;
1171                 }
1172             }
1173         }
1174       possible_truths = evaluate_conditions_for_known_args (dst, false,
1175                                                             known_vals,
1176                                                             vNULL);
1177       known_vals.release ();
1178
1179       account_size_time (info, 0, 0, &true_pred);
1180
1181       /* Remap size_time vectors.
1182          Simplify the predicate by prunning out alternatives that are known
1183          to be false.
1184          TODO: as on optimization, we can also eliminate conditions known
1185          to be true.  */
1186       for (i = 0; vec_safe_iterate (entry, i, &e); i++)
1187         {
1188           struct predicate new_predicate;
1189           new_predicate = remap_predicate_after_duplication (&e->predicate,
1190                                                              possible_truths,
1191                                                              info);
1192           if (false_predicate_p (&new_predicate))
1193             optimized_out_size += e->size;
1194           else
1195             account_size_time (info, e->size, e->time, &new_predicate);
1196         }
1197
1198       /* Remap edge predicates with the same simplification as above.
1199          Also copy constantness arrays.   */
1200       for (edge = dst->callees; edge; edge = next)
1201         {
1202           struct predicate new_predicate;
1203           struct inline_edge_summary *es = inline_edge_summary (edge);
1204           next = edge->next_callee;
1205
1206           if (!edge->inline_failed)
1207             inlined_to_p = true;
1208           if (!es->predicate)
1209             continue;
1210           new_predicate = remap_predicate_after_duplication (es->predicate,
1211                                                              possible_truths,
1212                                                              info);
1213           if (false_predicate_p (&new_predicate)
1214               && !false_predicate_p (es->predicate))
1215             optimized_out_size += es->call_stmt_size * INLINE_SIZE_SCALE;
1216           edge_set_predicate (edge, &new_predicate);
1217         }
1218
1219       /* Remap indirect edge predicates with the same simplificaiton as above.
1220          Also copy constantness arrays.   */
1221       for (edge = dst->indirect_calls; edge; edge = next)
1222         {
1223           struct predicate new_predicate;
1224           struct inline_edge_summary *es = inline_edge_summary (edge);
1225           next = edge->next_callee;
1226
1227           gcc_checking_assert (edge->inline_failed);
1228           if (!es->predicate)
1229             continue;
1230           new_predicate = remap_predicate_after_duplication (es->predicate,
1231                                                              possible_truths,
1232                                                              info);
1233           if (false_predicate_p (&new_predicate)
1234               && !false_predicate_p (es->predicate))
1235             optimized_out_size += es->call_stmt_size * INLINE_SIZE_SCALE;
1236           edge_set_predicate (edge, &new_predicate);
1237         }
1238       remap_hint_predicate_after_duplication (&info->loop_iterations,
1239                                               possible_truths, info);
1240       remap_hint_predicate_after_duplication (&info->loop_stride,
1241                                               possible_truths, info);
1242       remap_hint_predicate_after_duplication (&info->array_index,
1243                                               possible_truths, info);
1244
1245       /* If inliner or someone after inliner will ever start producing
1246          non-trivial clones, we will get trouble with lack of information
1247          about updating self sizes, because size vectors already contains
1248          sizes of the calees.  */
1249       gcc_assert (!inlined_to_p || !optimized_out_size);
1250     }
1251   else
1252     {
1253       info->entry = vec_safe_copy (info->entry);
1254       if (info->loop_iterations)
1255         {
1256           predicate p = *info->loop_iterations;
1257           info->loop_iterations = NULL;
1258           set_hint_predicate (&info->loop_iterations, p);
1259         }
1260       if (info->loop_stride)
1261         {
1262           predicate p = *info->loop_stride;
1263           info->loop_stride = NULL;
1264           set_hint_predicate (&info->loop_stride, p);
1265         }
1266       if (info->array_index)
1267         {
1268           predicate p = *info->array_index;
1269           info->array_index = NULL;
1270           set_hint_predicate (&info->array_index, p);
1271         }
1272     }
1273   if (!dst->global.inlined_to)
1274     inline_update_overall_summary (dst);
1275 }
1276
1277
1278 /* Hook that is called by cgraph.c when a node is duplicated.  */
1279
1280 static void
1281 inline_edge_duplication_hook (struct cgraph_edge *src,
1282                               struct cgraph_edge *dst,
1283                               ATTRIBUTE_UNUSED void *data)
1284 {
1285   struct inline_edge_summary *info;
1286   struct inline_edge_summary *srcinfo;
1287   inline_summary_alloc ();
1288   info = inline_edge_summary (dst);
1289   srcinfo = inline_edge_summary (src);
1290   memcpy (info, srcinfo, sizeof (struct inline_edge_summary));
1291   info->predicate = NULL;
1292   edge_set_predicate (dst, srcinfo->predicate);
1293   info->param = srcinfo->param.copy ();
1294   if (!dst->indirect_unknown_callee && src->indirect_unknown_callee)
1295     {
1296       info->call_stmt_size -= (eni_size_weights.indirect_call_cost
1297                                - eni_size_weights.call_cost);
1298       info->call_stmt_time -= (eni_time_weights.indirect_call_cost
1299                                - eni_time_weights.call_cost);
1300     }
1301 }
1302
1303
1304 /* Keep edge cache consistent across edge removal.  */
1305
1306 static void
1307 inline_edge_removal_hook (struct cgraph_edge *edge,
1308                           void *data ATTRIBUTE_UNUSED)
1309 {
1310   if (edge_growth_cache.exists ())
1311     reset_edge_growth_cache (edge);
1312   reset_inline_edge_summary (edge);
1313 }
1314
1315
1316 /* Initialize growth caches.  */
1317
1318 void
1319 initialize_growth_caches (void)
1320 {
1321   if (symtab->edges_max_uid)
1322     edge_growth_cache.safe_grow_cleared (symtab->edges_max_uid);
1323 }
1324
1325
1326 /* Free growth caches.  */
1327
1328 void
1329 free_growth_caches (void)
1330 {
1331   edge_growth_cache.release ();
1332 }
1333
1334
1335 /* Dump edge summaries associated to NODE and recursively to all clones.
1336    Indent by INDENT.  */
1337
1338 static void
1339 dump_inline_edge_summary (FILE *f, int indent, struct cgraph_node *node,
1340                           struct inline_summary *info)
1341 {
1342   struct cgraph_edge *edge;
1343   for (edge = node->callees; edge; edge = edge->next_callee)
1344     {
1345       struct inline_edge_summary *es = inline_edge_summary (edge);
1346       struct cgraph_node *callee = edge->callee->ultimate_alias_target ();
1347       int i;
1348
1349       fprintf (f,
1350                "%*s%s/%i %s\n%*s  loop depth:%2i freq:%4i size:%2i"
1351                " time: %2i callee size:%2i stack:%2i",
1352                indent, "", callee->name (), callee->order,
1353                !edge->inline_failed
1354                ? "inlined" : cgraph_inline_failed_string (edge-> inline_failed),
1355                indent, "", es->loop_depth, edge->frequency,
1356                es->call_stmt_size, es->call_stmt_time,
1357                (int) inline_summaries->get (callee)->size / INLINE_SIZE_SCALE,
1358                (int) inline_summaries->get (callee)->estimated_stack_size);
1359
1360       if (es->predicate)
1361         {
1362           fprintf (f, " predicate: ");
1363           dump_predicate (f, info->conds, es->predicate);
1364         }
1365       else
1366         fprintf (f, "\n");
1367       if (es->param.exists ())
1368         for (i = 0; i < (int) es->param.length (); i++)
1369           {
1370             int prob = es->param[i].change_prob;
1371
1372             if (!prob)
1373               fprintf (f, "%*s op%i is compile time invariant\n",
1374                        indent + 2, "", i);
1375             else if (prob != REG_BR_PROB_BASE)
1376               fprintf (f, "%*s op%i change %f%% of time\n", indent + 2, "", i,
1377                        prob * 100.0 / REG_BR_PROB_BASE);
1378           }
1379       if (!edge->inline_failed)
1380         {
1381           fprintf (f, "%*sStack frame offset %i, callee self size %i,"
1382                    " callee size %i\n",
1383                    indent + 2, "",
1384                    (int) inline_summaries->get (callee)->stack_frame_offset,
1385                    (int) inline_summaries->get (callee)->estimated_self_stack_size,
1386                    (int) inline_summaries->get (callee)->estimated_stack_size);
1387           dump_inline_edge_summary (f, indent + 2, callee, info);
1388         }
1389     }
1390   for (edge = node->indirect_calls; edge; edge = edge->next_callee)
1391     {
1392       struct inline_edge_summary *es = inline_edge_summary (edge);
1393       fprintf (f, "%*sindirect call loop depth:%2i freq:%4i size:%2i"
1394                " time: %2i",
1395                indent, "",
1396                es->loop_depth,
1397                edge->frequency, es->call_stmt_size, es->call_stmt_time);
1398       if (es->predicate)
1399         {
1400           fprintf (f, "predicate: ");
1401           dump_predicate (f, info->conds, es->predicate);
1402         }
1403       else
1404         fprintf (f, "\n");
1405     }
1406 }
1407
1408
1409 void
1410 dump_inline_summary (FILE *f, struct cgraph_node *node)
1411 {
1412   if (node->definition)
1413     {
1414       struct inline_summary *s = inline_summaries->get (node);
1415       size_time_entry *e;
1416       int i;
1417       fprintf (f, "Inline summary for %s/%i", node->name (),
1418                node->order);
1419       if (DECL_DISREGARD_INLINE_LIMITS (node->decl))
1420         fprintf (f, " always_inline");
1421       if (s->inlinable)
1422         fprintf (f, " inlinable");
1423       if (s->contains_cilk_spawn)
1424         fprintf (f, " contains_cilk_spawn");
1425       fprintf (f, "\n  self time:       %i\n", s->self_time);
1426       fprintf (f, "  global time:     %i\n", s->time);
1427       fprintf (f, "  self size:       %i\n", s->self_size);
1428       fprintf (f, "  global size:     %i\n", s->size);
1429       fprintf (f, "  min size:       %i\n", s->min_size);
1430       fprintf (f, "  self stack:      %i\n",
1431                (int) s->estimated_self_stack_size);
1432       fprintf (f, "  global stack:    %i\n", (int) s->estimated_stack_size);
1433       if (s->growth)
1434         fprintf (f, "  estimated growth:%i\n", (int) s->growth);
1435       if (s->scc_no)
1436         fprintf (f, "  In SCC:          %i\n", (int) s->scc_no);
1437       for (i = 0; vec_safe_iterate (s->entry, i, &e); i++)
1438         {
1439           fprintf (f, "    size:%f, time:%f, predicate:",
1440                    (double) e->size / INLINE_SIZE_SCALE,
1441                    (double) e->time / INLINE_TIME_SCALE);
1442           dump_predicate (f, s->conds, &e->predicate);
1443         }
1444       if (s->loop_iterations)
1445         {
1446           fprintf (f, "  loop iterations:");
1447           dump_predicate (f, s->conds, s->loop_iterations);
1448         }
1449       if (s->loop_stride)
1450         {
1451           fprintf (f, "  loop stride:");
1452           dump_predicate (f, s->conds, s->loop_stride);
1453         }
1454       if (s->array_index)
1455         {
1456           fprintf (f, "  array index:");
1457           dump_predicate (f, s->conds, s->array_index);
1458         }
1459       fprintf (f, "  calls:\n");
1460       dump_inline_edge_summary (f, 4, node, s);
1461       fprintf (f, "\n");
1462     }
1463 }
1464
1465 DEBUG_FUNCTION void
1466 debug_inline_summary (struct cgraph_node *node)
1467 {
1468   dump_inline_summary (stderr, node);
1469 }
1470
1471 void
1472 dump_inline_summaries (FILE *f)
1473 {
1474   struct cgraph_node *node;
1475
1476   FOR_EACH_DEFINED_FUNCTION (node)
1477     if (!node->global.inlined_to)
1478       dump_inline_summary (f, node);
1479 }
1480
1481 /* Give initial reasons why inlining would fail on EDGE.  This gets either
1482    nullified or usually overwritten by more precise reasons later.  */
1483
1484 void
1485 initialize_inline_failed (struct cgraph_edge *e)
1486 {
1487   struct cgraph_node *callee = e->callee;
1488
1489   if (e->indirect_unknown_callee)
1490     e->inline_failed = CIF_INDIRECT_UNKNOWN_CALL;
1491   else if (!callee->definition)
1492     e->inline_failed = CIF_BODY_NOT_AVAILABLE;
1493   else if (callee->local.redefined_extern_inline)
1494     e->inline_failed = CIF_REDEFINED_EXTERN_INLINE;
1495   else if (e->call_stmt_cannot_inline_p)
1496     e->inline_failed = CIF_MISMATCHED_ARGUMENTS;
1497   else if (cfun && fn_contains_cilk_spawn_p (cfun))
1498     /* We can't inline if the function is spawing a function.  */
1499     e->inline_failed = CIF_FUNCTION_NOT_INLINABLE;
1500   else
1501     e->inline_failed = CIF_FUNCTION_NOT_CONSIDERED;
1502 }
1503
1504 /* Callback of walk_aliased_vdefs.  Flags that it has been invoked to the
1505    boolean variable pointed to by DATA.  */
1506
1507 static bool
1508 mark_modified (ao_ref *ao ATTRIBUTE_UNUSED, tree vdef ATTRIBUTE_UNUSED,
1509                void *data)
1510 {
1511   bool *b = (bool *) data;
1512   *b = true;
1513   return true;
1514 }
1515
1516 /* If OP refers to value of function parameter, return the corresponding
1517    parameter.  */
1518
1519 static tree
1520 unmodified_parm_1 (gimple *stmt, tree op)
1521 {
1522   /* SSA_NAME referring to parm default def?  */
1523   if (TREE_CODE (op) == SSA_NAME
1524       && SSA_NAME_IS_DEFAULT_DEF (op)
1525       && TREE_CODE (SSA_NAME_VAR (op)) == PARM_DECL)
1526     return SSA_NAME_VAR (op);
1527   /* Non-SSA parm reference?  */
1528   if (TREE_CODE (op) == PARM_DECL)
1529     {
1530       bool modified = false;
1531
1532       ao_ref refd;
1533       ao_ref_init (&refd, op);
1534       walk_aliased_vdefs (&refd, gimple_vuse (stmt), mark_modified, &modified,
1535                           NULL);
1536       if (!modified)
1537         return op;
1538     }
1539   return NULL_TREE;
1540 }
1541
1542 /* If OP refers to value of function parameter, return the corresponding
1543    parameter.  Also traverse chains of SSA register assignments.  */
1544
1545 static tree
1546 unmodified_parm (gimple *stmt, tree op)
1547 {
1548   tree res = unmodified_parm_1 (stmt, op);
1549   if (res)
1550     return res;
1551
1552   if (TREE_CODE (op) == SSA_NAME
1553       && !SSA_NAME_IS_DEFAULT_DEF (op)
1554       && gimple_assign_single_p (SSA_NAME_DEF_STMT (op)))
1555     return unmodified_parm (SSA_NAME_DEF_STMT (op),
1556                             gimple_assign_rhs1 (SSA_NAME_DEF_STMT (op)));
1557   return NULL_TREE;
1558 }
1559
1560 /* If OP refers to a value of a function parameter or value loaded from an
1561    aggregate passed to a parameter (either by value or reference), return TRUE
1562    and store the number of the parameter to *INDEX_P and information whether
1563    and how it has been loaded from an aggregate into *AGGPOS.  INFO describes
1564    the function parameters, STMT is the statement in which OP is used or
1565    loaded.  */
1566
1567 static bool
1568 unmodified_parm_or_parm_agg_item (struct ipa_func_body_info *fbi,
1569                                   gimple *stmt, tree op, int *index_p,
1570                                   struct agg_position_info *aggpos)
1571 {
1572   tree res = unmodified_parm_1 (stmt, op);
1573
1574   gcc_checking_assert (aggpos);
1575   if (res)
1576     {
1577       *index_p = ipa_get_param_decl_index (fbi->info, res);
1578       if (*index_p < 0)
1579         return false;
1580       aggpos->agg_contents = false;
1581       aggpos->by_ref = false;
1582       return true;
1583     }
1584
1585   if (TREE_CODE (op) == SSA_NAME)
1586     {
1587       if (SSA_NAME_IS_DEFAULT_DEF (op)
1588           || !gimple_assign_single_p (SSA_NAME_DEF_STMT (op)))
1589         return false;
1590       stmt = SSA_NAME_DEF_STMT (op);
1591       op = gimple_assign_rhs1 (stmt);
1592       if (!REFERENCE_CLASS_P (op))
1593         return unmodified_parm_or_parm_agg_item (fbi, stmt, op, index_p,
1594                                                  aggpos);
1595     }
1596
1597   aggpos->agg_contents = true;
1598   return ipa_load_from_parm_agg (fbi, fbi->info->descriptors,
1599                                  stmt, op, index_p, &aggpos->offset,
1600                                  NULL, &aggpos->by_ref);
1601 }
1602
1603 /* See if statement might disappear after inlining.
1604    0 - means not eliminated
1605    1 - half of statements goes away
1606    2 - for sure it is eliminated.
1607    We are not terribly sophisticated, basically looking for simple abstraction
1608    penalty wrappers.  */
1609
1610 static int
1611 eliminated_by_inlining_prob (gimple *stmt)
1612 {
1613   enum gimple_code code = gimple_code (stmt);
1614   enum tree_code rhs_code;
1615
1616   if (!optimize)
1617     return 0;
1618
1619   switch (code)
1620     {
1621     case GIMPLE_RETURN:
1622       return 2;
1623     case GIMPLE_ASSIGN:
1624       if (gimple_num_ops (stmt) != 2)
1625         return 0;
1626
1627       rhs_code = gimple_assign_rhs_code (stmt);
1628
1629       /* Casts of parameters, loads from parameters passed by reference
1630          and stores to return value or parameters are often free after
1631          inlining dua to SRA and further combining.
1632          Assume that half of statements goes away.  */
1633       if (CONVERT_EXPR_CODE_P (rhs_code)
1634           || rhs_code == VIEW_CONVERT_EXPR
1635           || rhs_code == ADDR_EXPR
1636           || gimple_assign_rhs_class (stmt) == GIMPLE_SINGLE_RHS)
1637         {
1638           tree rhs = gimple_assign_rhs1 (stmt);
1639           tree lhs = gimple_assign_lhs (stmt);
1640           tree inner_rhs = get_base_address (rhs);
1641           tree inner_lhs = get_base_address (lhs);
1642           bool rhs_free = false;
1643           bool lhs_free = false;
1644
1645           if (!inner_rhs)
1646             inner_rhs = rhs;
1647           if (!inner_lhs)
1648             inner_lhs = lhs;
1649
1650           /* Reads of parameter are expected to be free.  */
1651           if (unmodified_parm (stmt, inner_rhs))
1652             rhs_free = true;
1653           /* Match expressions of form &this->field. Those will most likely
1654              combine with something upstream after inlining.  */
1655           else if (TREE_CODE (inner_rhs) == ADDR_EXPR)
1656             {
1657               tree op = get_base_address (TREE_OPERAND (inner_rhs, 0));
1658               if (TREE_CODE (op) == PARM_DECL)
1659                 rhs_free = true;
1660               else if (TREE_CODE (op) == MEM_REF
1661                        && unmodified_parm (stmt, TREE_OPERAND (op, 0)))
1662                 rhs_free = true;
1663             }
1664
1665           /* When parameter is not SSA register because its address is taken
1666              and it is just copied into one, the statement will be completely
1667              free after inlining (we will copy propagate backward).   */
1668           if (rhs_free && is_gimple_reg (lhs))
1669             return 2;
1670
1671           /* Reads of parameters passed by reference
1672              expected to be free (i.e. optimized out after inlining).  */
1673           if (TREE_CODE (inner_rhs) == MEM_REF
1674               && unmodified_parm (stmt, TREE_OPERAND (inner_rhs, 0)))
1675             rhs_free = true;
1676
1677           /* Copying parameter passed by reference into gimple register is
1678              probably also going to copy propagate, but we can't be quite
1679              sure.  */
1680           if (rhs_free && is_gimple_reg (lhs))
1681             lhs_free = true;
1682
1683           /* Writes to parameters, parameters passed by value and return value
1684              (either dirrectly or passed via invisible reference) are free.
1685
1686              TODO: We ought to handle testcase like
1687              struct a {int a,b;};
1688              struct a
1689              retrurnsturct (void)
1690              {
1691              struct a a ={1,2};
1692              return a;
1693              }
1694
1695              This translate into:
1696
1697              retrurnsturct ()
1698              {
1699              int a$b;
1700              int a$a;
1701              struct a a;
1702              struct a D.2739;
1703
1704              <bb 2>:
1705              D.2739.a = 1;
1706              D.2739.b = 2;
1707              return D.2739;
1708
1709              }
1710              For that we either need to copy ipa-split logic detecting writes
1711              to return value.  */
1712           if (TREE_CODE (inner_lhs) == PARM_DECL
1713               || TREE_CODE (inner_lhs) == RESULT_DECL
1714               || (TREE_CODE (inner_lhs) == MEM_REF
1715                   && (unmodified_parm (stmt, TREE_OPERAND (inner_lhs, 0))
1716                       || (TREE_CODE (TREE_OPERAND (inner_lhs, 0)) == SSA_NAME
1717                           && SSA_NAME_VAR (TREE_OPERAND (inner_lhs, 0))
1718                           && TREE_CODE (SSA_NAME_VAR (TREE_OPERAND
1719                                                       (inner_lhs,
1720                                                        0))) == RESULT_DECL))))
1721             lhs_free = true;
1722           if (lhs_free
1723               && (is_gimple_reg (rhs) || is_gimple_min_invariant (rhs)))
1724             rhs_free = true;
1725           if (lhs_free && rhs_free)
1726             return 1;
1727         }
1728       return 0;
1729     default:
1730       return 0;
1731     }
1732 }
1733
1734
1735 /* If BB ends by a conditional we can turn into predicates, attach corresponding
1736    predicates to the CFG edges.   */
1737
1738 static void
1739 set_cond_stmt_execution_predicate (struct ipa_func_body_info *fbi,
1740                                    struct inline_summary *summary,
1741                                    basic_block bb)
1742 {
1743   gimple *last;
1744   tree op;
1745   int index;
1746   struct agg_position_info aggpos;
1747   enum tree_code code, inverted_code;
1748   edge e;
1749   edge_iterator ei;
1750   gimple *set_stmt;
1751   tree op2;
1752
1753   last = last_stmt (bb);
1754   if (!last || gimple_code (last) != GIMPLE_COND)
1755     return;
1756   if (!is_gimple_ip_invariant (gimple_cond_rhs (last)))
1757     return;
1758   op = gimple_cond_lhs (last);
1759   /* TODO: handle conditionals like
1760      var = op0 < 4;
1761      if (var != 0).  */
1762   if (unmodified_parm_or_parm_agg_item (fbi, last, op, &index, &aggpos))
1763     {
1764       code = gimple_cond_code (last);
1765       inverted_code = invert_tree_comparison (code, HONOR_NANS (op));
1766
1767       FOR_EACH_EDGE (e, ei, bb->succs)
1768         {
1769           enum tree_code this_code = (e->flags & EDGE_TRUE_VALUE
1770                                       ? code : inverted_code);
1771           /* invert_tree_comparison will return ERROR_MARK on FP
1772              comparsions that are not EQ/NE instead of returning proper
1773              unordered one.  Be sure it is not confused with NON_CONSTANT.  */
1774           if (this_code != ERROR_MARK)
1775             {
1776               struct predicate p = add_condition (summary, index, &aggpos,
1777                                                   this_code,
1778                                                   gimple_cond_rhs (last));
1779               e->aux = edge_predicate_pool.allocate ();
1780               *(struct predicate *) e->aux = p;
1781             }
1782         }
1783     }
1784
1785   if (TREE_CODE (op) != SSA_NAME)
1786     return;
1787   /* Special case
1788      if (builtin_constant_p (op))
1789      constant_code
1790      else
1791      nonconstant_code.
1792      Here we can predicate nonconstant_code.  We can't
1793      really handle constant_code since we have no predicate
1794      for this and also the constant code is not known to be
1795      optimized away when inliner doen't see operand is constant.
1796      Other optimizers might think otherwise.  */
1797   if (gimple_cond_code (last) != NE_EXPR
1798       || !integer_zerop (gimple_cond_rhs (last)))
1799     return;
1800   set_stmt = SSA_NAME_DEF_STMT (op);
1801   if (!gimple_call_builtin_p (set_stmt, BUILT_IN_CONSTANT_P)
1802       || gimple_call_num_args (set_stmt) != 1)
1803     return;
1804   op2 = gimple_call_arg (set_stmt, 0);
1805   if (!unmodified_parm_or_parm_agg_item (fbi, set_stmt, op2, &index, &aggpos))
1806     return;
1807   FOR_EACH_EDGE (e, ei, bb->succs) if (e->flags & EDGE_FALSE_VALUE)
1808     {
1809       struct predicate p = add_condition (summary, index, &aggpos,
1810                                           IS_NOT_CONSTANT, NULL_TREE);
1811       e->aux = edge_predicate_pool.allocate ();
1812       *(struct predicate *) e->aux = p;
1813     }
1814 }
1815
1816
1817 /* If BB ends by a switch we can turn into predicates, attach corresponding
1818    predicates to the CFG edges.   */
1819
1820 static void
1821 set_switch_stmt_execution_predicate (struct ipa_func_body_info *fbi,
1822                                      struct inline_summary *summary,
1823                                      basic_block bb)
1824 {
1825   gimple *lastg;
1826   tree op;
1827   int index;
1828   struct agg_position_info aggpos;
1829   edge e;
1830   edge_iterator ei;
1831   size_t n;
1832   size_t case_idx;
1833
1834   lastg = last_stmt (bb);
1835   if (!lastg || gimple_code (lastg) != GIMPLE_SWITCH)
1836     return;
1837   gswitch *last = as_a <gswitch *> (lastg);
1838   op = gimple_switch_index (last);
1839   if (!unmodified_parm_or_parm_agg_item (fbi, last, op, &index, &aggpos))
1840     return;
1841
1842   FOR_EACH_EDGE (e, ei, bb->succs)
1843     {
1844       e->aux = edge_predicate_pool.allocate ();
1845       *(struct predicate *) e->aux = false_predicate ();
1846     }
1847   n = gimple_switch_num_labels (last);
1848   for (case_idx = 0; case_idx < n; ++case_idx)
1849     {
1850       tree cl = gimple_switch_label (last, case_idx);
1851       tree min, max;
1852       struct predicate p;
1853
1854       e = find_edge (bb, label_to_block (CASE_LABEL (cl)));
1855       min = CASE_LOW (cl);
1856       max = CASE_HIGH (cl);
1857
1858       /* For default we might want to construct predicate that none
1859          of cases is met, but it is bit hard to do not having negations
1860          of conditionals handy.  */
1861       if (!min && !max)
1862         p = true_predicate ();
1863       else if (!max)
1864         p = add_condition (summary, index, &aggpos, EQ_EXPR, min);
1865       else
1866         {
1867           struct predicate p1, p2;
1868           p1 = add_condition (summary, index, &aggpos, GE_EXPR, min);
1869           p2 = add_condition (summary, index, &aggpos, LE_EXPR, max);
1870           p = and_predicates (summary->conds, &p1, &p2);
1871         }
1872       *(struct predicate *) e->aux
1873         = or_predicates (summary->conds, &p, (struct predicate *) e->aux);
1874     }
1875 }
1876
1877
1878 /* For each BB in NODE attach to its AUX pointer predicate under
1879    which it is executable.  */
1880
1881 static void
1882 compute_bb_predicates (struct ipa_func_body_info *fbi,
1883                        struct cgraph_node *node,
1884                        struct inline_summary *summary)
1885 {
1886   struct function *my_function = DECL_STRUCT_FUNCTION (node->decl);
1887   bool done = false;
1888   basic_block bb;
1889
1890   FOR_EACH_BB_FN (bb, my_function)
1891     {
1892       set_cond_stmt_execution_predicate (fbi, summary, bb);
1893       set_switch_stmt_execution_predicate (fbi, summary, bb);
1894     }
1895
1896   /* Entry block is always executable.  */
1897   ENTRY_BLOCK_PTR_FOR_FN (my_function)->aux
1898     = edge_predicate_pool.allocate ();
1899   *(struct predicate *) ENTRY_BLOCK_PTR_FOR_FN (my_function)->aux
1900     = true_predicate ();
1901
1902   /* A simple dataflow propagation of predicates forward in the CFG.
1903      TODO: work in reverse postorder.  */
1904   while (!done)
1905     {
1906       done = true;
1907       FOR_EACH_BB_FN (bb, my_function)
1908         {
1909           struct predicate p = false_predicate ();
1910           edge e;
1911           edge_iterator ei;
1912           FOR_EACH_EDGE (e, ei, bb->preds)
1913             {
1914               if (e->src->aux)
1915                 {
1916                   struct predicate this_bb_predicate
1917                     = *(struct predicate *) e->src->aux;
1918                   if (e->aux)
1919                     this_bb_predicate
1920                       = and_predicates (summary->conds, &this_bb_predicate,
1921                                         (struct predicate *) e->aux);
1922                   p = or_predicates (summary->conds, &p, &this_bb_predicate);
1923                   if (true_predicate_p (&p))
1924                     break;
1925                 }
1926             }
1927           if (false_predicate_p (&p))
1928             gcc_assert (!bb->aux);
1929           else
1930             {
1931               if (!bb->aux)
1932                 {
1933                   done = false;
1934                   bb->aux = edge_predicate_pool.allocate ();
1935                   *((struct predicate *) bb->aux) = p;
1936                 }
1937               else if (!predicates_equal_p (&p, (struct predicate *) bb->aux))
1938                 {
1939                   /* This OR operation is needed to ensure monotonous data flow
1940                      in the case we hit the limit on number of clauses and the
1941                      and/or operations above give approximate answers.  */
1942                   p = or_predicates (summary->conds, &p, (struct predicate *)bb->aux);
1943                   if (!predicates_equal_p (&p, (struct predicate *) bb->aux))
1944                     {
1945                       done = false;
1946                       *((struct predicate *) bb->aux) = p;
1947                     }
1948                 }
1949             }
1950         }
1951     }
1952 }
1953
1954
1955 /* We keep info about constantness of SSA names.  */
1956
1957 typedef struct predicate predicate_t;
1958 /* Return predicate specifying when the STMT might have result that is not
1959    a compile time constant.  */
1960
1961 static struct predicate
1962 will_be_nonconstant_expr_predicate (struct ipa_node_params *info,
1963                                     struct inline_summary *summary,
1964                                     tree expr,
1965                                     vec<predicate_t> nonconstant_names)
1966 {
1967   tree parm;
1968   int index;
1969
1970   while (UNARY_CLASS_P (expr))
1971     expr = TREE_OPERAND (expr, 0);
1972
1973   parm = unmodified_parm (NULL, expr);
1974   if (parm && (index = ipa_get_param_decl_index (info, parm)) >= 0)
1975     return add_condition (summary, index, NULL, CHANGED, NULL_TREE);
1976   if (is_gimple_min_invariant (expr))
1977     return false_predicate ();
1978   if (TREE_CODE (expr) == SSA_NAME)
1979     return nonconstant_names[SSA_NAME_VERSION (expr)];
1980   if (BINARY_CLASS_P (expr) || COMPARISON_CLASS_P (expr))
1981     {
1982       struct predicate p1 = will_be_nonconstant_expr_predicate
1983         (info, summary, TREE_OPERAND (expr, 0),
1984          nonconstant_names);
1985       struct predicate p2;
1986       if (true_predicate_p (&p1))
1987         return p1;
1988       p2 = will_be_nonconstant_expr_predicate (info, summary,
1989                                                TREE_OPERAND (expr, 1),
1990                                                nonconstant_names);
1991       return or_predicates (summary->conds, &p1, &p2);
1992     }
1993   else if (TREE_CODE (expr) == COND_EXPR)
1994     {
1995       struct predicate p1 = will_be_nonconstant_expr_predicate
1996         (info, summary, TREE_OPERAND (expr, 0),
1997          nonconstant_names);
1998       struct predicate p2;
1999       if (true_predicate_p (&p1))
2000         return p1;
2001       p2 = will_be_nonconstant_expr_predicate (info, summary,
2002                                                TREE_OPERAND (expr, 1),
2003                                                nonconstant_names);
2004       if (true_predicate_p (&p2))
2005         return p2;
2006       p1 = or_predicates (summary->conds, &p1, &p2);
2007       p2 = will_be_nonconstant_expr_predicate (info, summary,
2008                                                TREE_OPERAND (expr, 2),
2009                                                nonconstant_names);
2010       return or_predicates (summary->conds, &p1, &p2);
2011     }
2012   else
2013     {
2014       debug_tree (expr);
2015       gcc_unreachable ();
2016     }
2017   return false_predicate ();
2018 }
2019
2020
2021 /* Return predicate specifying when the STMT might have result that is not
2022    a compile time constant.  */
2023
2024 static struct predicate
2025 will_be_nonconstant_predicate (struct ipa_func_body_info *fbi,
2026                                struct inline_summary *summary,
2027                                gimple *stmt,
2028                                vec<predicate_t> nonconstant_names)
2029 {
2030   struct predicate p = true_predicate ();
2031   ssa_op_iter iter;
2032   tree use;
2033   struct predicate op_non_const;
2034   bool is_load;
2035   int base_index;
2036   struct agg_position_info aggpos;
2037
2038   /* What statments might be optimized away
2039      when their arguments are constant.  */
2040   if (gimple_code (stmt) != GIMPLE_ASSIGN
2041       && gimple_code (stmt) != GIMPLE_COND
2042       && gimple_code (stmt) != GIMPLE_SWITCH
2043       && (gimple_code (stmt) != GIMPLE_CALL
2044           || !(gimple_call_flags (stmt) & ECF_CONST)))
2045     return p;
2046
2047   /* Stores will stay anyway.  */
2048   if (gimple_store_p (stmt))
2049     return p;
2050
2051   is_load = gimple_assign_load_p (stmt);
2052
2053   /* Loads can be optimized when the value is known.  */
2054   if (is_load)
2055     {
2056       tree op;
2057       gcc_assert (gimple_assign_single_p (stmt));
2058       op = gimple_assign_rhs1 (stmt);
2059       if (!unmodified_parm_or_parm_agg_item (fbi, stmt, op, &base_index,
2060                                              &aggpos))
2061         return p;
2062     }
2063   else
2064     base_index = -1;
2065
2066   /* See if we understand all operands before we start
2067      adding conditionals.  */
2068   FOR_EACH_SSA_TREE_OPERAND (use, stmt, iter, SSA_OP_USE)
2069     {
2070       tree parm = unmodified_parm (stmt, use);
2071       /* For arguments we can build a condition.  */
2072       if (parm && ipa_get_param_decl_index (fbi->info, parm) >= 0)
2073         continue;
2074       if (TREE_CODE (use) != SSA_NAME)
2075         return p;
2076       /* If we know when operand is constant,
2077          we still can say something useful.  */
2078       if (!true_predicate_p (&nonconstant_names[SSA_NAME_VERSION (use)]))
2079         continue;
2080       return p;
2081     }
2082
2083   if (is_load)
2084     op_non_const =
2085       add_condition (summary, base_index, &aggpos, CHANGED, NULL);
2086   else
2087     op_non_const = false_predicate ();
2088   FOR_EACH_SSA_TREE_OPERAND (use, stmt, iter, SSA_OP_USE)
2089     {
2090       tree parm = unmodified_parm (stmt, use);
2091       int index;
2092
2093       if (parm && (index = ipa_get_param_decl_index (fbi->info, parm)) >= 0)
2094         {
2095           if (index != base_index)
2096             p = add_condition (summary, index, NULL, CHANGED, NULL_TREE);
2097           else
2098             continue;
2099         }
2100       else
2101         p = nonconstant_names[SSA_NAME_VERSION (use)];
2102       op_non_const = or_predicates (summary->conds, &p, &op_non_const);
2103     }
2104   if ((gimple_code (stmt) == GIMPLE_ASSIGN || gimple_code (stmt) == GIMPLE_CALL)
2105       && gimple_op (stmt, 0)
2106       && TREE_CODE (gimple_op (stmt, 0)) == SSA_NAME)
2107     nonconstant_names[SSA_NAME_VERSION (gimple_op (stmt, 0))]
2108       = op_non_const;
2109   return op_non_const;
2110 }
2111
2112 struct record_modified_bb_info
2113 {
2114   bitmap bb_set;
2115   gimple *stmt;
2116 };
2117
2118 /* Callback of walk_aliased_vdefs.  Records basic blocks where the value may be
2119    set except for info->stmt.  */
2120
2121 static bool
2122 record_modified (ao_ref *ao ATTRIBUTE_UNUSED, tree vdef, void *data)
2123 {
2124   struct record_modified_bb_info *info =
2125     (struct record_modified_bb_info *) data;
2126   if (SSA_NAME_DEF_STMT (vdef) == info->stmt)
2127     return false;
2128   bitmap_set_bit (info->bb_set,
2129                   SSA_NAME_IS_DEFAULT_DEF (vdef)
2130                   ? ENTRY_BLOCK_PTR_FOR_FN (cfun)->index
2131                   : gimple_bb (SSA_NAME_DEF_STMT (vdef))->index);
2132   return false;
2133 }
2134
2135 /* Return probability (based on REG_BR_PROB_BASE) that I-th parameter of STMT
2136    will change since last invocation of STMT.
2137
2138    Value 0 is reserved for compile time invariants.
2139    For common parameters it is REG_BR_PROB_BASE.  For loop invariants it
2140    ought to be REG_BR_PROB_BASE / estimated_iters.  */
2141
2142 static int
2143 param_change_prob (gimple *stmt, int i)
2144 {
2145   tree op = gimple_call_arg (stmt, i);
2146   basic_block bb = gimple_bb (stmt);
2147   tree base;
2148
2149   /* Global invariants neve change.  */
2150   if (is_gimple_min_invariant (op))
2151     return 0;
2152   /* We would have to do non-trivial analysis to really work out what
2153      is the probability of value to change (i.e. when init statement
2154      is in a sibling loop of the call).
2155
2156      We do an conservative estimate: when call is executed N times more often
2157      than the statement defining value, we take the frequency 1/N.  */
2158   if (TREE_CODE (op) == SSA_NAME)
2159     {
2160       int init_freq;
2161
2162       if (!bb->frequency)
2163         return REG_BR_PROB_BASE;
2164
2165       if (SSA_NAME_IS_DEFAULT_DEF (op))
2166         init_freq = ENTRY_BLOCK_PTR_FOR_FN (cfun)->frequency;
2167       else
2168         init_freq = gimple_bb (SSA_NAME_DEF_STMT (op))->frequency;
2169
2170       if (!init_freq)
2171         init_freq = 1;
2172       if (init_freq < bb->frequency)
2173         return MAX (GCOV_COMPUTE_SCALE (init_freq, bb->frequency), 1);
2174       else
2175         return REG_BR_PROB_BASE;
2176     }
2177
2178   base = get_base_address (op);
2179   if (base)
2180     {
2181       ao_ref refd;
2182       int max;
2183       struct record_modified_bb_info info;
2184       bitmap_iterator bi;
2185       unsigned index;
2186       tree init = ctor_for_folding (base);
2187
2188       if (init != error_mark_node)
2189         return 0;
2190       if (!bb->frequency)
2191         return REG_BR_PROB_BASE;
2192       ao_ref_init (&refd, op);
2193       info.stmt = stmt;
2194       info.bb_set = BITMAP_ALLOC (NULL);
2195       walk_aliased_vdefs (&refd, gimple_vuse (stmt), record_modified, &info,
2196                           NULL);
2197       if (bitmap_bit_p (info.bb_set, bb->index))
2198         {
2199           BITMAP_FREE (info.bb_set);
2200           return REG_BR_PROB_BASE;
2201         }
2202
2203       /* Assume that every memory is initialized at entry.
2204          TODO: Can we easilly determine if value is always defined
2205          and thus we may skip entry block?  */
2206       if (ENTRY_BLOCK_PTR_FOR_FN (cfun)->frequency)
2207         max = ENTRY_BLOCK_PTR_FOR_FN (cfun)->frequency;
2208       else
2209         max = 1;
2210
2211       EXECUTE_IF_SET_IN_BITMAP (info.bb_set, 0, index, bi)
2212         max = MIN (max, BASIC_BLOCK_FOR_FN (cfun, index)->frequency);
2213
2214       BITMAP_FREE (info.bb_set);
2215       if (max < bb->frequency)
2216         return MAX (GCOV_COMPUTE_SCALE (max, bb->frequency), 1);
2217       else
2218         return REG_BR_PROB_BASE;
2219     }
2220   return REG_BR_PROB_BASE;
2221 }
2222
2223 /* Find whether a basic block BB is the final block of a (half) diamond CFG
2224    sub-graph and if the predicate the condition depends on is known.  If so,
2225    return true and store the pointer the predicate in *P.  */
2226
2227 static bool
2228 phi_result_unknown_predicate (struct ipa_node_params *info,
2229                               inline_summary *summary, basic_block bb,
2230                               struct predicate *p,
2231                               vec<predicate_t> nonconstant_names)
2232 {
2233   edge e;
2234   edge_iterator ei;
2235   basic_block first_bb = NULL;
2236   gimple *stmt;
2237
2238   if (single_pred_p (bb))
2239     {
2240       *p = false_predicate ();
2241       return true;
2242     }
2243
2244   FOR_EACH_EDGE (e, ei, bb->preds)
2245     {
2246       if (single_succ_p (e->src))
2247         {
2248           if (!single_pred_p (e->src))
2249             return false;
2250           if (!first_bb)
2251             first_bb = single_pred (e->src);
2252           else if (single_pred (e->src) != first_bb)
2253             return false;
2254         }
2255       else
2256         {
2257           if (!first_bb)
2258             first_bb = e->src;
2259           else if (e->src != first_bb)
2260             return false;
2261         }
2262     }
2263
2264   if (!first_bb)
2265     return false;
2266
2267   stmt = last_stmt (first_bb);
2268   if (!stmt
2269       || gimple_code (stmt) != GIMPLE_COND
2270       || !is_gimple_ip_invariant (gimple_cond_rhs (stmt)))
2271     return false;
2272
2273   *p = will_be_nonconstant_expr_predicate (info, summary,
2274                                            gimple_cond_lhs (stmt),
2275                                            nonconstant_names);
2276   if (true_predicate_p (p))
2277     return false;
2278   else
2279     return true;
2280 }
2281
2282 /* Given a PHI statement in a function described by inline properties SUMMARY
2283    and *P being the predicate describing whether the selected PHI argument is
2284    known, store a predicate for the result of the PHI statement into
2285    NONCONSTANT_NAMES, if possible.  */
2286
2287 static void
2288 predicate_for_phi_result (struct inline_summary *summary, gphi *phi,
2289                           struct predicate *p,
2290                           vec<predicate_t> nonconstant_names)
2291 {
2292   unsigned i;
2293
2294   for (i = 0; i < gimple_phi_num_args (phi); i++)
2295     {
2296       tree arg = gimple_phi_arg (phi, i)->def;
2297       if (!is_gimple_min_invariant (arg))
2298         {
2299           gcc_assert (TREE_CODE (arg) == SSA_NAME);
2300           *p = or_predicates (summary->conds, p,
2301                               &nonconstant_names[SSA_NAME_VERSION (arg)]);
2302           if (true_predicate_p (p))
2303             return;
2304         }
2305     }
2306
2307   if (dump_file && (dump_flags & TDF_DETAILS))
2308     {
2309       fprintf (dump_file, "\t\tphi predicate: ");
2310       dump_predicate (dump_file, summary->conds, p);
2311     }
2312   nonconstant_names[SSA_NAME_VERSION (gimple_phi_result (phi))] = *p;
2313 }
2314
2315 /* Return predicate specifying when array index in access OP becomes non-constant.  */
2316
2317 static struct predicate
2318 array_index_predicate (inline_summary *info,
2319                        vec< predicate_t> nonconstant_names, tree op)
2320 {
2321   struct predicate p = false_predicate ();
2322   while (handled_component_p (op))
2323     {
2324       if (TREE_CODE (op) == ARRAY_REF || TREE_CODE (op) == ARRAY_RANGE_REF)
2325         {
2326           if (TREE_CODE (TREE_OPERAND (op, 1)) == SSA_NAME)
2327             p = or_predicates (info->conds, &p,
2328                                &nonconstant_names[SSA_NAME_VERSION
2329                                                   (TREE_OPERAND (op, 1))]);
2330         }
2331       op = TREE_OPERAND (op, 0);
2332     }
2333   return p;
2334 }
2335
2336 /* For a typical usage of __builtin_expect (a<b, 1), we
2337    may introduce an extra relation stmt:
2338    With the builtin, we have
2339      t1 = a <= b;
2340      t2 = (long int) t1;
2341      t3 = __builtin_expect (t2, 1);
2342      if (t3 != 0)
2343        goto ...
2344    Without the builtin, we have
2345      if (a<=b)
2346        goto...
2347    This affects the size/time estimation and may have
2348    an impact on the earlier inlining.
2349    Here find this pattern and fix it up later.  */
2350
2351 static gimple *
2352 find_foldable_builtin_expect (basic_block bb)
2353 {
2354   gimple_stmt_iterator bsi;
2355
2356   for (bsi = gsi_start_bb (bb); !gsi_end_p (bsi); gsi_next (&bsi))
2357     {
2358       gimple *stmt = gsi_stmt (bsi);
2359       if (gimple_call_builtin_p (stmt, BUILT_IN_EXPECT)
2360           || (is_gimple_call (stmt)
2361               && gimple_call_internal_p (stmt)
2362               && gimple_call_internal_fn (stmt) == IFN_BUILTIN_EXPECT))
2363         {
2364           tree var = gimple_call_lhs (stmt);
2365           tree arg = gimple_call_arg (stmt, 0);
2366           use_operand_p use_p;
2367           gimple *use_stmt;
2368           bool match = false;
2369           bool done = false;
2370
2371           if (!var || !arg)
2372             continue;
2373           gcc_assert (TREE_CODE (var) == SSA_NAME);
2374
2375           while (TREE_CODE (arg) == SSA_NAME)
2376             {
2377               gimple *stmt_tmp = SSA_NAME_DEF_STMT (arg);
2378               if (!is_gimple_assign (stmt_tmp))
2379                 break;
2380               switch (gimple_assign_rhs_code (stmt_tmp))
2381                 {
2382                   case LT_EXPR:
2383                   case LE_EXPR:
2384                   case GT_EXPR:
2385                   case GE_EXPR:
2386                   case EQ_EXPR:
2387                   case NE_EXPR:
2388                     match = true;
2389                     done = true;
2390                     break;
2391                   CASE_CONVERT:
2392                     break;
2393                   default:
2394                     done = true;
2395                     break;
2396                 }
2397               if (done)
2398                 break;
2399               arg = gimple_assign_rhs1 (stmt_tmp);
2400             }
2401
2402           if (match && single_imm_use (var, &use_p, &use_stmt)
2403               && gimple_code (use_stmt) == GIMPLE_COND)
2404             return use_stmt;
2405         }
2406     }
2407   return NULL;
2408 }
2409
2410 /* Return true when the basic blocks contains only clobbers followed by RESX.
2411    Such BBs are kept around to make removal of dead stores possible with
2412    presence of EH and will be optimized out by optimize_clobbers later in the
2413    game.
2414
2415    NEED_EH is used to recurse in case the clobber has non-EH predecestors
2416    that can be clobber only, too.. When it is false, the RESX is not necessary
2417    on the end of basic block.  */
2418
2419 static bool
2420 clobber_only_eh_bb_p (basic_block bb, bool need_eh = true)
2421 {
2422   gimple_stmt_iterator gsi = gsi_last_bb (bb);
2423   edge_iterator ei;
2424   edge e;
2425
2426   if (need_eh)
2427     {
2428       if (gsi_end_p (gsi))
2429         return false;
2430       if (gimple_code (gsi_stmt (gsi)) != GIMPLE_RESX)
2431         return false;
2432       gsi_prev (&gsi);
2433     }
2434   else if (!single_succ_p (bb))
2435     return false;
2436
2437   for (; !gsi_end_p (gsi); gsi_prev (&gsi))
2438     {
2439       gimple *stmt = gsi_stmt (gsi);
2440       if (is_gimple_debug (stmt))
2441         continue;
2442       if (gimple_clobber_p (stmt))
2443         continue;
2444       if (gimple_code (stmt) == GIMPLE_LABEL)
2445         break;
2446       return false;
2447     }
2448
2449   /* See if all predecestors are either throws or clobber only BBs.  */
2450   FOR_EACH_EDGE (e, ei, bb->preds)
2451     if (!(e->flags & EDGE_EH)
2452         && !clobber_only_eh_bb_p (e->src, false))
2453       return false;
2454
2455   return true;
2456 }
2457
2458 /* Compute function body size parameters for NODE.
2459    When EARLY is true, we compute only simple summaries without
2460    non-trivial predicates to drive the early inliner.  */
2461
2462 static void
2463 estimate_function_body_sizes (struct cgraph_node *node, bool early)
2464 {
2465   gcov_type time = 0;
2466   /* Estimate static overhead for function prologue/epilogue and alignment. */
2467   int size = 2;
2468   /* Benefits are scaled by probability of elimination that is in range
2469      <0,2>.  */
2470   basic_block bb;
2471   struct function *my_function = DECL_STRUCT_FUNCTION (node->decl);
2472   int freq;
2473   struct inline_summary *info = inline_summaries->get (node);
2474   struct predicate bb_predicate;
2475   struct ipa_func_body_info fbi;
2476   vec<predicate_t> nonconstant_names = vNULL;
2477   int nblocks, n;
2478   int *order;
2479   predicate array_index = true_predicate ();
2480   gimple *fix_builtin_expect_stmt;
2481
2482   gcc_assert (my_function && my_function->cfg);
2483   gcc_assert (cfun == my_function);
2484
2485   memset(&fbi, 0, sizeof(fbi));
2486   info->conds = NULL;
2487   info->entry = NULL;
2488
2489   /* When optimizing and analyzing for IPA inliner, initialize loop optimizer
2490      so we can produce proper inline hints.
2491
2492      When optimizing and analyzing for early inliner, initialize node params
2493      so we can produce correct BB predicates.  */
2494
2495   if (opt_for_fn (node->decl, optimize))
2496     {
2497       calculate_dominance_info (CDI_DOMINATORS);
2498       if (!early)
2499         loop_optimizer_init (LOOPS_NORMAL | LOOPS_HAVE_RECORDED_EXITS);
2500       else
2501         {
2502           ipa_check_create_node_params ();
2503           ipa_initialize_node_params (node);
2504         }
2505
2506       if (ipa_node_params_sum)
2507         {
2508           fbi.node = node;
2509           fbi.info = IPA_NODE_REF (node);
2510           fbi.bb_infos = vNULL;
2511           fbi.bb_infos.safe_grow_cleared (last_basic_block_for_fn (cfun));
2512           fbi.param_count = count_formal_params(node->decl);
2513           nonconstant_names.safe_grow_cleared
2514             (SSANAMES (my_function)->length ());
2515         }
2516     }
2517
2518   if (dump_file)
2519     fprintf (dump_file, "\nAnalyzing function body size: %s\n",
2520              node->name ());
2521
2522   /* When we run into maximal number of entries, we assign everything to the
2523      constant truth case.  Be sure to have it in list. */
2524   bb_predicate = true_predicate ();
2525   account_size_time (info, 0, 0, &bb_predicate);
2526
2527   bb_predicate = not_inlined_predicate ();
2528   account_size_time (info, 2 * INLINE_SIZE_SCALE, 0, &bb_predicate);
2529
2530   if (fbi.info)
2531     compute_bb_predicates (&fbi, node, info);
2532   order = XNEWVEC (int, n_basic_blocks_for_fn (cfun));
2533   nblocks = pre_and_rev_post_order_compute (NULL, order, false);
2534   for (n = 0; n < nblocks; n++)
2535     {
2536       bb = BASIC_BLOCK_FOR_FN (cfun, order[n]);
2537       freq = compute_call_stmt_bb_frequency (node->decl, bb);
2538       if (clobber_only_eh_bb_p (bb))
2539         {
2540           if (dump_file && (dump_flags & TDF_DETAILS))
2541             fprintf (dump_file, "\n Ignoring BB %i;"
2542                      " it will be optimized away by cleanup_clobbers\n",
2543                      bb->index);
2544           continue;
2545         }
2546
2547       /* TODO: Obviously predicates can be propagated down across CFG.  */
2548       if (fbi.info)
2549         {
2550           if (bb->aux)
2551             bb_predicate = *(struct predicate *) bb->aux;
2552           else
2553             bb_predicate = false_predicate ();
2554         }
2555       else
2556         bb_predicate = true_predicate ();
2557
2558       if (dump_file && (dump_flags & TDF_DETAILS))
2559         {
2560           fprintf (dump_file, "\n BB %i predicate:", bb->index);
2561           dump_predicate (dump_file, info->conds, &bb_predicate);
2562         }
2563
2564       if (fbi.info && nonconstant_names.exists ())
2565         {
2566           struct predicate phi_predicate;
2567           bool first_phi = true;
2568
2569           for (gphi_iterator bsi = gsi_start_phis (bb); !gsi_end_p (bsi);
2570                gsi_next (&bsi))
2571             {
2572               if (first_phi
2573                   && !phi_result_unknown_predicate (fbi.info, info, bb,
2574                                                     &phi_predicate,
2575                                                     nonconstant_names))
2576                 break;
2577               first_phi = false;
2578               if (dump_file && (dump_flags & TDF_DETAILS))
2579                 {
2580                   fprintf (dump_file, "  ");
2581                   print_gimple_stmt (dump_file, gsi_stmt (bsi), 0, 0);
2582                 }
2583               predicate_for_phi_result (info, bsi.phi (), &phi_predicate,
2584                                         nonconstant_names);
2585             }
2586         }
2587
2588       fix_builtin_expect_stmt = find_foldable_builtin_expect (bb);
2589
2590       for (gimple_stmt_iterator bsi = gsi_start_bb (bb); !gsi_end_p (bsi);
2591            gsi_next (&bsi))
2592         {
2593           gimple *stmt = gsi_stmt (bsi);
2594           int this_size = estimate_num_insns (stmt, &eni_size_weights);
2595           int this_time = estimate_num_insns (stmt, &eni_time_weights);
2596           int prob;
2597           struct predicate will_be_nonconstant;
2598
2599           /* This relation stmt should be folded after we remove
2600              buildin_expect call. Adjust the cost here.  */
2601           if (stmt == fix_builtin_expect_stmt)
2602             {
2603               this_size--;
2604               this_time--;
2605             }
2606
2607           if (dump_file && (dump_flags & TDF_DETAILS))
2608             {
2609               fprintf (dump_file, "  ");
2610               print_gimple_stmt (dump_file, stmt, 0, 0);
2611               fprintf (dump_file, "\t\tfreq:%3.2f size:%3i time:%3i\n",
2612                        ((double) freq) / CGRAPH_FREQ_BASE, this_size,
2613                        this_time);
2614             }
2615
2616           if (gimple_assign_load_p (stmt) && nonconstant_names.exists ())
2617             {
2618               struct predicate this_array_index;
2619               this_array_index =
2620                 array_index_predicate (info, nonconstant_names,
2621                                        gimple_assign_rhs1 (stmt));
2622               if (!false_predicate_p (&this_array_index))
2623                 array_index =
2624                   and_predicates (info->conds, &array_index,
2625                                   &this_array_index);
2626             }
2627           if (gimple_store_p (stmt) && nonconstant_names.exists ())
2628             {
2629               struct predicate this_array_index;
2630               this_array_index =
2631                 array_index_predicate (info, nonconstant_names,
2632                                        gimple_get_lhs (stmt));
2633               if (!false_predicate_p (&this_array_index))
2634                 array_index =
2635                   and_predicates (info->conds, &array_index,
2636                                   &this_array_index);
2637             }
2638
2639
2640           if (is_gimple_call (stmt)
2641               && !gimple_call_internal_p (stmt))
2642             {
2643               struct cgraph_edge *edge = node->get_edge (stmt);
2644               struct inline_edge_summary *es = inline_edge_summary (edge);
2645
2646               /* Special case: results of BUILT_IN_CONSTANT_P will be always
2647                  resolved as constant.  We however don't want to optimize
2648                  out the cgraph edges.  */
2649               if (nonconstant_names.exists ()
2650                   && gimple_call_builtin_p (stmt, BUILT_IN_CONSTANT_P)
2651                   && gimple_call_lhs (stmt)
2652                   && TREE_CODE (gimple_call_lhs (stmt)) == SSA_NAME)
2653                 {
2654                   struct predicate false_p = false_predicate ();
2655                   nonconstant_names[SSA_NAME_VERSION (gimple_call_lhs (stmt))]
2656                     = false_p;
2657                 }
2658               if (ipa_node_params_sum)
2659                 {
2660                   int count = gimple_call_num_args (stmt);
2661                   int i;
2662
2663                   if (count)
2664                     es->param.safe_grow_cleared (count);
2665                   for (i = 0; i < count; i++)
2666                     {
2667                       int prob = param_change_prob (stmt, i);
2668                       gcc_assert (prob >= 0 && prob <= REG_BR_PROB_BASE);
2669                       es->param[i].change_prob = prob;
2670                     }
2671                 }
2672
2673               es->call_stmt_size = this_size;
2674               es->call_stmt_time = this_time;
2675               es->loop_depth = bb_loop_depth (bb);
2676               edge_set_predicate (edge, &bb_predicate);
2677             }
2678
2679           /* TODO: When conditional jump or swithc is known to be constant, but
2680              we did not translate it into the predicates, we really can account
2681              just maximum of the possible paths.  */
2682           if (fbi.info)
2683             will_be_nonconstant
2684               = will_be_nonconstant_predicate (&fbi, info,
2685                                                stmt, nonconstant_names);
2686           if (this_time || this_size)
2687             {
2688               struct predicate p;
2689
2690               this_time *= freq;
2691
2692               prob = eliminated_by_inlining_prob (stmt);
2693               if (prob == 1 && dump_file && (dump_flags & TDF_DETAILS))
2694                 fprintf (dump_file,
2695                          "\t\t50%% will be eliminated by inlining\n");
2696               if (prob == 2 && dump_file && (dump_flags & TDF_DETAILS))
2697                 fprintf (dump_file, "\t\tWill be eliminated by inlining\n");
2698
2699               if (fbi.info)
2700                 p = and_predicates (info->conds, &bb_predicate,
2701                                     &will_be_nonconstant);
2702               else
2703                 p = true_predicate ();
2704
2705               if (!false_predicate_p (&p)
2706                   || (is_gimple_call (stmt)
2707                       && !false_predicate_p (&bb_predicate)))
2708                 {
2709                   time += this_time;
2710                   size += this_size;
2711                   if (time > MAX_TIME * INLINE_TIME_SCALE)
2712                     time = MAX_TIME * INLINE_TIME_SCALE;
2713                 }
2714
2715               /* We account everything but the calls.  Calls have their own
2716                  size/time info attached to cgraph edges.  This is necessary
2717                  in order to make the cost disappear after inlining.  */
2718               if (!is_gimple_call (stmt))
2719                 {
2720                   if (prob)
2721                     {
2722                       struct predicate ip = not_inlined_predicate ();
2723                       ip = and_predicates (info->conds, &ip, &p);
2724                       account_size_time (info, this_size * prob,
2725                                          this_time * prob, &ip);
2726                     }
2727                   if (prob != 2)
2728                     account_size_time (info, this_size * (2 - prob),
2729                                        this_time * (2 - prob), &p);
2730                 }
2731
2732               gcc_assert (time >= 0);
2733               gcc_assert (size >= 0);
2734             }
2735         }
2736     }
2737   set_hint_predicate (&inline_summaries->get (node)->array_index, array_index);
2738   time = (time + CGRAPH_FREQ_BASE / 2) / CGRAPH_FREQ_BASE;
2739   if (time > MAX_TIME)
2740     time = MAX_TIME;
2741   free (order);
2742
2743   if (nonconstant_names.exists () && !early)
2744     {
2745       struct loop *loop;
2746       predicate loop_iterations = true_predicate ();
2747       predicate loop_stride = true_predicate ();
2748
2749       if (dump_file && (dump_flags & TDF_DETAILS))
2750         flow_loops_dump (dump_file, NULL, 0);
2751       scev_initialize ();
2752       FOR_EACH_LOOP (loop, 0)
2753         {
2754           vec<edge> exits;
2755           edge ex;
2756           unsigned int j;
2757           struct tree_niter_desc niter_desc;
2758           bb_predicate = *(struct predicate *) loop->header->aux;
2759
2760           exits = get_loop_exit_edges (loop);
2761           FOR_EACH_VEC_ELT (exits, j, ex)
2762             if (number_of_iterations_exit (loop, ex, &niter_desc, false)
2763                 && !is_gimple_min_invariant (niter_desc.niter))
2764             {
2765               predicate will_be_nonconstant
2766                 = will_be_nonconstant_expr_predicate (fbi.info, info,
2767                                                       niter_desc.niter,
2768                                                       nonconstant_names);
2769               if (!true_predicate_p (&will_be_nonconstant))
2770                 will_be_nonconstant = and_predicates (info->conds,
2771                                                       &bb_predicate,
2772                                                       &will_be_nonconstant);
2773               if (!true_predicate_p (&will_be_nonconstant)
2774                   && !false_predicate_p (&will_be_nonconstant))
2775                 /* This is slightly inprecise.  We may want to represent each
2776                    loop with independent predicate.  */
2777                 loop_iterations =
2778                   and_predicates (info->conds, &loop_iterations,
2779                                   &will_be_nonconstant);
2780             }
2781           exits.release ();
2782         }
2783
2784       /* To avoid quadratic behavior we analyze stride predicates only
2785          with respect to the containing loop.  Thus we simply iterate
2786          over all defs in the outermost loop body.  */
2787       for (loop = loops_for_fn (cfun)->tree_root->inner;
2788            loop != NULL; loop = loop->next)
2789         {
2790           basic_block *body = get_loop_body (loop);
2791           for (unsigned i = 0; i < loop->num_nodes; i++)
2792             {
2793               gimple_stmt_iterator gsi;
2794               bb_predicate = *(struct predicate *) body[i]->aux;
2795               for (gsi = gsi_start_bb (body[i]); !gsi_end_p (gsi);
2796                    gsi_next (&gsi))
2797                 {
2798                   gimple *stmt = gsi_stmt (gsi);
2799
2800                   if (!is_gimple_assign (stmt))
2801                     continue;
2802
2803                   tree def = gimple_assign_lhs (stmt);
2804                   if (TREE_CODE (def) != SSA_NAME)
2805                     continue;
2806
2807                   affine_iv iv;
2808                   if (!simple_iv (loop_containing_stmt (stmt),
2809                                   loop_containing_stmt (stmt),
2810                                   def, &iv, true)
2811                       || is_gimple_min_invariant (iv.step))
2812                     continue;
2813
2814                   predicate will_be_nonconstant
2815                     = will_be_nonconstant_expr_predicate (fbi.info, info,
2816                                                           iv.step,
2817                                                           nonconstant_names);
2818                   if (!true_predicate_p (&will_be_nonconstant))
2819                     will_be_nonconstant
2820                       = and_predicates (info->conds, &bb_predicate,
2821                                         &will_be_nonconstant);
2822                   if (!true_predicate_p (&will_be_nonconstant)
2823                       && !false_predicate_p (&will_be_nonconstant))
2824                     /* This is slightly inprecise.  We may want to represent
2825                        each loop with independent predicate.  */
2826                     loop_stride = and_predicates (info->conds, &loop_stride,
2827                                                   &will_be_nonconstant);
2828                 }
2829             }
2830           free (body);
2831         }
2832       set_hint_predicate (&inline_summaries->get (node)->loop_iterations,
2833                           loop_iterations);
2834       set_hint_predicate (&inline_summaries->get (node)->loop_stride,
2835                           loop_stride);
2836       scev_finalize ();
2837     }
2838   FOR_ALL_BB_FN (bb, my_function)
2839     {
2840       edge e;
2841       edge_iterator ei;
2842
2843       if (bb->aux)
2844         edge_predicate_pool.remove ((predicate *)bb->aux);
2845       bb->aux = NULL;
2846       FOR_EACH_EDGE (e, ei, bb->succs)
2847         {
2848           if (e->aux)
2849             edge_predicate_pool.remove ((predicate *) e->aux);
2850           e->aux = NULL;
2851         }
2852     }
2853   inline_summaries->get (node)->self_time = time;
2854   inline_summaries->get (node)->self_size = size;
2855   nonconstant_names.release ();
2856   ipa_release_body_info (&fbi);
2857   if (opt_for_fn (node->decl, optimize))
2858     {
2859       if (!early)
2860         loop_optimizer_finalize ();
2861       else if (!ipa_edge_args_vector)
2862         ipa_free_all_node_params ();
2863       free_dominance_info (CDI_DOMINATORS);
2864     }
2865   if (dump_file)
2866     {
2867       fprintf (dump_file, "\n");
2868       dump_inline_summary (dump_file, node);
2869     }
2870 }
2871
2872
2873 /* Compute parameters of functions used by inliner.
2874    EARLY is true when we compute parameters for the early inliner  */
2875
2876 void
2877 compute_inline_parameters (struct cgraph_node *node, bool early)
2878 {
2879   HOST_WIDE_INT self_stack_size;
2880   struct cgraph_edge *e;
2881   struct inline_summary *info;
2882
2883   gcc_assert (!node->global.inlined_to);
2884
2885   inline_summary_alloc ();
2886
2887   info = inline_summaries->get (node);
2888   reset_inline_summary (node, info);
2889
2890   /* FIXME: Thunks are inlinable, but tree-inline don't know how to do that.
2891      Once this happen, we will need to more curefully predict call
2892      statement size.  */
2893   if (node->thunk.thunk_p)
2894     {
2895       struct inline_edge_summary *es = inline_edge_summary (node->callees);
2896       struct predicate t = true_predicate ();
2897
2898       info->inlinable = 0;
2899       node->callees->call_stmt_cannot_inline_p = true;
2900       node->local.can_change_signature = false;
2901       es->call_stmt_time = 1;
2902       es->call_stmt_size = 1;
2903       account_size_time (info, 0, 0, &t);
2904       return;
2905     }
2906
2907   /* Even is_gimple_min_invariant rely on current_function_decl.  */
2908   push_cfun (DECL_STRUCT_FUNCTION (node->decl));
2909
2910   /* Estimate the stack size for the function if we're optimizing.  */
2911   self_stack_size = optimize ? estimated_stack_frame_size (node) : 0;
2912   info->estimated_self_stack_size = self_stack_size;
2913   info->estimated_stack_size = self_stack_size;
2914   info->stack_frame_offset = 0;
2915
2916   /* Can this function be inlined at all?  */
2917   if (!opt_for_fn (node->decl, optimize)
2918       && !lookup_attribute ("always_inline",
2919                             DECL_ATTRIBUTES (node->decl)))
2920     info->inlinable = false;
2921   else
2922     info->inlinable = tree_inlinable_function_p (node->decl);
2923
2924   info->contains_cilk_spawn = fn_contains_cilk_spawn_p (cfun);
2925
2926   /* Type attributes can use parameter indices to describe them.  */
2927   if (TYPE_ATTRIBUTES (TREE_TYPE (node->decl)))
2928     node->local.can_change_signature = false;
2929   else
2930     {
2931       /* Otherwise, inlinable functions always can change signature.  */
2932       if (info->inlinable)
2933         node->local.can_change_signature = true;
2934       else
2935         {
2936           /* Functions calling builtin_apply can not change signature.  */
2937           for (e = node->callees; e; e = e->next_callee)
2938             {
2939               tree cdecl = e->callee->decl;
2940               if (DECL_BUILT_IN (cdecl)
2941                   && DECL_BUILT_IN_CLASS (cdecl) == BUILT_IN_NORMAL
2942                   && (DECL_FUNCTION_CODE (cdecl) == BUILT_IN_APPLY_ARGS
2943                       || DECL_FUNCTION_CODE (cdecl) == BUILT_IN_VA_START))
2944                 break;
2945             }
2946           node->local.can_change_signature = !e;
2947         }
2948     }
2949   estimate_function_body_sizes (node, early);
2950
2951   for (e = node->callees; e; e = e->next_callee)
2952     if (e->callee->comdat_local_p ())
2953       break;
2954   node->calls_comdat_local = (e != NULL);
2955
2956   /* Inlining characteristics are maintained by the cgraph_mark_inline.  */
2957   info->time = info->self_time;
2958   info->size = info->self_size;
2959   info->stack_frame_offset = 0;
2960   info->estimated_stack_size = info->estimated_self_stack_size;
2961   if (flag_checking)
2962     {
2963       inline_update_overall_summary (node);
2964       gcc_assert (info->time == info->self_time
2965                   && info->size == info->self_size);
2966     }
2967
2968   pop_cfun ();
2969 }
2970
2971
2972 /* Compute parameters of functions used by inliner using
2973    current_function_decl.  */
2974
2975 static unsigned int
2976 compute_inline_parameters_for_current (void)
2977 {
2978   compute_inline_parameters (cgraph_node::get (current_function_decl), true);
2979   return 0;
2980 }
2981
2982 namespace {
2983
2984 const pass_data pass_data_inline_parameters =
2985 {
2986   GIMPLE_PASS, /* type */
2987   "inline_param", /* name */
2988   OPTGROUP_INLINE, /* optinfo_flags */
2989   TV_INLINE_PARAMETERS, /* tv_id */
2990   0, /* properties_required */
2991   0, /* properties_provided */
2992   0, /* properties_destroyed */
2993   0, /* todo_flags_start */
2994   0, /* todo_flags_finish */
2995 };
2996
2997 class pass_inline_parameters : public gimple_opt_pass
2998 {
2999 public:
3000   pass_inline_parameters (gcc::context *ctxt)
3001     : gimple_opt_pass (pass_data_inline_parameters, ctxt)
3002   {}
3003
3004   /* opt_pass methods: */
3005   opt_pass * clone () { return new pass_inline_parameters (m_ctxt); }
3006   virtual unsigned int execute (function *)
3007     {
3008       return compute_inline_parameters_for_current ();
3009     }
3010
3011 }; // class pass_inline_parameters
3012
3013 } // anon namespace
3014
3015 gimple_opt_pass *
3016 make_pass_inline_parameters (gcc::context *ctxt)
3017 {
3018   return new pass_inline_parameters (ctxt);
3019 }
3020
3021
3022 /* Estimate benefit devirtualizing indirect edge IE, provided KNOWN_VALS,
3023    KNOWN_CONTEXTS and KNOWN_AGGS.  */
3024
3025 static bool
3026 estimate_edge_devirt_benefit (struct cgraph_edge *ie,
3027                               int *size, int *time,
3028                               vec<tree> known_vals,
3029                               vec<ipa_polymorphic_call_context> known_contexts,
3030                               vec<ipa_agg_jump_function_p> known_aggs)
3031 {
3032   tree target;
3033   struct cgraph_node *callee;
3034   struct inline_summary *isummary;
3035   enum availability avail;
3036   bool speculative;
3037
3038   if (!known_vals.exists () && !known_contexts.exists ())
3039     return false;
3040   if (!opt_for_fn (ie->caller->decl, flag_indirect_inlining))
3041     return false;
3042
3043   target = ipa_get_indirect_edge_target (ie, known_vals, known_contexts,
3044                                          known_aggs, &speculative);
3045   if (!target || speculative)
3046     return false;
3047
3048   /* Account for difference in cost between indirect and direct calls.  */
3049   *size -= (eni_size_weights.indirect_call_cost - eni_size_weights.call_cost);
3050   *time -= (eni_time_weights.indirect_call_cost - eni_time_weights.call_cost);
3051   gcc_checking_assert (*time >= 0);
3052   gcc_checking_assert (*size >= 0);
3053
3054   callee = cgraph_node::get (target);
3055   if (!callee || !callee->definition)
3056     return false;
3057   callee = callee->function_symbol (&avail);
3058   if (avail < AVAIL_AVAILABLE)
3059     return false;
3060   isummary = inline_summaries->get (callee);
3061   return isummary->inlinable;
3062 }
3063
3064 /* Increase SIZE, MIN_SIZE (if non-NULL) and TIME for size and time needed to
3065    handle edge E with probability PROB.
3066    Set HINTS if edge may be devirtualized.
3067    KNOWN_VALS, KNOWN_AGGS and KNOWN_CONTEXTS describe context of the call
3068    site.  */
3069
3070 static inline void
3071 estimate_edge_size_and_time (struct cgraph_edge *e, int *size, int *min_size,
3072                              int *time,
3073                              int prob,
3074                              vec<tree> known_vals,
3075                              vec<ipa_polymorphic_call_context> known_contexts,
3076                              vec<ipa_agg_jump_function_p> known_aggs,
3077                              inline_hints *hints)
3078 {
3079   struct inline_edge_summary *es = inline_edge_summary (e);
3080   int call_size = es->call_stmt_size;
3081   int call_time = es->call_stmt_time;
3082   int cur_size;
3083   if (!e->callee
3084       && estimate_edge_devirt_benefit (e, &call_size, &call_time,
3085                                        known_vals, known_contexts, known_aggs)
3086       && hints && e->maybe_hot_p ())
3087     *hints |= INLINE_HINT_indirect_call;
3088   cur_size = call_size * INLINE_SIZE_SCALE;
3089   *size += cur_size;
3090   if (min_size)
3091     *min_size += cur_size;
3092   *time += apply_probability ((gcov_type) call_time, prob)
3093     * e->frequency * (INLINE_TIME_SCALE / CGRAPH_FREQ_BASE);
3094   if (*time > MAX_TIME * INLINE_TIME_SCALE)
3095     *time = MAX_TIME * INLINE_TIME_SCALE;
3096 }
3097
3098
3099
3100 /* Increase SIZE, MIN_SIZE and TIME for size and time needed to handle all
3101    calls in NODE.  POSSIBLE_TRUTHS, KNOWN_VALS, KNOWN_AGGS and KNOWN_CONTEXTS
3102    describe context of the call site.  */
3103
3104 static void
3105 estimate_calls_size_and_time (struct cgraph_node *node, int *size,
3106                               int *min_size, int *time,
3107                               inline_hints *hints,
3108                               clause_t possible_truths,
3109                               vec<tree> known_vals,
3110                               vec<ipa_polymorphic_call_context> known_contexts,
3111                               vec<ipa_agg_jump_function_p> known_aggs)
3112 {
3113   struct cgraph_edge *e;
3114   for (e = node->callees; e; e = e->next_callee)
3115     {
3116       if (inline_edge_summary_vec.length () <= (unsigned) e->uid)
3117         continue;
3118
3119       struct inline_edge_summary *es = inline_edge_summary (e);
3120
3121       /* Do not care about zero sized builtins.  */
3122       if (e->inline_failed && !es->call_stmt_size)
3123         {
3124           gcc_checking_assert (!es->call_stmt_time);
3125           continue;
3126         }
3127       if (!es->predicate
3128           || evaluate_predicate (es->predicate, possible_truths))
3129         {
3130           if (e->inline_failed)
3131             {
3132               /* Predicates of calls shall not use NOT_CHANGED codes,
3133                  sowe do not need to compute probabilities.  */
3134               estimate_edge_size_and_time (e, size,
3135                                            es->predicate ? NULL : min_size,
3136                                            time, REG_BR_PROB_BASE,
3137                                            known_vals, known_contexts,
3138                                            known_aggs, hints);
3139             }
3140           else
3141             estimate_calls_size_and_time (e->callee, size, min_size, time,
3142                                           hints,
3143                                           possible_truths,
3144                                           known_vals, known_contexts,
3145                                           known_aggs);
3146         }
3147     }
3148   for (e = node->indirect_calls; e; e = e->next_callee)
3149     {
3150       if (inline_edge_summary_vec.length () <= (unsigned) e->uid)
3151         continue;
3152
3153       struct inline_edge_summary *es = inline_edge_summary (e);
3154       if (!es->predicate
3155           || evaluate_predicate (es->predicate, possible_truths))
3156         estimate_edge_size_and_time (e, size,
3157                                      es->predicate ? NULL : min_size,
3158                                      time, REG_BR_PROB_BASE,
3159                                      known_vals, known_contexts, known_aggs,
3160                                      hints);
3161     }
3162 }
3163
3164
3165 /* Estimate size and time needed to execute NODE assuming
3166    POSSIBLE_TRUTHS clause, and KNOWN_VALS, KNOWN_AGGS and KNOWN_CONTEXTS
3167    information about NODE's arguments.  If non-NULL use also probability
3168    information present in INLINE_PARAM_SUMMARY vector.
3169    Additionally detemine hints determined by the context.  Finally compute
3170    minimal size needed for the call that is independent on the call context and
3171    can be used for fast estimates.  Return the values in RET_SIZE,
3172    RET_MIN_SIZE, RET_TIME and RET_HINTS.  */
3173
3174 static void
3175 estimate_node_size_and_time (struct cgraph_node *node,
3176                              clause_t possible_truths,
3177                              vec<tree> known_vals,
3178                              vec<ipa_polymorphic_call_context> known_contexts,
3179                              vec<ipa_agg_jump_function_p> known_aggs,
3180                              int *ret_size, int *ret_min_size, int *ret_time,
3181                              inline_hints *ret_hints,
3182                              vec<inline_param_summary>
3183                              inline_param_summary)
3184 {
3185   struct inline_summary *info = inline_summaries->get (node);
3186   size_time_entry *e;
3187   int size = 0;
3188   int time = 0;
3189   int min_size = 0;
3190   inline_hints hints = 0;
3191   int i;
3192
3193   if (dump_file && (dump_flags & TDF_DETAILS))
3194     {
3195       bool found = false;
3196       fprintf (dump_file, "   Estimating body: %s/%i\n"
3197                "   Known to be false: ", node->name (),
3198                node->order);
3199
3200       for (i = predicate_not_inlined_condition;
3201            i < (predicate_first_dynamic_condition
3202                 + (int) vec_safe_length (info->conds)); i++)
3203         if (!(possible_truths & (1 << i)))
3204           {
3205             if (found)
3206               fprintf (dump_file, ", ");
3207             found = true;
3208             dump_condition (dump_file, info->conds, i);
3209           }
3210     }
3211
3212   for (i = 0; vec_safe_iterate (info->entry, i, &e); i++)
3213     if (evaluate_predicate (&e->predicate, possible_truths))
3214       {
3215         size += e->size;
3216         gcc_checking_assert (e->time >= 0);
3217         gcc_checking_assert (time >= 0);
3218         if (!inline_param_summary.exists ())
3219           time += e->time;
3220         else
3221           {
3222             int prob = predicate_probability (info->conds,
3223                                               &e->predicate,
3224                                               possible_truths,
3225                                               inline_param_summary);
3226             gcc_checking_assert (prob >= 0);
3227             gcc_checking_assert (prob <= REG_BR_PROB_BASE);
3228             time += apply_probability ((gcov_type) e->time, prob);
3229           }
3230         if (time > MAX_TIME * INLINE_TIME_SCALE)
3231           time = MAX_TIME * INLINE_TIME_SCALE;
3232         gcc_checking_assert (time >= 0);
3233
3234       }
3235   gcc_checking_assert (true_predicate_p (&(*info->entry)[0].predicate));
3236   min_size = (*info->entry)[0].size;
3237   gcc_checking_assert (size >= 0);
3238   gcc_checking_assert (time >= 0);
3239
3240   if (info->loop_iterations
3241       && !evaluate_predicate (info->loop_iterations, possible_truths))
3242     hints |= INLINE_HINT_loop_iterations;
3243   if (info->loop_stride
3244       && !evaluate_predicate (info->loop_stride, possible_truths))
3245     hints |= INLINE_HINT_loop_stride;
3246   if (info->array_index
3247       && !evaluate_predicate (info->array_index, possible_truths))
3248     hints |= INLINE_HINT_array_index;
3249   if (info->scc_no)
3250     hints |= INLINE_HINT_in_scc;
3251   if (DECL_DECLARED_INLINE_P (node->decl))
3252     hints |= INLINE_HINT_declared_inline;
3253
3254   estimate_calls_size_and_time (node, &size, &min_size, &time, &hints, possible_truths,
3255                                 known_vals, known_contexts, known_aggs);
3256   gcc_checking_assert (size >= 0);
3257   gcc_checking_assert (time >= 0);
3258   time = RDIV (time, INLINE_TIME_SCALE);
3259   size = RDIV (size, INLINE_SIZE_SCALE);
3260   min_size = RDIV (min_size, INLINE_SIZE_SCALE);
3261
3262   if (dump_file && (dump_flags & TDF_DETAILS))
3263     fprintf (dump_file, "\n   size:%i time:%i\n", (int) size, (int) time);
3264   if (ret_time)
3265     *ret_time = time;
3266   if (ret_size)
3267     *ret_size = size;
3268   if (ret_min_size)
3269     *ret_min_size = min_size;
3270   if (ret_hints)
3271     *ret_hints = hints;
3272   return;
3273 }
3274
3275
3276 /* Estimate size and time needed to execute callee of EDGE assuming that
3277    parameters known to be constant at caller of EDGE are propagated.
3278    KNOWN_VALS and KNOWN_CONTEXTS are vectors of assumed known constant values
3279    and types for parameters.  */
3280
3281 void
3282 estimate_ipcp_clone_size_and_time (struct cgraph_node *node,
3283                                    vec<tree> known_vals,
3284                                    vec<ipa_polymorphic_call_context>
3285                                    known_contexts,
3286                                    vec<ipa_agg_jump_function_p> known_aggs,
3287                                    int *ret_size, int *ret_time,
3288                                    inline_hints *hints)
3289 {
3290   clause_t clause;
3291
3292   clause = evaluate_conditions_for_known_args (node, false, known_vals,
3293                                                known_aggs);
3294   estimate_node_size_and_time (node, clause, known_vals, known_contexts,
3295                                known_aggs, ret_size, NULL, ret_time, hints, vNULL);
3296 }
3297
3298 /* Translate all conditions from callee representation into caller
3299    representation and symbolically evaluate predicate P into new predicate.
3300
3301    INFO is inline_summary of function we are adding predicate into, CALLEE_INFO
3302    is summary of function predicate P is from. OPERAND_MAP is array giving
3303    callee formal IDs the caller formal IDs. POSSSIBLE_TRUTHS is clausule of all
3304    callee conditions that may be true in caller context.  TOPLEV_PREDICATE is
3305    predicate under which callee is executed.  OFFSET_MAP is an array of of
3306    offsets that need to be added to conditions, negative offset means that
3307    conditions relying on values passed by reference have to be discarded
3308    because they might not be preserved (and should be considered offset zero
3309    for other purposes).  */
3310
3311 static struct predicate
3312 remap_predicate (struct inline_summary *info,
3313                  struct inline_summary *callee_info,
3314                  struct predicate *p,
3315                  vec<int> operand_map,
3316                  vec<int> offset_map,
3317                  clause_t possible_truths, struct predicate *toplev_predicate)
3318 {
3319   int i;
3320   struct predicate out = true_predicate ();
3321
3322   /* True predicate is easy.  */
3323   if (true_predicate_p (p))
3324     return *toplev_predicate;
3325   for (i = 0; p->clause[i]; i++)
3326     {
3327       clause_t clause = p->clause[i];
3328       int cond;
3329       struct predicate clause_predicate = false_predicate ();
3330
3331       gcc_assert (i < MAX_CLAUSES);
3332
3333       for (cond = 0; cond < NUM_CONDITIONS; cond++)
3334         /* Do we have condition we can't disprove?   */
3335         if (clause & possible_truths & (1 << cond))
3336           {
3337             struct predicate cond_predicate;
3338             /* Work out if the condition can translate to predicate in the
3339                inlined function.  */
3340             if (cond >= predicate_first_dynamic_condition)
3341               {
3342                 struct condition *c;
3343
3344                 c = &(*callee_info->conds)[cond
3345                                            -
3346                                            predicate_first_dynamic_condition];
3347                 /* See if we can remap condition operand to caller's operand.
3348                    Otherwise give up.  */
3349                 if (!operand_map.exists ()
3350                     || (int) operand_map.length () <= c->operand_num
3351                     || operand_map[c->operand_num] == -1
3352                     /* TODO: For non-aggregate conditions, adding an offset is
3353                        basically an arithmetic jump function processing which
3354                        we should support in future.  */
3355                     || ((!c->agg_contents || !c->by_ref)
3356                         && offset_map[c->operand_num] > 0)
3357                     || (c->agg_contents && c->by_ref
3358                         && offset_map[c->operand_num] < 0))
3359                   cond_predicate = true_predicate ();
3360                 else
3361                   {
3362                     struct agg_position_info ap;
3363                     HOST_WIDE_INT offset_delta = offset_map[c->operand_num];
3364                     if (offset_delta < 0)
3365                       {
3366                         gcc_checking_assert (!c->agg_contents || !c->by_ref);
3367                         offset_delta = 0;
3368                       }
3369                     gcc_assert (!c->agg_contents
3370                                 || c->by_ref || offset_delta == 0);
3371                     ap.offset = c->offset + offset_delta;
3372                     ap.agg_contents = c->agg_contents;
3373                     ap.by_ref = c->by_ref;
3374                     cond_predicate = add_condition (info,
3375                                                     operand_map[c->operand_num],
3376                                                     &ap, c->code, c->val);
3377                   }
3378               }
3379             /* Fixed conditions remains same, construct single
3380                condition predicate.  */
3381             else
3382               {
3383                 cond_predicate.clause[0] = 1 << cond;
3384                 cond_predicate.clause[1] = 0;
3385               }
3386             clause_predicate = or_predicates (info->conds, &clause_predicate,
3387                                               &cond_predicate);
3388           }
3389       out = and_predicates (info->conds, &out, &clause_predicate);
3390     }
3391   return and_predicates (info->conds, &out, toplev_predicate);
3392 }
3393
3394
3395 /* Update summary information of inline clones after inlining.
3396    Compute peak stack usage.  */
3397
3398 static void
3399 inline_update_callee_summaries (struct cgraph_node *node, int depth)
3400 {
3401   struct cgraph_edge *e;
3402   struct inline_summary *callee_info = inline_summaries->get (node);
3403   struct inline_summary *caller_info = inline_summaries->get (node->callers->caller);
3404   HOST_WIDE_INT peak;
3405
3406   callee_info->stack_frame_offset
3407     = caller_info->stack_frame_offset
3408     + caller_info->estimated_self_stack_size;
3409   peak = callee_info->stack_frame_offset
3410     + callee_info->estimated_self_stack_size;
3411   if (inline_summaries->get (node->global.inlined_to)->estimated_stack_size < peak)
3412       inline_summaries->get (node->global.inlined_to)->estimated_stack_size = peak;
3413   ipa_propagate_frequency (node);
3414   for (e = node->callees; e; e = e->next_callee)
3415     {
3416       if (!e->inline_failed)
3417         inline_update_callee_summaries (e->callee, depth);
3418       inline_edge_summary (e)->loop_depth += depth;
3419     }
3420   for (e = node->indirect_calls; e; e = e->next_callee)
3421     inline_edge_summary (e)->loop_depth += depth;
3422 }
3423
3424 /* Update change_prob of EDGE after INLINED_EDGE has been inlined.
3425    When functoin A is inlined in B and A calls C with parameter that
3426    changes with probability PROB1 and C is known to be passthroug
3427    of argument if B that change with probability PROB2, the probability
3428    of change is now PROB1*PROB2.  */
3429
3430 static void
3431 remap_edge_change_prob (struct cgraph_edge *inlined_edge,
3432                         struct cgraph_edge *edge)
3433 {
3434   if (ipa_node_params_sum)
3435     {
3436       int i;
3437       struct ipa_edge_args *args = IPA_EDGE_REF (edge);
3438       struct inline_edge_summary *es = inline_edge_summary (edge);
3439       struct inline_edge_summary *inlined_es
3440         = inline_edge_summary (inlined_edge);
3441
3442       for (i = 0; i < ipa_get_cs_argument_count (args); i++)
3443         {
3444           struct ipa_jump_func *jfunc = ipa_get_ith_jump_func (args, i);
3445           if (jfunc->type == IPA_JF_PASS_THROUGH
3446               && (ipa_get_jf_pass_through_formal_id (jfunc)
3447                   < (int) inlined_es->param.length ()))
3448             {
3449               int jf_formal_id = ipa_get_jf_pass_through_formal_id (jfunc);
3450               int prob1 = es->param[i].change_prob;
3451               int prob2 = inlined_es->param[jf_formal_id].change_prob;
3452               int prob = combine_probabilities (prob1, prob2);
3453
3454               if (prob1 && prob2 && !prob)
3455                 prob = 1;
3456
3457               es->param[i].change_prob = prob;
3458             }
3459         }
3460     }
3461 }
3462
3463 /* Update edge summaries of NODE after INLINED_EDGE has been inlined.
3464
3465    Remap predicates of callees of NODE.  Rest of arguments match
3466    remap_predicate.
3467
3468    Also update change probabilities.  */
3469
3470 static void
3471 remap_edge_summaries (struct cgraph_edge *inlined_edge,
3472                       struct cgraph_node *node,
3473                       struct inline_summary *info,
3474                       struct inline_summary *callee_info,
3475                       vec<int> operand_map,
3476                       vec<int> offset_map,
3477                       clause_t possible_truths,
3478                       struct predicate *toplev_predicate)
3479 {
3480   struct cgraph_edge *e, *next;
3481   for (e = node->callees; e; e = next)
3482     {
3483       struct inline_edge_summary *es = inline_edge_summary (e);
3484       struct predicate p;
3485       next = e->next_callee;
3486
3487       if (e->inline_failed)
3488         {
3489           remap_edge_change_prob (inlined_edge, e);
3490
3491           if (es->predicate)
3492             {
3493               p = remap_predicate (info, callee_info,
3494                                    es->predicate, operand_map, offset_map,
3495                                    possible_truths, toplev_predicate);
3496               edge_set_predicate (e, &p);
3497             }
3498           else
3499             edge_set_predicate (e, toplev_predicate);
3500         }
3501       else
3502         remap_edge_summaries (inlined_edge, e->callee, info, callee_info,
3503                               operand_map, offset_map, possible_truths,
3504                               toplev_predicate);
3505     }
3506   for (e = node->indirect_calls; e; e = next)
3507     {
3508       struct inline_edge_summary *es = inline_edge_summary (e);
3509       struct predicate p;
3510       next = e->next_callee;
3511
3512       remap_edge_change_prob (inlined_edge, e);
3513       if (es->predicate)
3514         {
3515           p = remap_predicate (info, callee_info,
3516                                es->predicate, operand_map, offset_map,
3517                                possible_truths, toplev_predicate);
3518           edge_set_predicate (e, &p);
3519         }
3520       else
3521         edge_set_predicate (e, toplev_predicate);
3522     }
3523 }
3524
3525 /* Same as remap_predicate, but set result into hint *HINT.  */
3526
3527 static void
3528 remap_hint_predicate (struct inline_summary *info,
3529                       struct inline_summary *callee_info,
3530                       struct predicate **hint,
3531                       vec<int> operand_map,
3532                       vec<int> offset_map,
3533                       clause_t possible_truths,
3534                       struct predicate *toplev_predicate)
3535 {
3536   predicate p;
3537
3538   if (!*hint)
3539     return;
3540   p = remap_predicate (info, callee_info,
3541                        *hint,
3542                        operand_map, offset_map,
3543                        possible_truths, toplev_predicate);
3544   if (!false_predicate_p (&p) && !true_predicate_p (&p))
3545     {
3546       if (!*hint)
3547         set_hint_predicate (hint, p);
3548       else
3549         **hint = and_predicates (info->conds, *hint, &p);
3550     }
3551 }
3552
3553 /* We inlined EDGE.  Update summary of the function we inlined into.  */
3554
3555 void
3556 inline_merge_summary (struct cgraph_edge *edge)
3557 {
3558   struct inline_summary *callee_info = inline_summaries->get (edge->callee);
3559   struct cgraph_node *to = (edge->caller->global.inlined_to
3560                             ? edge->caller->global.inlined_to : edge->caller);
3561   struct inline_summary *info = inline_summaries->get (to);
3562   clause_t clause = 0;          /* not_inline is known to be false.  */
3563   size_time_entry *e;
3564   vec<int> operand_map = vNULL;
3565   vec<int> offset_map = vNULL;
3566   int i;
3567   struct predicate toplev_predicate;
3568   struct predicate true_p = true_predicate ();
3569   struct inline_edge_summary *es = inline_edge_summary (edge);
3570
3571   if (es->predicate)
3572     toplev_predicate = *es->predicate;
3573   else
3574     toplev_predicate = true_predicate ();
3575
3576   if (callee_info->conds)
3577     evaluate_properties_for_edge (edge, true, &clause, NULL, NULL, NULL);
3578   if (ipa_node_params_sum && callee_info->conds)
3579     {
3580       struct ipa_edge_args *args = IPA_EDGE_REF (edge);
3581       int count = ipa_get_cs_argument_count (args);
3582       int i;
3583
3584       if (count)
3585         {
3586           operand_map.safe_grow_cleared (count);
3587           offset_map.safe_grow_cleared (count);
3588         }
3589       for (i = 0; i < count; i++)
3590         {
3591           struct ipa_jump_func *jfunc = ipa_get_ith_jump_func (args, i);
3592           int map = -1;
3593
3594           /* TODO: handle non-NOPs when merging.  */
3595           if (jfunc->type == IPA_JF_PASS_THROUGH)
3596             {
3597               if (ipa_get_jf_pass_through_operation (jfunc) == NOP_EXPR)
3598                 map = ipa_get_jf_pass_through_formal_id (jfunc);
3599               if (!ipa_get_jf_pass_through_agg_preserved (jfunc))
3600                 offset_map[i] = -1;
3601             }
3602           else if (jfunc->type == IPA_JF_ANCESTOR)
3603             {
3604               HOST_WIDE_INT offset = ipa_get_jf_ancestor_offset (jfunc);
3605               if (offset >= 0 && offset < INT_MAX)
3606                 {
3607                   map = ipa_get_jf_ancestor_formal_id (jfunc);
3608                   if (!ipa_get_jf_ancestor_agg_preserved (jfunc))
3609                     offset = -1;
3610                   offset_map[i] = offset;
3611                 }
3612             }
3613           operand_map[i] = map;
3614           gcc_assert (map < ipa_get_param_count (IPA_NODE_REF (to)));
3615         }
3616     }
3617   for (i = 0; vec_safe_iterate (callee_info->entry, i, &e); i++)
3618     {
3619       struct predicate p = remap_predicate (info, callee_info,
3620                                             &e->predicate, operand_map,
3621                                             offset_map, clause,
3622                                             &toplev_predicate);
3623       if (!false_predicate_p (&p))
3624         {
3625           gcov_type add_time = ((gcov_type) e->time * edge->frequency
3626                                 + CGRAPH_FREQ_BASE / 2) / CGRAPH_FREQ_BASE;
3627           int prob = predicate_probability (callee_info->conds,
3628                                             &e->predicate,
3629                                             clause, es->param);
3630           add_time = apply_probability ((gcov_type) add_time, prob);
3631           if (add_time > MAX_TIME * INLINE_TIME_SCALE)
3632             add_time = MAX_TIME * INLINE_TIME_SCALE;
3633           if (prob != REG_BR_PROB_BASE
3634               && dump_file && (dump_flags & TDF_DETAILS))
3635             {
3636               fprintf (dump_file, "\t\tScaling time by probability:%f\n",
3637                        (double) prob / REG_BR_PROB_BASE);
3638             }
3639           account_size_time (info, e->size, add_time, &p);
3640         }
3641     }
3642   remap_edge_summaries (edge, edge->callee, info, callee_info, operand_map,
3643                         offset_map, clause, &toplev_predicate);
3644   remap_hint_predicate (info, callee_info,
3645                         &callee_info->loop_iterations,
3646                         operand_map, offset_map, clause, &toplev_predicate);
3647   remap_hint_predicate (info, callee_info,
3648                         &callee_info->loop_stride,
3649                         operand_map, offset_map, clause, &toplev_predicate);
3650   remap_hint_predicate (info, callee_info,
3651                         &callee_info->array_index,
3652                         operand_map, offset_map, clause, &toplev_predicate);
3653
3654   inline_update_callee_summaries (edge->callee,
3655                                   inline_edge_summary (edge)->loop_depth);
3656
3657   /* We do not maintain predicates of inlined edges, free it.  */
3658   edge_set_predicate (edge, &true_p);
3659   /* Similarly remove param summaries.  */
3660   es->param.release ();
3661   operand_map.release ();
3662   offset_map.release ();
3663 }
3664
3665 /* For performance reasons inline_merge_summary is not updating overall size
3666    and time.  Recompute it.  */
3667
3668 void
3669 inline_update_overall_summary (struct cgraph_node *node)
3670 {
3671   struct inline_summary *info = inline_summaries->get (node);
3672   size_time_entry *e;
3673   int i;
3674
3675   info->size = 0;
3676   info->time = 0;
3677   for (i = 0; vec_safe_iterate (info->entry, i, &e); i++)
3678     {
3679       info->size += e->size, info->time += e->time;
3680       if (info->time > MAX_TIME * INLINE_TIME_SCALE)
3681         info->time = MAX_TIME * INLINE_TIME_SCALE;
3682     }
3683   estimate_calls_size_and_time (node, &info->size, &info->min_size,
3684                                 &info->time, NULL,
3685                                 ~(clause_t) (1 << predicate_false_condition),
3686                                 vNULL, vNULL, vNULL);
3687   info->time = (info->time + INLINE_TIME_SCALE / 2) / INLINE_TIME_SCALE;
3688   info->size = (info->size + INLINE_SIZE_SCALE / 2) / INLINE_SIZE_SCALE;
3689 }
3690
3691 /* Return hints derrived from EDGE.   */
3692 int
3693 simple_edge_hints (struct cgraph_edge *edge)
3694 {
3695   int hints = 0;
3696   struct cgraph_node *to = (edge->caller->global.inlined_to
3697                             ? edge->caller->global.inlined_to : edge->caller);
3698   struct cgraph_node *callee = edge->callee->ultimate_alias_target ();
3699   if (inline_summaries->get (to)->scc_no
3700       && inline_summaries->get (to)->scc_no
3701          == inline_summaries->get (callee)->scc_no
3702       && !edge->recursive_p ())
3703     hints |= INLINE_HINT_same_scc;
3704
3705   if (callee->lto_file_data && edge->caller->lto_file_data
3706       && edge->caller->lto_file_data != callee->lto_file_data
3707       && !callee->merged)
3708     hints |= INLINE_HINT_cross_module;
3709
3710   return hints;
3711 }
3712
3713 /* Estimate the time cost for the caller when inlining EDGE.
3714    Only to be called via estimate_edge_time, that handles the
3715    caching mechanism.
3716
3717    When caching, also update the cache entry.  Compute both time and
3718    size, since we always need both metrics eventually.  */
3719
3720 int
3721 do_estimate_edge_time (struct cgraph_edge *edge)
3722 {
3723   int time;
3724   int size;
3725   inline_hints hints;
3726   struct cgraph_node *callee;
3727   clause_t clause;
3728   vec<tree> known_vals;
3729   vec<ipa_polymorphic_call_context> known_contexts;
3730   vec<ipa_agg_jump_function_p> known_aggs;
3731   struct inline_edge_summary *es = inline_edge_summary (edge);
3732   int min_size;
3733
3734   callee = edge->callee->ultimate_alias_target ();
3735
3736   gcc_checking_assert (edge->inline_failed);
3737   evaluate_properties_for_edge (edge, true,
3738                                 &clause, &known_vals, &known_contexts,
3739                                 &known_aggs);
3740   estimate_node_size_and_time (callee, clause, known_vals, known_contexts,
3741                                known_aggs, &size, &min_size, &time, &hints, es->param);
3742
3743   /* When we have profile feedback, we can quite safely identify hot
3744      edges and for those we disable size limits.  Don't do that when
3745      probability that caller will call the callee is low however, since it
3746      may hurt optimization of the caller's hot path.  */
3747   if (edge->count && edge->maybe_hot_p ()
3748       && (edge->count * 2
3749           > (edge->caller->global.inlined_to
3750              ? edge->caller->global.inlined_to->count : edge->caller->count)))
3751     hints |= INLINE_HINT_known_hot;
3752
3753   known_vals.release ();
3754   known_contexts.release ();
3755   known_aggs.release ();
3756   gcc_checking_assert (size >= 0);
3757   gcc_checking_assert (time >= 0);
3758
3759   /* When caching, update the cache entry.  */
3760   if (edge_growth_cache.exists ())
3761     {
3762       inline_summaries->get (edge->callee)->min_size = min_size;
3763       if ((int) edge_growth_cache.length () <= edge->uid)
3764         edge_growth_cache.safe_grow_cleared (symtab->edges_max_uid);
3765       edge_growth_cache[edge->uid].time = time + (time >= 0);
3766
3767       edge_growth_cache[edge->uid].size = size + (size >= 0);
3768       hints |= simple_edge_hints (edge);
3769       edge_growth_cache[edge->uid].hints = hints + 1;
3770     }
3771   return time;
3772 }
3773
3774
3775 /* Return estimated callee growth after inlining EDGE.
3776    Only to be called via estimate_edge_size.  */
3777
3778 int
3779 do_estimate_edge_size (struct cgraph_edge *edge)
3780 {
3781   int size;
3782   struct cgraph_node *callee;
3783   clause_t clause;
3784   vec<tree> known_vals;
3785   vec<ipa_polymorphic_call_context> known_contexts;
3786   vec<ipa_agg_jump_function_p> known_aggs;
3787
3788   /* When we do caching, use do_estimate_edge_time to populate the entry.  */
3789
3790   if (edge_growth_cache.exists ())
3791     {
3792       do_estimate_edge_time (edge);
3793       size = edge_growth_cache[edge->uid].size;
3794       gcc_checking_assert (size);
3795       return size - (size > 0);
3796     }
3797
3798   callee = edge->callee->ultimate_alias_target ();
3799
3800   /* Early inliner runs without caching, go ahead and do the dirty work.  */
3801   gcc_checking_assert (edge->inline_failed);
3802   evaluate_properties_for_edge (edge, true,
3803                                 &clause, &known_vals, &known_contexts,
3804                                 &known_aggs);
3805   estimate_node_size_and_time (callee, clause, known_vals, known_contexts,
3806                                known_aggs, &size, NULL, NULL, NULL, vNULL);
3807   known_vals.release ();
3808   known_contexts.release ();
3809   known_aggs.release ();
3810   return size;
3811 }
3812
3813
3814 /* Estimate the growth of the caller when inlining EDGE.
3815    Only to be called via estimate_edge_size.  */
3816
3817 inline_hints
3818 do_estimate_edge_hints (struct cgraph_edge *edge)
3819 {
3820   inline_hints hints;
3821   struct cgraph_node *callee;
3822   clause_t clause;
3823   vec<tree> known_vals;
3824   vec<ipa_polymorphic_call_context> known_contexts;
3825   vec<ipa_agg_jump_function_p> known_aggs;
3826
3827   /* When we do caching, use do_estimate_edge_time to populate the entry.  */
3828
3829   if (edge_growth_cache.exists ())
3830     {
3831       do_estimate_edge_time (edge);
3832       hints = edge_growth_cache[edge->uid].hints;
3833       gcc_checking_assert (hints);
3834       return hints - 1;
3835     }
3836
3837   callee = edge->callee->ultimate_alias_target ();
3838
3839   /* Early inliner runs without caching, go ahead and do the dirty work.  */
3840   gcc_checking_assert (edge->inline_failed);
3841   evaluate_properties_for_edge (edge, true,
3842                                 &clause, &known_vals, &known_contexts,
3843                                 &known_aggs);
3844   estimate_node_size_and_time (callee, clause, known_vals, known_contexts,
3845                                known_aggs, NULL, NULL, NULL, &hints, vNULL);
3846   known_vals.release ();
3847   known_contexts.release ();
3848   known_aggs.release ();
3849   hints |= simple_edge_hints (edge);
3850   return hints;
3851 }
3852
3853
3854 /* Estimate self time of the function NODE after inlining EDGE.  */
3855
3856 int
3857 estimate_time_after_inlining (struct cgraph_node *node,
3858                               struct cgraph_edge *edge)
3859 {
3860   struct inline_edge_summary *es = inline_edge_summary (edge);
3861   if (!es->predicate || !false_predicate_p (es->predicate))
3862     {
3863       gcov_type time =
3864         inline_summaries->get (node)->time + estimate_edge_time (edge);
3865       if (time < 0)
3866         time = 0;
3867       if (time > MAX_TIME)
3868         time = MAX_TIME;
3869       return time;
3870     }
3871   return inline_summaries->get (node)->time;
3872 }
3873
3874
3875 /* Estimate the size of NODE after inlining EDGE which should be an
3876    edge to either NODE or a call inlined into NODE.  */
3877
3878 int
3879 estimate_size_after_inlining (struct cgraph_node *node,
3880                               struct cgraph_edge *edge)
3881 {
3882   struct inline_edge_summary *es = inline_edge_summary (edge);
3883   if (!es->predicate || !false_predicate_p (es->predicate))
3884     {
3885       int size = inline_summaries->get (node)->size + estimate_edge_growth (edge);
3886       gcc_assert (size >= 0);
3887       return size;
3888     }
3889   return inline_summaries->get (node)->size;
3890 }
3891
3892
3893 struct growth_data
3894 {
3895   struct cgraph_node *node;
3896   bool self_recursive;
3897   bool uninlinable;
3898   int growth;
3899 };
3900
3901
3902 /* Worker for do_estimate_growth.  Collect growth for all callers.  */
3903
3904 static bool
3905 do_estimate_growth_1 (struct cgraph_node *node, void *data)
3906 {
3907   struct cgraph_edge *e;
3908   struct growth_data *d = (struct growth_data *) data;
3909
3910   for (e = node->callers; e; e = e->next_caller)
3911     {
3912       gcc_checking_assert (e->inline_failed);
3913
3914       if (cgraph_inline_failed_type (e->inline_failed) == CIF_FINAL_ERROR)
3915         {
3916           d->uninlinable = true;
3917           continue;
3918         }
3919
3920       if (e->recursive_p ())
3921         {
3922           d->self_recursive = true;
3923           continue;
3924         }
3925       d->growth += estimate_edge_growth (e);
3926     }
3927   return false;
3928 }
3929
3930
3931 /* Estimate the growth caused by inlining NODE into all callees.  */
3932
3933 int
3934 estimate_growth (struct cgraph_node *node)
3935 {
3936   struct growth_data d = { node, false, false, 0 };
3937   struct inline_summary *info = inline_summaries->get (node);
3938
3939   node->call_for_symbol_and_aliases (do_estimate_growth_1, &d, true);
3940
3941   /* For self recursive functions the growth estimation really should be
3942      infinity.  We don't want to return very large values because the growth
3943      plays various roles in badness computation fractions.  Be sure to not
3944      return zero or negative growths. */
3945   if (d.self_recursive)
3946     d.growth = d.growth < info->size ? info->size : d.growth;
3947   else if (DECL_EXTERNAL (node->decl) || d.uninlinable)
3948     ;
3949   else
3950     {
3951       if (node->will_be_removed_from_program_if_no_direct_calls_p ())
3952         d.growth -= info->size;
3953       /* COMDAT functions are very often not shared across multiple units
3954          since they come from various template instantiations.
3955          Take this into account.  */
3956       else if (DECL_COMDAT (node->decl)
3957                && node->can_remove_if_no_direct_calls_p ())
3958         d.growth -= (info->size
3959                      * (100 - PARAM_VALUE (PARAM_COMDAT_SHARING_PROBABILITY))
3960                      + 50) / 100;
3961     }
3962
3963   return d.growth;
3964 }
3965
3966 /* Verify if there are fewer than MAX_CALLERS.  */
3967
3968 static bool
3969 check_callers (cgraph_node *node, int *max_callers)
3970 {
3971   ipa_ref *ref;
3972
3973   if (!node->can_remove_if_no_direct_calls_and_refs_p ())
3974     return true;
3975
3976   for (cgraph_edge *e = node->callers; e; e = e->next_caller)
3977     {
3978       (*max_callers)--;
3979       if (!*max_callers
3980           || cgraph_inline_failed_type (e->inline_failed) == CIF_FINAL_ERROR)
3981         return true;
3982     }
3983
3984   FOR_EACH_ALIAS (node, ref)
3985     if (check_callers (dyn_cast <cgraph_node *> (ref->referring), max_callers))
3986       return true;
3987
3988   return false;
3989 }
3990
3991
3992 /* Make cheap estimation if growth of NODE is likely positive knowing
3993    EDGE_GROWTH of one particular edge.
3994    We assume that most of other edges will have similar growth
3995    and skip computation if there are too many callers.  */
3996
3997 bool
3998 growth_likely_positive (struct cgraph_node *node,
3999                         int edge_growth)
4000 {
4001   int max_callers;
4002   struct cgraph_edge *e;
4003   gcc_checking_assert (edge_growth > 0);
4004
4005   /* First quickly check if NODE is removable at all.  */
4006   if (DECL_EXTERNAL (node->decl))
4007     return true;
4008   if (!node->can_remove_if_no_direct_calls_and_refs_p ()
4009       || node->address_taken)
4010     return true;
4011
4012   max_callers = inline_summaries->get (node)->size * 4 / edge_growth + 2;
4013
4014   for (e = node->callers; e; e = e->next_caller)
4015     {
4016       max_callers--;
4017       if (!max_callers
4018           || cgraph_inline_failed_type (e->inline_failed) == CIF_FINAL_ERROR)
4019         return true;
4020     }
4021
4022   ipa_ref *ref;
4023   FOR_EACH_ALIAS (node, ref)
4024     if (check_callers (dyn_cast <cgraph_node *> (ref->referring), &max_callers))
4025       return true;
4026
4027   /* Unlike for functions called once, we play unsafe with
4028      COMDATs.  We can allow that since we know functions
4029      in consideration are small (and thus risk is small) and
4030      moreover grow estimates already accounts that COMDAT
4031      functions may or may not disappear when eliminated from
4032      current unit. With good probability making aggressive
4033      choice in all units is going to make overall program
4034      smaller.  */
4035   if (DECL_COMDAT (node->decl))
4036     {
4037       if (!node->can_remove_if_no_direct_calls_p ())
4038         return true;
4039     }
4040   else if (!node->will_be_removed_from_program_if_no_direct_calls_p ())
4041     return true;
4042
4043   return estimate_growth (node) > 0;
4044 }
4045
4046
4047 /* This function performs intraprocedural analysis in NODE that is required to
4048    inline indirect calls.  */
4049
4050 static void
4051 inline_indirect_intraprocedural_analysis (struct cgraph_node *node)
4052 {
4053   ipa_analyze_node (node);
4054   if (dump_file && (dump_flags & TDF_DETAILS))
4055     {
4056       ipa_print_node_params (dump_file, node);
4057       ipa_print_node_jump_functions (dump_file, node);
4058     }
4059 }
4060
4061
4062 /* Note function body size.  */
4063
4064 void
4065 inline_analyze_function (struct cgraph_node *node)
4066 {
4067   push_cfun (DECL_STRUCT_FUNCTION (node->decl));
4068
4069   if (dump_file)
4070     fprintf (dump_file, "\nAnalyzing function: %s/%u\n",
4071              node->name (), node->order);
4072   if (opt_for_fn (node->decl, optimize) && !node->thunk.thunk_p)
4073     inline_indirect_intraprocedural_analysis (node);
4074   compute_inline_parameters (node, false);
4075   if (!optimize)
4076     {
4077       struct cgraph_edge *e;
4078       for (e = node->callees; e; e = e->next_callee)
4079         {
4080           if (e->inline_failed == CIF_FUNCTION_NOT_CONSIDERED)
4081             e->inline_failed = CIF_FUNCTION_NOT_OPTIMIZED;
4082           e->call_stmt_cannot_inline_p = true;
4083         }
4084       for (e = node->indirect_calls; e; e = e->next_callee)
4085         {
4086           if (e->inline_failed == CIF_FUNCTION_NOT_CONSIDERED)
4087             e->inline_failed = CIF_FUNCTION_NOT_OPTIMIZED;
4088           e->call_stmt_cannot_inline_p = true;
4089         }
4090     }
4091
4092   pop_cfun ();
4093 }
4094
4095
4096 /* Called when new function is inserted to callgraph late.  */
4097
4098 void
4099 inline_summary_t::insert (struct cgraph_node *node, inline_summary *)
4100 {
4101   inline_analyze_function (node);
4102 }
4103
4104 /* Note function body size.  */
4105
4106 void
4107 inline_generate_summary (void)
4108 {
4109   struct cgraph_node *node;
4110
4111   FOR_EACH_DEFINED_FUNCTION (node)
4112     if (DECL_STRUCT_FUNCTION (node->decl))
4113       node->local.versionable = tree_versionable_function_p (node->decl);
4114
4115   /* When not optimizing, do not bother to analyze.  Inlining is still done
4116      because edge redirection needs to happen there.  */
4117   if (!optimize && !flag_generate_lto && !flag_generate_offload && !flag_wpa)
4118     return;
4119
4120   if (!inline_summaries)
4121     inline_summaries = (inline_summary_t*) inline_summary_t::create_ggc (symtab);
4122
4123   inline_summaries->enable_insertion_hook ();
4124
4125   ipa_register_cgraph_hooks ();
4126   inline_free_summary ();
4127
4128   FOR_EACH_DEFINED_FUNCTION (node)
4129     if (!node->alias)
4130       inline_analyze_function (node);
4131 }
4132
4133
4134 /* Read predicate from IB.  */
4135
4136 static struct predicate
4137 read_predicate (struct lto_input_block *ib)
4138 {
4139   struct predicate out;
4140   clause_t clause;
4141   int k = 0;
4142
4143   do
4144     {
4145       gcc_assert (k <= MAX_CLAUSES);
4146       clause = out.clause[k++] = streamer_read_uhwi (ib);
4147     }
4148   while (clause);
4149
4150   /* Zero-initialize the remaining clauses in OUT.  */
4151   while (k <= MAX_CLAUSES)
4152     out.clause[k++] = 0;
4153
4154   return out;
4155 }
4156
4157
4158 /* Write inline summary for edge E to OB.  */
4159
4160 static void
4161 read_inline_edge_summary (struct lto_input_block *ib, struct cgraph_edge *e)
4162 {
4163   struct inline_edge_summary *es = inline_edge_summary (e);
4164   struct predicate p;
4165   int length, i;
4166
4167   es->call_stmt_size = streamer_read_uhwi (ib);
4168   es->call_stmt_time = streamer_read_uhwi (ib);
4169   es->loop_depth = streamer_read_uhwi (ib);
4170   p = read_predicate (ib);
4171   edge_set_predicate (e, &p);
4172   length = streamer_read_uhwi (ib);
4173   if (length)
4174     {
4175       es->param.safe_grow_cleared (length);
4176       for (i = 0; i < length; i++)
4177         es->param[i].change_prob = streamer_read_uhwi (ib);
4178     }
4179 }
4180
4181
4182 /* Stream in inline summaries from the section.  */
4183
4184 static void
4185 inline_read_section (struct lto_file_decl_data *file_data, const char *data,
4186                      size_t len)
4187 {
4188   const struct lto_function_header *header =
4189     (const struct lto_function_header *) data;
4190   const int cfg_offset = sizeof (struct lto_function_header);
4191   const int main_offset = cfg_offset + header->cfg_size;
4192   const int string_offset = main_offset + header->main_size;
4193   struct data_in *data_in;
4194   unsigned int i, count2, j;
4195   unsigned int f_count;
4196
4197   lto_input_block ib ((const char *) data + main_offset, header->main_size,
4198                       file_data->mode_table);
4199
4200   data_in =
4201     lto_data_in_create (file_data, (const char *) data + string_offset,
4202                         header->string_size, vNULL);
4203   f_count = streamer_read_uhwi (&ib);
4204   for (i = 0; i < f_count; i++)
4205     {
4206       unsigned int index;
4207       struct cgraph_node *node;
4208       struct inline_summary *info;
4209       lto_symtab_encoder_t encoder;
4210       struct bitpack_d bp;
4211       struct cgraph_edge *e;
4212       predicate p;
4213
4214       index = streamer_read_uhwi (&ib);
4215       encoder = file_data->symtab_node_encoder;
4216       node = dyn_cast<cgraph_node *> (lto_symtab_encoder_deref (encoder,
4217                                                                 index));
4218       info = inline_summaries->get (node);
4219
4220       info->estimated_stack_size
4221         = info->estimated_self_stack_size = streamer_read_uhwi (&ib);
4222       info->size = info->self_size = streamer_read_uhwi (&ib);
4223       info->time = info->self_time = streamer_read_uhwi (&ib);
4224
4225       bp = streamer_read_bitpack (&ib);
4226       info->inlinable = bp_unpack_value (&bp, 1);
4227       info->contains_cilk_spawn = bp_unpack_value (&bp, 1);
4228
4229       count2 = streamer_read_uhwi (&ib);
4230       gcc_assert (!info->conds);
4231       for (j = 0; j < count2; j++)
4232         {
4233           struct condition c;
4234           c.operand_num = streamer_read_uhwi (&ib);
4235           c.code = (enum tree_code) streamer_read_uhwi (&ib);
4236           c.val = stream_read_tree (&ib, data_in);
4237           bp = streamer_read_bitpack (&ib);
4238           c.agg_contents = bp_unpack_value (&bp, 1);
4239           c.by_ref = bp_unpack_value (&bp, 1);
4240           if (c.agg_contents)
4241             c.offset = streamer_read_uhwi (&ib);
4242           vec_safe_push (info->conds, c);
4243         }
4244       count2 = streamer_read_uhwi (&ib);
4245       gcc_assert (!info->entry);
4246       for (j = 0; j < count2; j++)
4247         {
4248           struct size_time_entry e;
4249
4250           e.size = streamer_read_uhwi (&ib);
4251           e.time = streamer_read_uhwi (&ib);
4252           e.predicate = read_predicate (&ib);
4253
4254           vec_safe_push (info->entry, e);
4255         }
4256
4257       p = read_predicate (&ib);
4258       set_hint_predicate (&info->loop_iterations, p);
4259       p = read_predicate (&ib);
4260       set_hint_predicate (&info->loop_stride, p);
4261       p = read_predicate (&ib);
4262       set_hint_predicate (&info->array_index, p);
4263       for (e = node->callees; e; e = e->next_callee)
4264         read_inline_edge_summary (&ib, e);
4265       for (e = node->indirect_calls; e; e = e->next_callee)
4266         read_inline_edge_summary (&ib, e);
4267     }
4268
4269   lto_free_section_data (file_data, LTO_section_inline_summary, NULL, data,
4270                          len);
4271   lto_data_in_delete (data_in);
4272 }
4273
4274
4275 /* Read inline summary.  Jump functions are shared among ipa-cp
4276    and inliner, so when ipa-cp is active, we don't need to write them
4277    twice.  */
4278
4279 void
4280 inline_read_summary (void)
4281 {
4282   struct lto_file_decl_data **file_data_vec = lto_get_file_decl_data ();
4283   struct lto_file_decl_data *file_data;
4284   unsigned int j = 0;
4285
4286   inline_summary_alloc ();
4287
4288   while ((file_data = file_data_vec[j++]))
4289     {
4290       size_t len;
4291       const char *data = lto_get_section_data (file_data,
4292                                                LTO_section_inline_summary,
4293                                                NULL, &len);
4294       if (data)
4295         inline_read_section (file_data, data, len);
4296       else
4297         /* Fatal error here.  We do not want to support compiling ltrans units
4298            with different version of compiler or different flags than the WPA
4299            unit, so this should never happen.  */
4300         fatal_error (input_location,
4301                      "ipa inline summary is missing in input file");
4302     }
4303   if (optimize)
4304     {
4305       ipa_register_cgraph_hooks ();
4306       if (!flag_ipa_cp)
4307         ipa_prop_read_jump_functions ();
4308     }
4309
4310   gcc_assert (inline_summaries);
4311   inline_summaries->enable_insertion_hook ();
4312 }
4313
4314
4315 /* Write predicate P to OB.  */
4316
4317 static void
4318 write_predicate (struct output_block *ob, struct predicate *p)
4319 {
4320   int j;
4321   if (p)
4322     for (j = 0; p->clause[j]; j++)
4323       {
4324         gcc_assert (j < MAX_CLAUSES);
4325         streamer_write_uhwi (ob, p->clause[j]);
4326       }
4327   streamer_write_uhwi (ob, 0);
4328 }
4329
4330
4331 /* Write inline summary for edge E to OB.  */
4332
4333 static void
4334 write_inline_edge_summary (struct output_block *ob, struct cgraph_edge *e)
4335 {
4336   struct inline_edge_summary *es = inline_edge_summary (e);
4337   int i;
4338
4339   streamer_write_uhwi (ob, es->call_stmt_size);
4340   streamer_write_uhwi (ob, es->call_stmt_time);
4341   streamer_write_uhwi (ob, es->loop_depth);
4342   write_predicate (ob, es->predicate);
4343   streamer_write_uhwi (ob, es->param.length ());
4344   for (i = 0; i < (int) es->param.length (); i++)
4345     streamer_write_uhwi (ob, es->param[i].change_prob);
4346 }
4347
4348
4349 /* Write inline summary for node in SET.
4350    Jump functions are shared among ipa-cp and inliner, so when ipa-cp is
4351    active, we don't need to write them twice.  */
4352
4353 void
4354 inline_write_summary (void)
4355 {
4356   struct cgraph_node *node;
4357   struct output_block *ob = create_output_block (LTO_section_inline_summary);
4358   lto_symtab_encoder_t encoder = ob->decl_state->symtab_node_encoder;
4359   unsigned int count = 0;
4360   int i;
4361
4362   for (i = 0; i < lto_symtab_encoder_size (encoder); i++)
4363     {
4364       symtab_node *snode = lto_symtab_encoder_deref (encoder, i);
4365       cgraph_node *cnode = dyn_cast <cgraph_node *> (snode);
4366       if (cnode && cnode->definition && !cnode->alias)
4367         count++;
4368     }
4369   streamer_write_uhwi (ob, count);
4370
4371   for (i = 0; i < lto_symtab_encoder_size (encoder); i++)
4372     {
4373       symtab_node *snode = lto_symtab_encoder_deref (encoder, i);
4374       cgraph_node *cnode = dyn_cast <cgraph_node *> (snode);
4375       if (cnode && (node = cnode)->definition && !node->alias)
4376         {
4377           struct inline_summary *info = inline_summaries->get (node);
4378           struct bitpack_d bp;
4379           struct cgraph_edge *edge;
4380           int i;
4381           size_time_entry *e;
4382           struct condition *c;
4383
4384           streamer_write_uhwi (ob,
4385                                lto_symtab_encoder_encode (encoder,
4386
4387                                                           node));
4388           streamer_write_hwi (ob, info->estimated_self_stack_size);
4389           streamer_write_hwi (ob, info->self_size);
4390           streamer_write_hwi (ob, info->self_time);
4391           bp = bitpack_create (ob->main_stream);
4392           bp_pack_value (&bp, info->inlinable, 1);
4393           bp_pack_value (&bp, info->contains_cilk_spawn, 1);
4394           streamer_write_bitpack (&bp);
4395           streamer_write_uhwi (ob, vec_safe_length (info->conds));
4396           for (i = 0; vec_safe_iterate (info->conds, i, &c); i++)
4397             {
4398               streamer_write_uhwi (ob, c->operand_num);
4399               streamer_write_uhwi (ob, c->code);
4400               stream_write_tree (ob, c->val, true);
4401               bp = bitpack_create (ob->main_stream);
4402               bp_pack_value (&bp, c->agg_contents, 1);
4403               bp_pack_value (&bp, c->by_ref, 1);
4404               streamer_write_bitpack (&bp);
4405               if (c->agg_contents)
4406                 streamer_write_uhwi (ob, c->offset);
4407             }
4408           streamer_write_uhwi (ob, vec_safe_length (info->entry));
4409           for (i = 0; vec_safe_iterate (info->entry, i, &e); i++)
4410             {
4411               streamer_write_uhwi (ob, e->size);
4412               streamer_write_uhwi (ob, e->time);
4413               write_predicate (ob, &e->predicate);
4414             }
4415           write_predicate (ob, info->loop_iterations);
4416           write_predicate (ob, info->loop_stride);
4417           write_predicate (ob, info->array_index);
4418           for (edge = node->callees; edge; edge = edge->next_callee)
4419             write_inline_edge_summary (ob, edge);
4420           for (edge = node->indirect_calls; edge; edge = edge->next_callee)
4421             write_inline_edge_summary (ob, edge);
4422         }
4423     }
4424   streamer_write_char_stream (ob->main_stream, 0);
4425   produce_asm (ob, NULL);
4426   destroy_output_block (ob);
4427
4428   if (optimize && !flag_ipa_cp)
4429     ipa_prop_write_jump_functions ();
4430 }
4431
4432
4433 /* Release inline summary.  */
4434
4435 void
4436 inline_free_summary (void)
4437 {
4438   struct cgraph_node *node;
4439   if (edge_removal_hook_holder)
4440     symtab->remove_edge_removal_hook (edge_removal_hook_holder);
4441   edge_removal_hook_holder = NULL;
4442   if (edge_duplication_hook_holder)
4443     symtab->remove_edge_duplication_hook (edge_duplication_hook_holder);
4444   edge_duplication_hook_holder = NULL;
4445   if (!inline_edge_summary_vec.exists ())
4446     return;
4447   FOR_EACH_DEFINED_FUNCTION (node)
4448     if (!node->alias)
4449       reset_inline_summary (node, inline_summaries->get (node));
4450   inline_summaries->release ();
4451   inline_summaries = NULL;
4452   inline_edge_summary_vec.release ();
4453   edge_predicate_pool.release ();
4454 }