gcc/ipa-inline-analysis.c

   1 /* Inlining decision heuristics.
   2    Copyright (C) 2003-2016 Free Software Foundation, Inc.
   3    Contributed by Jan Hubicka
   4
   5 This file is part of GCC.
   6
   7 GCC is free software; you can redistribute it and/or modify it under
   8 the terms of the GNU General Public License as published by the Free
   9 Software Foundation; either version 3, or (at your option) any later
  10 version.
  11
  12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  14 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  15 for more details.
  16
  17 You should have received a copy of the GNU General Public License
  18 along with GCC; see the file COPYING3.  If not see
  19 <http://www.gnu.org/licenses/>.  */
  20
  21 /* Analysis used by the inliner and other passes limiting code size growth.
  22
  23    We estimate for each function
  24      - function body size
  25      - average function execution time
  26      - inlining size benefit (that is how much of function body size
  27        and its call sequence is expected to disappear by inlining)
  28      - inlining time benefit
  29      - function frame size
  30    For each call
  31      - call statement size and time
  32
  33    inline_summary data structures store the above information locally (i.e.
  34    parameters of the function itself) and globally (i.e. parameters of
  35    the function created by applying all the inline decisions already
  36    present in the callgraph).
  37
  38    We provide accessors to the inline_summary data structure and
  39    basic logic updating the parameters when inlining is performed.
  40
  41    The summaries are context sensitive.  Context means
  42      1) partial assignment of known constant values of operands
  43      2) whether function is inlined into the call or not.
  44    It is easy to add more variants.  To represent function size and time
  45    that depends on context (i.e. it is known to be optimized away when
  46    context is known either by inlining or from IP-CP and cloning),
  47    we use predicates. Predicates are logical formulas in
  48    conjunctive-disjunctive form consisting of clauses. Clauses are bitmaps
  49    specifying what conditions must be true. Conditions are simple test
  50    of the form described above.
  51
  52    In order to make predicate (possibly) true, all of its clauses must
  53    be (possibly) true. To make clause (possibly) true, one of conditions
  54    it mentions must be (possibly) true.  There are fixed bounds on
  55    number of clauses and conditions and all the manipulation functions
  56    are conservative in positive direction. I.e. we may lose precision
  57    by thinking that predicate may be true even when it is not.
  58
  59    estimate_edge_size and estimate_edge_growth can be used to query
  60    function size/time in the given context.  inline_merge_summary merges
  61    properties of caller and callee after inlining.
  62
  63    Finally pass_inline_parameters is exported.  This is used to drive
  64    computation of function parameters used by the early inliner.  The IPA
  65    inliner performs analysis via its analyze_function method.  */
  66
  67 #include "config.h"
  68 #include "system.h"
  69 #include "coretypes.h"
  70 #include "backend.h"
  71 #include "tree.h"
  72 #include "gimple.h"
  73 #include "alloc-pool.h"
  74 #include "tree-pass.h"
  75 #include "ssa.h"
  76 #include "tree-streamer.h"
  77 #include "cgraph.h"
  78 #include "diagnostic.h"
  79 #include "fold-const.h"
  80 #include "print-tree.h"
  81 #include "tree-inline.h"
  82 #include "gimple-pretty-print.h"
  83 #include "params.h"
  84 #include "cfganal.h"
  85 #include "gimple-iterator.h"
  86 #include "tree-cfg.h"
  87 #include "tree-ssa-loop-niter.h"
  88 #include "tree-ssa-loop.h"
  89 #include "symbol-summary.h"
  90 #include "ipa-prop.h"
  91 #include "ipa-inline.h"
  92 #include "cfgloop.h"
  93 #include "tree-scalar-evolution.h"
  94 #include "ipa-utils.h"
  95 #include "cilk.h"
  96 #include "cfgexpand.h"
  97 #include "gimplify.h"
  98
/* The estimated runtime of a function can easily run into huge numbers with
   many nested loops.  Be sure we can compute time * INLINE_SIZE_SCALE * 2 in
   an integer.  For anything larger we use gcov_type.  */
#define MAX_TIME 500000

/* Number of condition bits a clause can hold.  This equals the number of
   bits in an integer, but it is spelled as a fixed constant because we
   really want to be stable across different hosts.  */
#define NUM_CONDITIONS 32
 107
/* Numbering of the condition bits inside a clause.  The first two conditions
   are fixed; conditions recorded by add_condition are numbered from
   predicate_first_dynamic_condition on.  */
enum predicate_conditions
{
  /* Condition that never holds; the false predicate is the single clause
     testing just this condition.  */
  predicate_false_condition = 0,
  /* Condition that holds when the function is not inlined.  */
  predicate_not_inlined_condition = 1,
  /* Number of the condition stored at index 0 of the summary's condition
     vector.  */
  predicate_first_dynamic_condition = 2
};
 114
/* Special condition code we use to represent the test that an operand is not
   a compile time constant.  */
#define IS_NOT_CONSTANT ERROR_MARK
/* Special condition code we use to represent the test that an operand is
   changed across invocations of the function.  When an operand
   IS_NOT_CONSTANT it is always CHANGED; however, e.g. loop invariants can be
   unchanged in a given percentage of executions even when they are not
   compile time constants.  */
#define CHANGED IDENTIFIER_NODE
 123
/* Holders of the IPA cgraph hooks, followed by forward declarations of the
   hook callbacks themselves.  */
static struct cgraph_2edge_hook_list *edge_duplication_hook_holder;
static struct cgraph_edge_hook_list *edge_removal_hook_holder;
static void inline_edge_removal_hook (struct cgraph_edge *, void *);
static void inline_edge_duplication_hook (struct cgraph_edge *,
                                          struct cgraph_edge *, void *);

/* Summary object holding the inline summaries of functions.
   In GGC memory because conditions might point to constant trees.  */
function_summary <inline_summary *> *inline_summaries;
/* Vector holding the inline summaries of call graph edges.  */
vec<inline_edge_summary_t> inline_edge_summary_vec;

/* Cached node/edge growths.  */
vec<edge_growth_cache_entry> edge_growth_cache;

/* Allocation pool for the predicates attached to edges; hint predicates set
   through set_hint_predicate are allocated from it as well.  */
static object_allocator<predicate> edge_predicate_pool ("edge predicates");
 141
 142 /* Return true predicate (tautology).
 143    We represent it by empty list of clauses.  */
 144
 145 static inline struct predicate
 146 true_predicate (void)
 147 {
 148   struct predicate p;
 149   p.clause[0] = 0;
 150   return p;
 151 }
 152
 153
 154 /* Return predicate testing single condition number COND.  */
 155
 156 static inline struct predicate
 157 single_cond_predicate (int cond)
 158 {
 159   struct predicate p;
 160   p.clause[0] = 1 << cond;
 161   p.clause[1] = 0;
 162   return p;
 163 }
 164
 165
 166 /* Return false predicate.  First clause require false condition.  */
 167
 168 static inline struct predicate
 169 false_predicate (void)
 170 {
 171   return single_cond_predicate (predicate_false_condition);
 172 }
 173
 174
 175 /* Return true if P is (true).  */
 176
 177 static inline bool
 178 true_predicate_p (struct predicate *p)
 179 {
 180   return !p->clause[0];
 181 }
 182
 183
 184 /* Return true if P is (false).  */
 185
 186 static inline bool
 187 false_predicate_p (struct predicate *p)
 188 {
 189   if (p->clause[0] == (1 << predicate_false_condition))
 190     {
 191       gcc_checking_assert (!p->clause[1]
 192                            && p->clause[0] == 1 << predicate_false_condition);
 193       return true;
 194     }
 195   return false;
 196 }
 197
 198
 199 /* Return predicate that is set true when function is not inlined.  */
 200
 201 static inline struct predicate
 202 not_inlined_predicate (void)
 203 {
 204   return single_cond_predicate (predicate_not_inlined_condition);
 205 }
 206
/* Simple description of whether a memory load or a condition refers to a load
   from an aggregate and if so, how and where from in the aggregate.
   Individual fields have the same meaning as the fields with the same name in
   struct condition.  */

struct agg_position_info
{
  /* Position of the loaded value within the aggregate.  add_condition
     compares it only when AGG_CONTENTS is set.  */
  HOST_WIDE_INT offset;
  /* True when the value is loaded from an aggregate.  */
  bool agg_contents;
  /* Copied by add_condition into the by_ref field of the condition;
     presumably true when the aggregate is passed by reference -- confirm
     against struct condition.  */
  bool by_ref;
};
 218
 219 /* Add condition to condition list CONDS.  AGGPOS describes whether the used
 220    oprand is loaded from an aggregate and where in the aggregate it is.  It can
 221    be NULL, which means this not a load from an aggregate.  */
 222
 223 static struct predicate
 224 add_condition (struct inline_summary *summary, int operand_num,
 225                struct agg_position_info *aggpos,
 226                enum tree_code code, tree val)
 227 {
 228   int i;
 229   struct condition *c;
 230   struct condition new_cond;
 231   HOST_WIDE_INT offset;
 232   bool agg_contents, by_ref;
 233
 234   if (aggpos)
 235     {
 236       offset = aggpos->offset;
 237       agg_contents = aggpos->agg_contents;
 238       by_ref = aggpos->by_ref;
 239     }
 240   else
 241     {
 242       offset = 0;
 243       agg_contents = false;
 244       by_ref = false;
 245     }
 246
 247   gcc_checking_assert (operand_num >= 0);
 248   for (i = 0; vec_safe_iterate (summary->conds, i, &c); i++)
 249     {
 250       if (c->operand_num == operand_num
 251           && c->code == code
 252           && c->val == val
 253           && c->agg_contents == agg_contents
 254           && (!agg_contents || (c->offset == offset && c->by_ref == by_ref)))
 255         return single_cond_predicate (i + predicate_first_dynamic_condition);
 256     }
 257   /* Too many conditions.  Give up and return constant true.  */
 258   if (i == NUM_CONDITIONS - predicate_first_dynamic_condition)
 259     return true_predicate ();
 260
 261   new_cond.operand_num = operand_num;
 262   new_cond.code = code;
 263   new_cond.val = val;
 264   new_cond.agg_contents = agg_contents;
 265   new_cond.by_ref = by_ref;
 266   new_cond.offset = offset;
 267   vec_safe_push (summary->conds, new_cond);
 268   return single_cond_predicate (i + predicate_first_dynamic_condition);
 269 }
 270
 271
 272 /* Add clause CLAUSE into the predicate P.  */
 273
 274 static inline void
 275 add_clause (conditions conditions, struct predicate *p, clause_t clause)
 276 {
 277   int i;
 278   int i2;
 279   int insert_here = -1;
 280   int c1, c2;
 281
 282   /* True clause.  */
 283   if (!clause)
 284     return;
 285
 286   /* False clause makes the whole predicate false.  Kill the other variants.  */
 287   if (clause == (1 << predicate_false_condition))
 288     {
 289       p->clause[0] = (1 << predicate_false_condition);
 290       p->clause[1] = 0;
 291       return;
 292     }
 293   if (false_predicate_p (p))
 294     return;
 295
 296   /* No one should be silly enough to add false into nontrivial clauses.  */
 297   gcc_checking_assert (!(clause & (1 << predicate_false_condition)));
 298
 299   /* Look where to insert the clause.  At the same time prune out
 300      clauses of P that are implied by the new clause and thus
 301      redundant.  */
 302   for (i = 0, i2 = 0; i <= MAX_CLAUSES; i++)
 303     {
 304       p->clause[i2] = p->clause[i];
 305
 306       if (!p->clause[i])
 307         break;
 308
 309       /* If p->clause[i] implies clause, there is nothing to add.  */
 310       if ((p->clause[i] & clause) == p->clause[i])
 311         {
 312           /* We had nothing to add, none of clauses should've become
 313              redundant.  */
 314           gcc_checking_assert (i == i2);
 315           return;
 316         }
 317
 318       if (p->clause[i] < clause && insert_here < 0)
 319         insert_here = i2;
 320
 321       /* If clause implies p->clause[i], then p->clause[i] becomes redundant.
 322          Otherwise the p->clause[i] has to stay.  */
 323       if ((p->clause[i] & clause) != clause)
 324         i2++;
 325     }
 326
 327   /* Look for clauses that are obviously true.  I.e.
 328      op0 == 5 || op0 != 5.  */
 329   for (c1 = predicate_first_dynamic_condition; c1 < NUM_CONDITIONS; c1++)
 330     {
 331       condition *cc1;
 332       if (!(clause & (1 << c1)))
 333         continue;
 334       cc1 = &(*conditions)[c1 - predicate_first_dynamic_condition];
 335       /* We have no way to represent !CHANGED and !IS_NOT_CONSTANT
 336          and thus there is no point for looking for them.  */
 337       if (cc1->code == CHANGED || cc1->code == IS_NOT_CONSTANT)
 338         continue;
 339       for (c2 = c1 + 1; c2 < NUM_CONDITIONS; c2++)
 340         if (clause & (1 << c2))
 341           {
 342             condition *cc1 =
 343               &(*conditions)[c1 - predicate_first_dynamic_condition];
 344             condition *cc2 =
 345               &(*conditions)[c2 - predicate_first_dynamic_condition];
 346             if (cc1->operand_num == cc2->operand_num
 347                 && cc1->val == cc2->val
 348                 && cc2->code != IS_NOT_CONSTANT
 349                 && cc2->code != CHANGED
 350                 && cc1->code == invert_tree_comparison (cc2->code,
 351                                                         HONOR_NANS (cc1->val)))
 352               return;
 353           }
 354     }
 355
 356
 357   /* We run out of variants.  Be conservative in positive direction.  */
 358   if (i2 == MAX_CLAUSES)
 359     return;
 360   /* Keep clauses in decreasing order. This makes equivalence testing easy.  */
 361   p->clause[i2 + 1] = 0;
 362   if (insert_here >= 0)
 363     for (; i2 > insert_here; i2--)
 364       p->clause[i2] = p->clause[i2 - 1];
 365   else
 366     insert_here = i2;
 367   p->clause[insert_here] = clause;
 368 }
 369
 370
 371 /* Return P & P2.  */
 372
 373 static struct predicate
 374 and_predicates (conditions conditions,
 375                 struct predicate *p, struct predicate *p2)
 376 {
 377   struct predicate out = *p;
 378   int i;
 379
 380   /* Avoid busy work.  */
 381   if (false_predicate_p (p2) || true_predicate_p (p))
 382     return *p2;
 383   if (false_predicate_p (p) || true_predicate_p (p2))
 384     return *p;
 385
 386   /* See how far predicates match.  */
 387   for (i = 0; p->clause[i] && p->clause[i] == p2->clause[i]; i++)
 388     {
 389       gcc_checking_assert (i < MAX_CLAUSES);
 390     }
 391
 392   /* Combine the predicates rest.  */
 393   for (; p2->clause[i]; i++)
 394     {
 395       gcc_checking_assert (i < MAX_CLAUSES);
 396       add_clause (conditions, &out, p2->clause[i]);
 397     }
 398   return out;
 399 }
 400
 401
 402 /* Return true if predicates are obviously equal.  */
 403
 404 static inline bool
 405 predicates_equal_p (struct predicate *p, struct predicate *p2)
 406 {
 407   int i;
 408   for (i = 0; p->clause[i]; i++)
 409     {
 410       gcc_checking_assert (i < MAX_CLAUSES);
 411       gcc_checking_assert (p->clause[i] > p->clause[i + 1]);
 412       gcc_checking_assert (!p2->clause[i]
 413                            || p2->clause[i] > p2->clause[i + 1]);
 414       if (p->clause[i] != p2->clause[i])
 415         return false;
 416     }
 417   return !p2->clause[i];
 418 }
 419
 420
 421 /* Return P | P2.  */
 422
 423 static struct predicate
 424 or_predicates (conditions conditions,
 425                struct predicate *p, struct predicate *p2)
 426 {
 427   struct predicate out = true_predicate ();
 428   int i, j;
 429
 430   /* Avoid busy work.  */
 431   if (false_predicate_p (p2) || true_predicate_p (p))
 432     return *p;
 433   if (false_predicate_p (p) || true_predicate_p (p2))
 434     return *p2;
 435   if (predicates_equal_p (p, p2))
 436     return *p;
 437
 438   /* OK, combine the predicates.  */
 439   for (i = 0; p->clause[i]; i++)
 440     for (j = 0; p2->clause[j]; j++)
 441       {
 442         gcc_checking_assert (i < MAX_CLAUSES && j < MAX_CLAUSES);
 443         add_clause (conditions, &out, p->clause[i] | p2->clause[j]);
 444       }
 445   return out;
 446 }
 447
 448
 449 /* Having partial truth assignment in POSSIBLE_TRUTHS, return false
 450    if predicate P is known to be false.  */
 451
 452 static bool
 453 evaluate_predicate (struct predicate *p, clause_t possible_truths)
 454 {
 455   int i;
 456
 457   /* True remains true.  */
 458   if (true_predicate_p (p))
 459     return true;
 460
 461   gcc_assert (!(possible_truths & (1 << predicate_false_condition)));
 462
 463   /* See if we can find clause we can disprove.  */
 464   for (i = 0; p->clause[i]; i++)
 465     {
 466       gcc_checking_assert (i < MAX_CLAUSES);
 467       if (!(p->clause[i] & possible_truths))
 468         return false;
 469     }
 470   return true;
 471 }
 472
 473 /* Return the probability in range 0...REG_BR_PROB_BASE that the predicated
 474    instruction will be recomputed per invocation of the inlined call.  */
 475
 476 static int
 477 predicate_probability (conditions conds,
 478                        struct predicate *p, clause_t possible_truths,
 479                        vec<inline_param_summary> inline_param_summary)
 480 {
 481   int i;
 482   int combined_prob = REG_BR_PROB_BASE;
 483
 484   /* True remains true.  */
 485   if (true_predicate_p (p))
 486     return REG_BR_PROB_BASE;
 487
 488   if (false_predicate_p (p))
 489     return 0;
 490
 491   gcc_assert (!(possible_truths & (1 << predicate_false_condition)));
 492
 493   /* See if we can find clause we can disprove.  */
 494   for (i = 0; p->clause[i]; i++)
 495     {
 496       gcc_checking_assert (i < MAX_CLAUSES);
 497       if (!(p->clause[i] & possible_truths))
 498         return 0;
 499       else
 500         {
 501           int this_prob = 0;
 502           int i2;
 503           if (!inline_param_summary.exists ())
 504             return REG_BR_PROB_BASE;
 505           for (i2 = 0; i2 < NUM_CONDITIONS; i2++)
 506             if ((p->clause[i] & possible_truths) & (1 << i2))
 507               {
 508                 if (i2 >= predicate_first_dynamic_condition)
 509                   {
 510                     condition *c =
 511                       &(*conds)[i2 - predicate_first_dynamic_condition];
 512                     if (c->code == CHANGED
 513                         && (c->operand_num <
 514                             (int) inline_param_summary.length ()))
 515                       {
 516                         int iprob =
 517                           inline_param_summary[c->operand_num].change_prob;
 518                         this_prob = MAX (this_prob, iprob);
 519                       }
 520                     else
 521                       this_prob = REG_BR_PROB_BASE;
 522                   }
 523                 else
 524                   this_prob = REG_BR_PROB_BASE;
 525               }
 526           combined_prob = MIN (this_prob, combined_prob);
 527           if (!combined_prob)
 528             return 0;
 529         }
 530     }
 531   return combined_prob;
 532 }
 533
 534
 535 /* Dump conditional COND.  */
 536
 537 static void
 538 dump_condition (FILE *f, conditions conditions, int cond)
 539 {
 540   condition *c;
 541   if (cond == predicate_false_condition)
 542     fprintf (f, "false");
 543   else if (cond == predicate_not_inlined_condition)
 544     fprintf (f, "not inlined");
 545   else
 546     {
 547       c = &(*conditions)[cond - predicate_first_dynamic_condition];
 548       fprintf (f, "op%i", c->operand_num);
 549       if (c->agg_contents)
 550         fprintf (f, "[%soffset: " HOST_WIDE_INT_PRINT_DEC "]",
 551                  c->by_ref ? "ref " : "", c->offset);
 552       if (c->code == IS_NOT_CONSTANT)
 553         {
 554           fprintf (f, " not constant");
 555           return;
 556         }
 557       if (c->code == CHANGED)
 558         {
 559           fprintf (f, " changed");
 560           return;
 561         }
 562       fprintf (f, " %s ", op_symbol_code (c->code));
 563       print_generic_expr (f, c->val, 1);
 564     }
 565 }
 566
 567
 568 /* Dump clause CLAUSE.  */
 569
 570 static void
 571 dump_clause (FILE *f, conditions conds, clause_t clause)
 572 {
 573   int i;
 574   bool found = false;
 575   fprintf (f, "(");
 576   if (!clause)
 577     fprintf (f, "true");
 578   for (i = 0; i < NUM_CONDITIONS; i++)
 579     if (clause & (1 << i))
 580       {
 581         if (found)
 582           fprintf (f, " || ");
 583         found = true;
 584         dump_condition (f, conds, i);
 585       }
 586   fprintf (f, ")");
 587 }
 588
 589
 590 /* Dump predicate PREDICATE.  */
 591
 592 static void
 593 dump_predicate (FILE *f, conditions conds, struct predicate *pred)
 594 {
 595   int i;
 596   if (true_predicate_p (pred))
 597     dump_clause (f, conds, 0);
 598   else
 599     for (i = 0; pred->clause[i]; i++)
 600       {
 601         if (i)
 602           fprintf (f, " && ");
 603         dump_clause (f, conds, pred->clause[i]);
 604       }
 605   fprintf (f, "\n");
 606 }
 607
 608
 609 /* Dump inline hints.  */
 610 void
 611 dump_inline_hints (FILE *f, inline_hints hints)
 612 {
 613   if (!hints)
 614     return;
 615   fprintf (f, "inline hints:");
 616   if (hints & INLINE_HINT_indirect_call)
 617     {
 618       hints &= ~INLINE_HINT_indirect_call;
 619       fprintf (f, " indirect_call");
 620     }
 621   if (hints & INLINE_HINT_loop_iterations)
 622     {
 623       hints &= ~INLINE_HINT_loop_iterations;
 624       fprintf (f, " loop_iterations");
 625     }
 626   if (hints & INLINE_HINT_loop_stride)
 627     {
 628       hints &= ~INLINE_HINT_loop_stride;
 629       fprintf (f, " loop_stride");
 630     }
 631   if (hints & INLINE_HINT_same_scc)
 632     {
 633       hints &= ~INLINE_HINT_same_scc;
 634       fprintf (f, " same_scc");
 635     }
 636   if (hints & INLINE_HINT_in_scc)
 637     {
 638       hints &= ~INLINE_HINT_in_scc;
 639       fprintf (f, " in_scc");
 640     }
 641   if (hints & INLINE_HINT_cross_module)
 642     {
 643       hints &= ~INLINE_HINT_cross_module;
 644       fprintf (f, " cross_module");
 645     }
 646   if (hints & INLINE_HINT_declared_inline)
 647     {
 648       hints &= ~INLINE_HINT_declared_inline;
 649       fprintf (f, " declared_inline");
 650     }
 651   if (hints & INLINE_HINT_array_index)
 652     {
 653       hints &= ~INLINE_HINT_array_index;
 654       fprintf (f, " array_index");
 655     }
 656   if (hints & INLINE_HINT_known_hot)
 657     {
 658       hints &= ~INLINE_HINT_known_hot;
 659       fprintf (f, " known_hot");
 660     }
 661   gcc_assert (!hints);
 662 }
 663
 664
 665 /* Record SIZE and TIME under condition PRED into the inline summary.  */
 666
 667 static void
 668 account_size_time (struct inline_summary *summary, int size, int time,
 669                    struct predicate *pred)
 670 {
 671   size_time_entry *e;
 672   bool found = false;
 673   int i;
 674
 675   if (false_predicate_p (pred))
 676     return;
 677
 678   /* We need to create initial empty unconitional clause, but otherwie
 679      we don't need to account empty times and sizes.  */
 680   if (!size && !time && summary->entry)
 681     return;
 682
 683   /* Watch overflow that might result from insane profiles.  */
 684   if (time > MAX_TIME * INLINE_TIME_SCALE)
 685     time = MAX_TIME * INLINE_TIME_SCALE;
 686   gcc_assert (time >= 0);
 687
 688   for (i = 0; vec_safe_iterate (summary->entry, i, &e); i++)
 689     if (predicates_equal_p (&e->predicate, pred))
 690       {
 691         found = true;
 692         break;
 693       }
 694   if (i == 256)
 695     {
 696       i = 0;
 697       found = true;
 698       e = &(*summary->entry)[0];
 699       gcc_assert (!e->predicate.clause[0]);
 700       if (dump_file && (dump_flags & TDF_DETAILS))
 701         fprintf (dump_file,
 702                  "\t\tReached limit on number of entries, "
 703                  "ignoring the predicate.");
 704     }
 705   if (dump_file && (dump_flags & TDF_DETAILS) && (time || size))
 706     {
 707       fprintf (dump_file,
 708                "\t\tAccounting size:%3.2f, time:%3.2f on %spredicate:",
 709                ((double) size) / INLINE_SIZE_SCALE,
 710                ((double) time) / INLINE_TIME_SCALE, found ? "" : "new ");
 711       dump_predicate (dump_file, summary->conds, pred);
 712     }
 713   if (!found)
 714     {
 715       struct size_time_entry new_entry;
 716       new_entry.size = size;
 717       new_entry.time = time;
 718       new_entry.predicate = *pred;
 719       vec_safe_push (summary->entry, new_entry);
 720     }
 721   else
 722     {
 723       e->size += size;
 724       e->time += time;
 725       if (e->time > MAX_TIME * INLINE_TIME_SCALE)
 726         e->time = MAX_TIME * INLINE_TIME_SCALE;
 727     }
 728 }
 729
 730 /* We proved E to be unreachable, redirect it to __bultin_unreachable.  */
 731
 732 static struct cgraph_edge *
 733 redirect_to_unreachable (struct cgraph_edge *e)
 734 {
 735   struct cgraph_node *callee = !e->inline_failed ? e->callee : NULL;
 736   struct cgraph_node *target = cgraph_node::get_create
 737                       (builtin_decl_implicit (BUILT_IN_UNREACHABLE));
 738
 739   if (e->speculative)
 740     e = e->resolve_speculation (target->decl);
 741   else if (!e->callee)
 742     e->make_direct (target);
 743   else
 744     e->redirect_callee (target);
 745   struct inline_edge_summary *es = inline_edge_summary (e);
 746   e->inline_failed = CIF_UNREACHABLE;
 747   e->frequency = 0;
 748   e->count = 0;
 749   es->call_stmt_size = 0;
 750   es->call_stmt_time = 0;
 751   if (callee)
 752     callee->remove_symbol_and_inline_clones ();
 753   return e;
 754 }
 755
 756 /* Set predicate for edge E.  */
 757
 758 static void
 759 edge_set_predicate (struct cgraph_edge *e, struct predicate *predicate)
 760 {
 761   /* If the edge is determined to be never executed, redirect it
 762      to BUILTIN_UNREACHABLE to save inliner from inlining into it.  */
 763   if (predicate && false_predicate_p (predicate)
 764       /* When handling speculative edges, we need to do the redirection
 765          just once.  Do it always on the direct edge, so we do not
 766          attempt to resolve speculation while duplicating the edge.  */
 767       && (!e->speculative || e->callee))
 768     e = redirect_to_unreachable (e);
 769
 770   struct inline_edge_summary *es = inline_edge_summary (e);
 771   if (predicate && !true_predicate_p (predicate))
 772     {
 773       if (!es->predicate)
 774         es->predicate = edge_predicate_pool.allocate ();
 775       *es->predicate = *predicate;
 776     }
 777   else
 778     {
 779       if (es->predicate)
 780         edge_predicate_pool.remove (es->predicate);
 781       es->predicate = NULL;
 782     }
 783 }
 784
 785 /* Set predicate for hint *P.  */
 786
 787 static void
 788 set_hint_predicate (struct predicate **p, struct predicate new_predicate)
 789 {
 790   if (false_predicate_p (&new_predicate) || true_predicate_p (&new_predicate))
 791     {
 792       if (*p)
 793         edge_predicate_pool.remove (*p);
 794       *p = NULL;
 795     }
 796   else
 797     {
 798       if (!*p)
 799         *p = edge_predicate_pool.allocate ();
 800       **p = new_predicate;
 801     }
 802 }
 803
 804
 805 /* KNOWN_VALS is partial mapping of parameters of NODE to constant values.
 806    KNOWN_AGGS is a vector of aggreggate jump functions for each parameter.
 807    Return clause of possible truths. When INLINE_P is true, assume that we are
 808    inlining.
 809
 810    ERROR_MARK means compile time invariant.  */
 811
 812 static clause_t
 813 evaluate_conditions_for_known_args (struct cgraph_node *node,
 814                                     bool inline_p,
 815                                     vec<tree> known_vals,
 816                                     vec<ipa_agg_jump_function_p>
 817                                     known_aggs)
 818 {
 819   clause_t clause = inline_p ? 0 : 1 << predicate_not_inlined_condition;
 820   struct inline_summary *info = inline_summaries->get (node);
 821   int i;
 822   struct condition *c;
 823
 824   for (i = 0; vec_safe_iterate (info->conds, i, &c); i++)
 825     {
 826       tree val;
 827       tree res;
 828
 829       /* We allow call stmt to have fewer arguments than the callee function
 830          (especially for K&R style programs).  So bound check here (we assume
 831          known_aggs vector, if non-NULL, has the same length as
 832          known_vals).  */
 833       gcc_checking_assert (!known_aggs.exists ()
 834                            || (known_vals.length () == known_aggs.length ()));
 835       if (c->operand_num >= (int) known_vals.length ())
 836         {
 837           clause |= 1 << (i + predicate_first_dynamic_condition);
 838           continue;
 839         }
 840
 841       if (c->agg_contents)
 842         {
 843           struct ipa_agg_jump_function *agg;
 844
 845           if (c->code == CHANGED
 846               && !c->by_ref
 847               && (known_vals[c->operand_num] == error_mark_node))
 848             continue;
 849
 850           if (known_aggs.exists ())
 851             {
 852               agg = known_aggs[c->operand_num];
 853               val = ipa_find_agg_cst_for_param (agg, c->offset, c->by_ref);
 854             }
 855           else
 856             val = NULL_TREE;
 857         }
 858       else
 859         {
 860           val = known_vals[c->operand_num];
 861           if (val == error_mark_node && c->code != CHANGED)
 862             val = NULL_TREE;
 863         }
 864
 865       if (!val)
 866         {
 867           clause |= 1 << (i + predicate_first_dynamic_condition);
 868           continue;
 869         }
 870       if (c->code == IS_NOT_CONSTANT || c->code == CHANGED)
 871         continue;
 872
 873       if (operand_equal_p (TYPE_SIZE (TREE_TYPE (c->val)),
 874                            TYPE_SIZE (TREE_TYPE (val)), 0))
 875         {
 876           val = fold_unary (VIEW_CONVERT_EXPR, TREE_TYPE (c->val), val);
 877
 878           res = val
 879             ? fold_binary_to_constant (c->code, boolean_type_node, val, c->val)
 880             : NULL;
 881
 882           if (res && integer_zerop (res))
 883             continue;
 884         }
 885       clause |= 1 << (i + predicate_first_dynamic_condition);
 886     }
 887   return clause;
 888 }
 889
 890
 891 /* Work out what conditions might be true at invocation of E.  */
 892
 893 static void
 894 evaluate_properties_for_edge (struct cgraph_edge *e, bool inline_p,
 895                               clause_t *clause_ptr,
 896                               vec<tree> *known_vals_ptr,
 897                               vec<ipa_polymorphic_call_context>
 898                               *known_contexts_ptr,
 899                               vec<ipa_agg_jump_function_p> *known_aggs_ptr)
 900 {
 901   struct cgraph_node *callee = e->callee->ultimate_alias_target ();
 902   struct inline_summary *info = inline_summaries->get (callee);
 903   vec<tree> known_vals = vNULL;
 904   vec<ipa_agg_jump_function_p> known_aggs = vNULL;
 905
 906   if (clause_ptr)
 907     *clause_ptr = inline_p ? 0 : 1 << predicate_not_inlined_condition;
 908   if (known_vals_ptr)
 909     known_vals_ptr->create (0);
 910   if (known_contexts_ptr)
 911     known_contexts_ptr->create (0);
 912
 913   if (ipa_node_params_sum
 914       && !e->call_stmt_cannot_inline_p
 915       && ((clause_ptr && info->conds) || known_vals_ptr || known_contexts_ptr))
 916     {
 917       struct ipa_node_params *parms_info;
 918       struct ipa_edge_args *args = IPA_EDGE_REF (e);
 919       struct inline_edge_summary *es = inline_edge_summary (e);
 920       int i, count = ipa_get_cs_argument_count (args);
 921
 922       if (e->caller->global.inlined_to)
 923         parms_info = IPA_NODE_REF (e->caller->global.inlined_to);
 924       else
 925         parms_info = IPA_NODE_REF (e->caller);
 926
 927       if (count && (info->conds || known_vals_ptr))
 928         known_vals.safe_grow_cleared (count);
 929       if (count && (info->conds || known_aggs_ptr))
 930         known_aggs.safe_grow_cleared (count);
 931       if (count && known_contexts_ptr)
 932         known_contexts_ptr->safe_grow_cleared (count);
 933
 934       for (i = 0; i < count; i++)
 935         {
 936           struct ipa_jump_func *jf = ipa_get_ith_jump_func (args, i);
 937           tree cst = ipa_value_from_jfunc (parms_info, jf);
 938
 939           if (!cst && e->call_stmt
 940               && i < (int)gimple_call_num_args (e->call_stmt))
 941             {
 942               cst = gimple_call_arg (e->call_stmt, i);
 943               if (!is_gimple_min_invariant (cst))
 944                 cst = NULL;
 945             }
 946           if (cst)
 947             {
 948               gcc_checking_assert (TREE_CODE (cst) != TREE_BINFO);
 949               if (known_vals.exists ())
 950                 known_vals[i] = cst;
 951             }
 952           else if (inline_p && !es->param[i].change_prob)
 953             known_vals[i] = error_mark_node;
 954
 955           if (known_contexts_ptr)
 956             (*known_contexts_ptr)[i] = ipa_context_from_jfunc (parms_info, e,
 957                                                                i, jf);
 958           /* TODO: When IPA-CP starts propagating and merging aggregate jump
 959              functions, use its knowledge of the caller too, just like the
 960              scalar case above.  */
 961           known_aggs[i] = &jf->agg;
 962         }
 963     }
 964   else if (e->call_stmt && !e->call_stmt_cannot_inline_p
 965            && ((clause_ptr && info->conds) || known_vals_ptr))
 966     {
 967       int i, count = (int)gimple_call_num_args (e->call_stmt);
 968
 969       if (count && (info->conds || known_vals_ptr))
 970         known_vals.safe_grow_cleared (count);
 971       for (i = 0; i < count; i++)
 972         {
 973           tree cst = gimple_call_arg (e->call_stmt, i);
 974           if (!is_gimple_min_invariant (cst))
 975             cst = NULL;
 976           if (cst)
 977             known_vals[i] = cst;
 978         }
 979     }
 980
 981   if (clause_ptr)
 982     *clause_ptr = evaluate_conditions_for_known_args (callee, inline_p,
 983                                                       known_vals, known_aggs);
 984
 985   if (known_vals_ptr)
 986     *known_vals_ptr = known_vals;
 987   else
 988     known_vals.release ();
 989
 990   if (known_aggs_ptr)
 991     *known_aggs_ptr = known_aggs;
 992   else
 993     known_aggs.release ();
 994 }
 995
 996
 997 /* Allocate the inline summary vector or resize it to cover all cgraph nodes. */
 998
 999 static void
1000 inline_summary_alloc (void)
1001 {
1002   if (!edge_removal_hook_holder)
1003     edge_removal_hook_holder =
1004       symtab->add_edge_removal_hook (&inline_edge_removal_hook, NULL);
1005   if (!edge_duplication_hook_holder)
1006     edge_duplication_hook_holder =
1007       symtab->add_edge_duplication_hook (&inline_edge_duplication_hook, NULL);
1008
1009   if (!inline_summaries)
1010     inline_summaries = (inline_summary_t*) inline_summary_t::create_ggc (symtab);
1011
1012   if (inline_edge_summary_vec.length () <= (unsigned) symtab->edges_max_uid)
1013     inline_edge_summary_vec.safe_grow_cleared (symtab->edges_max_uid + 1);
1014 }
1015
1016 /* We are called multiple time for given function; clear
1017    data from previous run so they are not cumulated.  */
1018
1019 static void
1020 reset_inline_edge_summary (struct cgraph_edge *e)
1021 {
1022   if (e->uid < (int) inline_edge_summary_vec.length ())
1023     {
1024       struct inline_edge_summary *es = inline_edge_summary (e);
1025
1026       es->call_stmt_size = es->call_stmt_time = 0;
1027       if (es->predicate)
1028         edge_predicate_pool.remove (es->predicate);
1029       es->predicate = NULL;
1030       es->param.release ();
1031     }
1032 }
1033
1034 /* We are called multiple time for given function; clear
1035    data from previous run so they are not cumulated.  */
1036
1037 static void
1038 reset_inline_summary (struct cgraph_node *node,
1039                       inline_summary *info)
1040 {
1041   struct cgraph_edge *e;
1042
1043   info->self_size = info->self_time = 0;
1044   info->estimated_stack_size = 0;
1045   info->estimated_self_stack_size = 0;
1046   info->stack_frame_offset = 0;
1047   info->size = 0;
1048   info->time = 0;
1049   info->growth = 0;
1050   info->scc_no = 0;
1051   if (info->loop_iterations)
1052     {
1053       edge_predicate_pool.remove (info->loop_iterations);
1054       info->loop_iterations = NULL;
1055     }
1056   if (info->loop_stride)
1057     {
1058       edge_predicate_pool.remove (info->loop_stride);
1059       info->loop_stride = NULL;
1060     }
1061   if (info->array_index)
1062     {
1063       edge_predicate_pool.remove (info->array_index);
1064       info->array_index = NULL;
1065     }
1066   vec_free (info->conds);
1067   vec_free (info->entry);
1068   for (e = node->callees; e; e = e->next_callee)
1069     reset_inline_edge_summary (e);
1070   for (e = node->indirect_calls; e; e = e->next_callee)
1071     reset_inline_edge_summary (e);
1072   info->fp_expressions = false;
1073 }
1074
/* Hook that is called by cgraph.c when a node is removed.  Releases
   everything held by summary INFO of NODE, including the summaries of its
   outgoing edges, by delegating to reset_inline_summary.  */

void
inline_summary_t::remove (cgraph_node *node, inline_summary *info)
{
  reset_inline_summary (node, info);
}
1082
1083 /* Remap predicate P of former function to be predicate of duplicated function.
1084    POSSIBLE_TRUTHS is clause of possible truths in the duplicated node,
1085    INFO is inline summary of the duplicated node.  */
1086
1087 static struct predicate
1088 remap_predicate_after_duplication (struct predicate *p,
1089                                    clause_t possible_truths,
1090                                    struct inline_summary *info)
1091 {
1092   struct predicate new_predicate = true_predicate ();
1093   int j;
1094   for (j = 0; p->clause[j]; j++)
1095     if (!(possible_truths & p->clause[j]))
1096       {
1097         new_predicate = false_predicate ();
1098         break;
1099       }
1100     else
1101       add_clause (info->conds, &new_predicate,
1102                   possible_truths & p->clause[j]);
1103   return new_predicate;
1104 }
1105
1106 /* Same as remap_predicate_after_duplication but handle hint predicate *P.
1107    Additionally care about allocating new memory slot for updated predicate
1108    and set it to NULL when it becomes true or false (and thus uninteresting).
1109  */
1110
1111 static void
1112 remap_hint_predicate_after_duplication (struct predicate **p,
1113                                         clause_t possible_truths,
1114                                         struct inline_summary *info)
1115 {
1116   struct predicate new_predicate;
1117
1118   if (!*p)
1119     return;
1120
1121   new_predicate = remap_predicate_after_duplication (*p,
1122                                                      possible_truths, info);
1123   /* We do not want to free previous predicate; it is used by node origin.  */
1124   *p = NULL;
1125   set_hint_predicate (p, new_predicate);
1126 }
1127
1128
/* Hook that is called by cgraph.c when a node is duplicated.

   SRC is the node being copied and DST is its copy.  The third (unnamed)
   argument is not used; the summary of SRC is looked up through
   inline_summaries instead.  INFO is the summary that is filled in here: it
   starts as a bitwise copy of the summary of SRC and then gets its own
   copies of the condition vector, size/time entries and hint predicates.

   When DST has a replacement map (dst->clone.tree_map) and IPA parameter
   info is available, the replacements are used as known argument values so
   that predicates known to be false can be pruned from INFO and from the
   outgoing edges of DST.  */
void
inline_summary_t::duplicate (cgraph_node *src,
                             cgraph_node *dst,
                             inline_summary *,
                             inline_summary *info)
{
  inline_summary_alloc ();
  memcpy (info, inline_summaries->get (src), sizeof (inline_summary));
  /* TODO: as an optimization, we may avoid copying conditions
     that are known to be false or true.  */
  info->conds = vec_safe_copy (info->conds);

  /* When there are any replacements in the function body, see if we can figure
     out that something was optimized out.  */
  if (ipa_node_params_sum && dst->clone.tree_map)
    {
      /* ENTRY keeps the size/time vector copied from SRC; info->entry is
         rebuilt from scratch below.  */
      vec<size_time_entry, va_gc> *entry = info->entry;
      /* Use SRC parm info since it may not be copied yet.  */
      struct ipa_node_params *parms_info = IPA_NODE_REF (src);
      vec<tree> known_vals = vNULL;
      int count = ipa_get_param_count (parms_info);
      int i, j;
      clause_t possible_truths;
      struct predicate true_pred = true_predicate ();
      size_time_entry *e;
      int optimized_out_size = 0;
      bool inlined_to_p = false;
      struct cgraph_edge *edge, *next;

      info->entry = 0;
      known_vals.safe_grow_cleared (count);
      /* For every parameter look for a replacement in the clone's tree map;
         the first matching one becomes the known value of the parameter.  */
      for (i = 0; i < count; i++)
        {
          struct ipa_replace_map *r;

          for (j = 0; vec_safe_iterate (dst->clone.tree_map, j, &r); j++)
            {
              if (((!r->old_tree && r->parm_num == i)
                   || (r->old_tree && r->old_tree == ipa_get_param (parms_info, i)))
                   && r->replace_p && !r->ref_p)
                {
                  known_vals[i] = r->new_tree;
                  break;
                }
            }
        }
      possible_truths = evaluate_conditions_for_known_args (dst, false,
                                                            known_vals,
                                                            vNULL);
      known_vals.release ();

      account_size_time (info, 0, 0, &true_pred);

      /* Remap size_time vectors.
         Simplify the predicate by pruning out alternatives that are known
         to be false.
         TODO: as an optimization, we can also eliminate conditions known
         to be true.  */
      for (i = 0; vec_safe_iterate (entry, i, &e); i++)
        {
          struct predicate new_predicate;
          new_predicate = remap_predicate_after_duplication (&e->predicate,
                                                             possible_truths,
                                                             info);
          if (false_predicate_p (&new_predicate))
            optimized_out_size += e->size;
          else
            account_size_time (info, e->size, e->time, &new_predicate);
        }

      /* Remap edge predicates with the same simplification as above.
         Also copy constantness arrays.   */
      for (edge = dst->callees; edge; edge = next)
        {
          struct predicate new_predicate;
          struct inline_edge_summary *es = inline_edge_summary (edge);
          next = edge->next_callee;

          if (!edge->inline_failed)
            inlined_to_p = true;
          if (!es->predicate)
            continue;
          new_predicate = remap_predicate_after_duplication (es->predicate,
                                                             possible_truths,
                                                             info);
          /* Count the call statement as optimized out only when its
             predicate became false through the remapping.  */
          if (false_predicate_p (&new_predicate)
              && !false_predicate_p (es->predicate))
            optimized_out_size += es->call_stmt_size * INLINE_SIZE_SCALE;
          edge_set_predicate (edge, &new_predicate);
        }

      /* Remap indirect edge predicates with the same simplification as above.
         Also copy constantness arrays.   */
      for (edge = dst->indirect_calls; edge; edge = next)
        {
          struct predicate new_predicate;
          struct inline_edge_summary *es = inline_edge_summary (edge);
          next = edge->next_callee;

          gcc_checking_assert (edge->inline_failed);
          if (!es->predicate)
            continue;
          new_predicate = remap_predicate_after_duplication (es->predicate,
                                                             possible_truths,
                                                             info);
          if (false_predicate_p (&new_predicate)
              && !false_predicate_p (es->predicate))
            optimized_out_size += es->call_stmt_size * INLINE_SIZE_SCALE;
          edge_set_predicate (edge, &new_predicate);
        }
      remap_hint_predicate_after_duplication (&info->loop_iterations,
                                              possible_truths, info);
      remap_hint_predicate_after_duplication (&info->loop_stride,
                                              possible_truths, info);
      remap_hint_predicate_after_duplication (&info->array_index,
                                              possible_truths, info);

      /* If inliner or someone after inliner will ever start producing
         non-trivial clones, we will get trouble with lack of information
         about updating self sizes, because size vectors already contains
         sizes of the callees.  */
      gcc_assert (!inlined_to_p || !optimized_out_size);
    }
  else
    {
      /* Plain copy: the pointers copied by memcpy above still refer to data
         of SRC, so give INFO its own entry vector and hint predicates.  */
      info->entry = vec_safe_copy (info->entry);
      if (info->loop_iterations)
        {
          predicate p = *info->loop_iterations;
          info->loop_iterations = NULL;
          set_hint_predicate (&info->loop_iterations, p);
        }
      if (info->loop_stride)
        {
          predicate p = *info->loop_stride;
          info->loop_stride = NULL;
          set_hint_predicate (&info->loop_stride, p);
        }
      if (info->array_index)
        {
          predicate p = *info->array_index;
          info->array_index = NULL;
          set_hint_predicate (&info->array_index, p);
        }
    }
  if (!dst->global.inlined_to)
    inline_update_overall_summary (dst);
}
1278
1279
1280 /* Hook that is called by cgraph.c when a node is duplicated.  */
1281
1282 static void
1283 inline_edge_duplication_hook (struct cgraph_edge *src,
1284                               struct cgraph_edge *dst,
1285                               ATTRIBUTE_UNUSED void *data)
1286 {
1287   struct inline_edge_summary *info;
1288   struct inline_edge_summary *srcinfo;
1289   inline_summary_alloc ();
1290   info = inline_edge_summary (dst);
1291   srcinfo = inline_edge_summary (src);
1292   memcpy (info, srcinfo, sizeof (struct inline_edge_summary));
1293   info->predicate = NULL;
1294   edge_set_predicate (dst, srcinfo->predicate);
1295   info->param = srcinfo->param.copy ();
1296   if (!dst->indirect_unknown_callee && src->indirect_unknown_callee)
1297     {
1298       info->call_stmt_size -= (eni_size_weights.indirect_call_cost
1299                                - eni_size_weights.call_cost);
1300       info->call_stmt_time -= (eni_time_weights.indirect_call_cost
1301                                - eni_time_weights.call_cost);
1302     }
1303 }
1304
1305
/* Keep edge cache consistent across edge removal.  Called for EDGE when it
   is removed: drops its entry from the growth cache, if the cache exists,
   and clears its inline edge summary.  DATA is unused.  */

static void
inline_edge_removal_hook (struct cgraph_edge *edge,
                          void *data ATTRIBUTE_UNUSED)
{
  if (edge_growth_cache.exists ())
    reset_edge_growth_cache (edge);
  reset_inline_edge_summary (edge);
}
1316
1317
/* Initialize growth caches.  The edge growth cache is grown (zero filled) to
   symtab->edges_max_uid elements; nothing is done when that value is 0.  */

void
initialize_growth_caches (void)
{
  if (symtab->edges_max_uid)
    edge_growth_cache.safe_grow_cleared (symtab->edges_max_uid);
}
1326
1327
/* Free growth caches.  After this call edge_growth_cache no longer exists,
   which inline_edge_removal_hook checks before touching it.  */

void
free_growth_caches (void)
{
  edge_growth_cache.release ();
}
1335
1336
1337 /* Dump edge summaries associated to NODE and recursively to all clones.
1338    Indent by INDENT.  */
1339
1340 static void
1341 dump_inline_edge_summary (FILE *f, int indent, struct cgraph_node *node,
1342                           struct inline_summary *info)
1343 {
1344   struct cgraph_edge *edge;
1345   for (edge = node->callees; edge; edge = edge->next_callee)
1346     {
1347       struct inline_edge_summary *es = inline_edge_summary (edge);
1348       struct cgraph_node *callee = edge->callee->ultimate_alias_target ();
1349       int i;
1350
1351       fprintf (f,
1352                "%*s%s/%i %s\n%*s  loop depth:%2i freq:%4i size:%2i"
1353                " time: %2i callee size:%2i stack:%2i",
1354                indent, "", callee->name (), callee->order,
1355                !edge->inline_failed
1356                ? "inlined" : cgraph_inline_failed_string (edge-> inline_failed),
1357                indent, "", es->loop_depth, edge->frequency,
1358                es->call_stmt_size, es->call_stmt_time,
1359                (int) inline_summaries->get (callee)->size / INLINE_SIZE_SCALE,
1360                (int) inline_summaries->get (callee)->estimated_stack_size);
1361
1362       if (es->predicate)
1363         {
1364           fprintf (f, " predicate: ");
1365           dump_predicate (f, info->conds, es->predicate);
1366         }
1367       else
1368         fprintf (f, "\n");
1369       if (es->param.exists ())
1370         for (i = 0; i < (int) es->param.length (); i++)
1371           {
1372             int prob = es->param[i].change_prob;
1373
1374             if (!prob)
1375               fprintf (f, "%*s op%i is compile time invariant\n",
1376                        indent + 2, "", i);
1377             else if (prob != REG_BR_PROB_BASE)
1378               fprintf (f, "%*s op%i change %f%% of time\n", indent + 2, "", i,
1379                        prob * 100.0 / REG_BR_PROB_BASE);
1380           }
1381       if (!edge->inline_failed)
1382         {
1383           fprintf (f, "%*sStack frame offset %i, callee self size %i,"
1384                    " callee size %i\n",
1385                    indent + 2, "",
1386                    (int) inline_summaries->get (callee)->stack_frame_offset,
1387                    (int) inline_summaries->get (callee)->estimated_self_stack_size,
1388                    (int) inline_summaries->get (callee)->estimated_stack_size);
1389           dump_inline_edge_summary (f, indent + 2, callee, info);
1390         }
1391     }
1392   for (edge = node->indirect_calls; edge; edge = edge->next_callee)
1393     {
1394       struct inline_edge_summary *es = inline_edge_summary (edge);
1395       fprintf (f, "%*sindirect call loop depth:%2i freq:%4i size:%2i"
1396                " time: %2i",
1397                indent, "",
1398                es->loop_depth,
1399                edge->frequency, es->call_stmt_size, es->call_stmt_time);
1400       if (es->predicate)
1401         {
1402           fprintf (f, "predicate: ");
1403           dump_predicate (f, info->conds, es->predicate);
1404         }
1405       else
1406         fprintf (f, "\n");
1407     }
1408 }
1409
1410
1411 void
1412 dump_inline_summary (FILE *f, struct cgraph_node *node)
1413 {
1414   if (node->definition)
1415     {
1416       struct inline_summary *s = inline_summaries->get (node);
1417       size_time_entry *e;
1418       int i;
1419       fprintf (f, "Inline summary for %s/%i", node->name (),
1420                node->order);
1421       if (DECL_DISREGARD_INLINE_LIMITS (node->decl))
1422         fprintf (f, " always_inline");
1423       if (s->inlinable)
1424         fprintf (f, " inlinable");
1425       if (s->contains_cilk_spawn)
1426         fprintf (f, " contains_cilk_spawn");
1427       if (s->fp_expressions)
1428         fprintf (f, " fp_expression");
1429       fprintf (f, "\n  self time:       %i\n", s->self_time);
1430       fprintf (f, "  global time:     %i\n", s->time);
1431       fprintf (f, "  self size:       %i\n", s->self_size);
1432       fprintf (f, "  global size:     %i\n", s->size);
1433       fprintf (f, "  min size:       %i\n", s->min_size);
1434       fprintf (f, "  self stack:      %i\n",
1435                (int) s->estimated_self_stack_size);
1436       fprintf (f, "  global stack:    %i\n", (int) s->estimated_stack_size);
1437       if (s->growth)
1438         fprintf (f, "  estimated growth:%i\n", (int) s->growth);
1439       if (s->scc_no)
1440         fprintf (f, "  In SCC:          %i\n", (int) s->scc_no);
1441       for (i = 0; vec_safe_iterate (s->entry, i, &e); i++)
1442         {
1443           fprintf (f, "    size:%f, time:%f, predicate:",
1444                    (double) e->size / INLINE_SIZE_SCALE,
1445                    (double) e->time / INLINE_TIME_SCALE);
1446           dump_predicate (f, s->conds, &e->predicate);
1447         }
1448       if (s->loop_iterations)
1449         {
1450           fprintf (f, "  loop iterations:");
1451           dump_predicate (f, s->conds, s->loop_iterations);
1452         }
1453       if (s->loop_stride)
1454         {
1455           fprintf (f, "  loop stride:");
1456           dump_predicate (f, s->conds, s->loop_stride);
1457         }
1458       if (s->array_index)
1459         {
1460           fprintf (f, "  array index:");
1461           dump_predicate (f, s->conds, s->array_index);
1462         }
1463       fprintf (f, "  calls:\n");
1464       dump_inline_edge_summary (f, 4, node, s);
1465       fprintf (f, "\n");
1466     }
1467 }
1468
/* Dump the inline summary of NODE to stderr.  Marked DEBUG_FUNCTION;
   presumably meant to be called by hand from a debugger.  */

DEBUG_FUNCTION void
debug_inline_summary (struct cgraph_node *node)
{
  dump_inline_summary (stderr, node);
}
1474
1475 void
1476 dump_inline_summaries (FILE *f)
1477 {
1478   struct cgraph_node *node;
1479
1480   FOR_EACH_DEFINED_FUNCTION (node)
1481     if (!node->global.inlined_to)
1482       dump_inline_summary (f, node);
1483 }
1484
1485 /* Give initial reasons why inlining would fail on EDGE.  This gets either
1486    nullified or usually overwritten by more precise reasons later.  */
1487
1488 void
1489 initialize_inline_failed (struct cgraph_edge *e)
1490 {
1491   struct cgraph_node *callee = e->callee;
1492
1493   if (e->inline_failed && e->inline_failed != CIF_BODY_NOT_AVAILABLE
1494       && cgraph_inline_failed_type (e->inline_failed) == CIF_FINAL_ERROR)
1495     ;
1496   else if (e->indirect_unknown_callee)
1497     e->inline_failed = CIF_INDIRECT_UNKNOWN_CALL;
1498   else if (!callee->definition)
1499     e->inline_failed = CIF_BODY_NOT_AVAILABLE;
1500   else if (callee->local.redefined_extern_inline)
1501     e->inline_failed = CIF_REDEFINED_EXTERN_INLINE;
1502   else if (cfun && fn_contains_cilk_spawn_p (cfun))
1503     /* We can't inline if the function is spawing a function.  */
1504     e->inline_failed = CIF_CILK_SPAWN;
1505   else
1506     e->inline_failed = CIF_FUNCTION_NOT_CONSIDERED;
1507   gcc_checking_assert (!e->call_stmt_cannot_inline_p
1508                        || cgraph_inline_failed_type (e->inline_failed)
1509                             == CIF_FINAL_ERROR);
1510 }
1511
1512 /* Callback of walk_aliased_vdefs.  Flags that it has been invoked to the
1513    boolean variable pointed to by DATA.  */
1514
1515 static bool
1516 mark_modified (ao_ref *ao ATTRIBUTE_UNUSED, tree vdef ATTRIBUTE_UNUSED,
1517                void *data)
1518 {
1519   bool *b = (bool *) data;
1520   *b = true;
1521   return true;
1522 }
1523
1524 /* If OP refers to value of function parameter, return the corresponding
1525    parameter.  */
1526
1527 static tree
1528 unmodified_parm_1 (gimple *stmt, tree op)
1529 {
1530   /* SSA_NAME referring to parm default def?  */
1531   if (TREE_CODE (op) == SSA_NAME
1532       && SSA_NAME_IS_DEFAULT_DEF (op)
1533       && TREE_CODE (SSA_NAME_VAR (op)) == PARM_DECL)
1534     return SSA_NAME_VAR (op);
1535   /* Non-SSA parm reference?  */
1536   if (TREE_CODE (op) == PARM_DECL)
1537     {
1538       bool modified = false;
1539
1540       ao_ref refd;
1541       ao_ref_init (&refd, op);
1542       walk_aliased_vdefs (&refd, gimple_vuse (stmt), mark_modified, &modified,
1543                           NULL);
1544       if (!modified)
1545         return op;
1546     }
1547   return NULL_TREE;
1548 }
1549
1550 /* If OP refers to value of function parameter, return the corresponding
1551    parameter.  Also traverse chains of SSA register assignments.  */
1552
1553 static tree
1554 unmodified_parm (gimple *stmt, tree op)
1555 {
1556   tree res = unmodified_parm_1 (stmt, op);
1557   if (res)
1558     return res;
1559
1560   if (TREE_CODE (op) == SSA_NAME
1561       && !SSA_NAME_IS_DEFAULT_DEF (op)
1562       && gimple_assign_single_p (SSA_NAME_DEF_STMT (op)))
1563     return unmodified_parm (SSA_NAME_DEF_STMT (op),
1564                             gimple_assign_rhs1 (SSA_NAME_DEF_STMT (op)));
1565   return NULL_TREE;
1566 }
1567
1568 /* If OP refers to a value of a function parameter or value loaded from an
1569    aggregate passed to a parameter (either by value or reference), return TRUE
1570    and store the number of the parameter to *INDEX_P and information whether
1571    and how it has been loaded from an aggregate into *AGGPOS.  INFO describes
1572    the function parameters, STMT is the statement in which OP is used or
1573    loaded.  */
1574
1575 static bool
1576 unmodified_parm_or_parm_agg_item (struct ipa_func_body_info *fbi,
1577                                   gimple *stmt, tree op, int *index_p,
1578                                   struct agg_position_info *aggpos)
1579 {
1580   tree res = unmodified_parm_1 (stmt, op);
1581
1582   gcc_checking_assert (aggpos);
1583   if (res)
1584     {
1585       *index_p = ipa_get_param_decl_index (fbi->info, res);
1586       if (*index_p < 0)
1587         return false;
1588       aggpos->agg_contents = false;
1589       aggpos->by_ref = false;
1590       return true;
1591     }
1592
1593   if (TREE_CODE (op) == SSA_NAME)
1594     {
1595       if (SSA_NAME_IS_DEFAULT_DEF (op)
1596           || !gimple_assign_single_p (SSA_NAME_DEF_STMT (op)))
1597         return false;
1598       stmt = SSA_NAME_DEF_STMT (op);
1599       op = gimple_assign_rhs1 (stmt);
1600       if (!REFERENCE_CLASS_P (op))
1601         return unmodified_parm_or_parm_agg_item (fbi, stmt, op, index_p,
1602                                                  aggpos);
1603     }
1604
1605   aggpos->agg_contents = true;
1606   return ipa_load_from_parm_agg (fbi, fbi->info->descriptors,
1607                                  stmt, op, index_p, &aggpos->offset,
1608                                  NULL, &aggpos->by_ref);
1609 }
1610
/* See if statement STMT might disappear after inlining.
   0 - means not eliminated
   1 - half of statements goes away
   2 - for sure it is eliminated.
   We are not terribly sophisticated, basically looking for simple abstraction
   penalty wrappers.  Always returns 0 when not optimizing.  */

static int
eliminated_by_inlining_prob (gimple *stmt)
{
  enum gimple_code code = gimple_code (stmt);
  enum tree_code rhs_code;

  if (!optimize)
    return 0;

  switch (code)
    {
    case GIMPLE_RETURN:
      return 2;
    case GIMPLE_ASSIGN:
      /* Only assignments with two operands (LHS and one RHS operand) are
         considered.  */
      if (gimple_num_ops (stmt) != 2)
        return 0;

      rhs_code = gimple_assign_rhs_code (stmt);

      /* Casts of parameters, loads from parameters passed by reference
         and stores to return value or parameters are often free after
         inlining due to SRA and further combining.
         Assume that half of statements goes away.  */
      if (CONVERT_EXPR_CODE_P (rhs_code)
          || rhs_code == VIEW_CONVERT_EXPR
          || rhs_code == ADDR_EXPR
          || gimple_assign_rhs_class (stmt) == GIMPLE_SINGLE_RHS)
        {
          tree rhs = gimple_assign_rhs1 (stmt);
          tree lhs = gimple_assign_lhs (stmt);
          tree inner_rhs = get_base_address (rhs);
          tree inner_lhs = get_base_address (lhs);
          bool rhs_free = false;
          bool lhs_free = false;

          /* Fall back to the operands themselves when no base address
             was found.  */
          if (!inner_rhs)
            inner_rhs = rhs;
          if (!inner_lhs)
            inner_lhs = lhs;

          /* Reads of parameter are expected to be free.  */
          if (unmodified_parm (stmt, inner_rhs))
            rhs_free = true;
          /* Match expressions of form &this->field. Those will most likely
             combine with something upstream after inlining.  */
          else if (TREE_CODE (inner_rhs) == ADDR_EXPR)
            {
              tree op = get_base_address (TREE_OPERAND (inner_rhs, 0));
              if (TREE_CODE (op) == PARM_DECL)
                rhs_free = true;
              else if (TREE_CODE (op) == MEM_REF
                       && unmodified_parm (stmt, TREE_OPERAND (op, 0)))
                rhs_free = true;
            }

          /* When parameter is not SSA register because its address is taken
             and it is just copied into one, the statement will be completely
             free after inlining (we will copy propagate backward).   */
          if (rhs_free && is_gimple_reg (lhs))
            return 2;

          /* Reads of parameters passed by reference
             expected to be free (i.e. optimized out after inlining).  */
          if (TREE_CODE (inner_rhs) == MEM_REF
              && unmodified_parm (stmt, TREE_OPERAND (inner_rhs, 0)))
            rhs_free = true;

          /* Copying parameter passed by reference into gimple register is
             probably also going to copy propagate, but we can't be quite
             sure.  */
          if (rhs_free && is_gimple_reg (lhs))
            lhs_free = true;

          /* Writes to parameters, parameters passed by value and return value
             (either directly or passed via invisible reference) are free.

             TODO: We ought to handle testcase like
             struct a {int a,b;};
             struct a
             returnstruct (void)
             {
             struct a a ={1,2};
             return a;
             }

             This translate into:

             returnstruct ()
             {
             int a$b;
             int a$a;
             struct a a;
             struct a D.2739;

             <bb 2>:
             D.2739.a = 1;
             D.2739.b = 2;
             return D.2739;

             }
             For that we either need to copy ipa-split logic detecting writes
             to return value.  */
          if (TREE_CODE (inner_lhs) == PARM_DECL
              || TREE_CODE (inner_lhs) == RESULT_DECL
              || (TREE_CODE (inner_lhs) == MEM_REF
                  && (unmodified_parm (stmt, TREE_OPERAND (inner_lhs, 0))
                      || (TREE_CODE (TREE_OPERAND (inner_lhs, 0)) == SSA_NAME
                          && SSA_NAME_VAR (TREE_OPERAND (inner_lhs, 0))
                          && TREE_CODE (SSA_NAME_VAR (TREE_OPERAND
                                                      (inner_lhs,
                                                       0))) == RESULT_DECL))))
            lhs_free = true;
          /* Storing a register or an invariant into a free destination makes
             the source side free as well.  */
          if (lhs_free
              && (is_gimple_reg (rhs) || is_gimple_min_invariant (rhs)))
            rhs_free = true;
          if (lhs_free && rhs_free)
            return 1;
        }
      return 0;
    default:
      return 0;
    }
}
1741
1742
1743 /* If BB ends with a GIMPLE_COND that we can turn into predicates, attach the
1744    corresponding predicates to the outgoing CFG edges of BB.

        Only conditions whose right-hand side satisfies is_gimple_ip_invariant
        are considered.  Two shapes are handled:

          1) The left-hand side is accepted by unmodified_parm_or_parm_agg_item.
             Every successor edge then gets the condition built from the
             comparison code of the GIMPLE_COND, or from its inversion for
             edges that do not carry EDGE_TRUE_VALUE.  No predicate is attached
             to an edge whose code turns out to be ERROR_MARK.
          2) The condition has the form "op != 0" where OP is an SSA name set by
             a one-argument __builtin_constant_p call whose argument is accepted
             by unmodified_parm_or_parm_agg_item.  The EDGE_FALSE_VALUE edge
             then gets an IS_NOT_CONSTANT condition.

        Conditions are recorded in SUMMARY through add_condition; each predicate
        is allocated from edge_predicate_pool and stored in the AUX field of its
        edge.  FBI is only handed on to unmodified_parm_or_parm_agg_item.  */
1745
1746 static void
1747 set_cond_stmt_execution_predicate (struct ipa_func_body_info *fbi,
1748                                    struct inline_summary *summary,
1749                                    basic_block bb)
1750 {
1751   gimple *last;
1752   tree op;
1753   int index;
1754   struct agg_position_info aggpos;
1755   enum tree_code code, inverted_code;
1756   edge e;
1757   edge_iterator ei;
1758   gimple *set_stmt;
1759   tree op2;
1760
1761   last = last_stmt (bb);
1762   if (!last || gimple_code (last) != GIMPLE_COND)
1763     return;
1764   if (!is_gimple_ip_invariant (gimple_cond_rhs (last)))
1765     return;
1766   op = gimple_cond_lhs (last);
1767   /* TODO: handle conditionals like
1768      var = op0 < 4;
1769      if (var != 0).  */
1770   if (unmodified_parm_or_parm_agg_item (fbi, last, op, &index, &aggpos))
1771     {
1772       code = gimple_cond_code (last);
1773       inverted_code = invert_tree_comparison (code, HONOR_NANS (op));
1774
1775       FOR_EACH_EDGE (e, ei, bb->succs)
1776         {
1777           enum tree_code this_code = (e->flags & EDGE_TRUE_VALUE
1778                                       ? code : inverted_code);
1779           /* invert_tree_comparison will return ERROR_MARK on FP
1780              comparisons that are not EQ/NE instead of returning the proper
1781              unordered one.  Be sure it is not confused with NON_CONSTANT.  */
1782           if (this_code != ERROR_MARK)
1783             {
1784               struct predicate p = add_condition
1785                  (summary, index, &aggpos, this_code,
1786                   unshare_expr_without_location (gimple_cond_rhs (last)));
1787               e->aux = edge_predicate_pool.allocate ();
1788               *(struct predicate *) e->aux = p;
1789             }
1790         }
1791     }
1792
1793   if (TREE_CODE (op) != SSA_NAME)
1794     return;
1795   /* Special case
1796      if (builtin_constant_p (op))
1797      constant_code
1798      else
1799      nonconstant_code.
1800      Here we can predicate nonconstant_code.  We can't
1801      really handle constant_code since we have no predicate
1802      for this and also the constant code is not known to be
1803      optimized away when the inliner doesn't see that the operand is
1804      constant.  Other optimizers might think otherwise.  */
1805   if (gimple_cond_code (last) != NE_EXPR
1806       || !integer_zerop (gimple_cond_rhs (last)))
1807     return;
1808   set_stmt = SSA_NAME_DEF_STMT (op);
1809   if (!gimple_call_builtin_p (set_stmt, BUILT_IN_CONSTANT_P)
1810       || gimple_call_num_args (set_stmt) != 1)
1811     return;
1812   op2 = gimple_call_arg (set_stmt, 0);
1813   if (!unmodified_parm_or_parm_agg_item (fbi, set_stmt, op2, &index, &aggpos))
1814     return;
       /* Only the false edge (the nonconstant_code path above) is predicated.  */
1815   FOR_EACH_EDGE (e, ei, bb->succs) if (e->flags & EDGE_FALSE_VALUE)
1816     {
1817       struct predicate p = add_condition (summary, index, &aggpos,
1818                                           IS_NOT_CONSTANT, NULL_TREE);
1819       e->aux = edge_predicate_pool.allocate ();
1820       *(struct predicate *) e->aux = p;
1821     }
1822 }
1823
1824
1825 /* If BB ends with a GIMPLE_SWITCH that we can turn into predicates, attach the
1826    corresponding predicates to the outgoing CFG edges of BB.

        Nothing is done unless the switch index is accepted by
        unmodified_parm_or_parm_agg_item.  Otherwise every successor edge first
        gets a false predicate in its AUX field, and then each case label ORs
        its own predicate into the edge leading to the label's block:
          - a label with neither CASE_LOW nor CASE_HIGH (the default)
            contributes the true predicate;
          - a label with only CASE_LOW contributes "index == low";
          - a label with both contributes "index >= low && index <= high".

        Conditions are recorded in SUMMARY; FBI is only handed on to
        unmodified_parm_or_parm_agg_item.  */
1827
1828 static void
1829 set_switch_stmt_execution_predicate (struct ipa_func_body_info *fbi,
1830                                      struct inline_summary *summary,
1831                                      basic_block bb)
1832 {
1833   gimple *lastg;
1834   tree op;
1835   int index;
1836   struct agg_position_info aggpos;
1837   edge e;
1838   edge_iterator ei;
1839   size_t n;
1840   size_t case_idx;
1841
1842   lastg = last_stmt (bb);
1843   if (!lastg || gimple_code (lastg) != GIMPLE_SWITCH)
1844     return;
1845   gswitch *last = as_a <gswitch *> (lastg);
1846   op = gimple_switch_index (last);
1847   if (!unmodified_parm_or_parm_agg_item (fbi, last, op, &index, &aggpos))
1848     return;
1849
       /* Start every outgoing edge at "never taken"; the labels below OR in
          the conditions under which each edge is taken.  */
1850   FOR_EACH_EDGE (e, ei, bb->succs)
1851     {
1852       e->aux = edge_predicate_pool.allocate ();
1853       *(struct predicate *) e->aux = false_predicate ();
1854     }
1855   n = gimple_switch_num_labels (last);
1856   for (case_idx = 0; case_idx < n; ++case_idx)
1857     {
1858       tree cl = gimple_switch_label (last, case_idx);
1859       tree min, max;
1860       struct predicate p;
1861
1862       e = find_edge (bb, label_to_block (CASE_LABEL (cl)));
1863       min = CASE_LOW (cl);
1864       max = CASE_HIGH (cl);
1865
1866       /* For the default label we might want to construct a predicate saying
1867          that none of the cases is met, but that is a bit hard to do without
1868          having negations of conditionals handy.  */
1869       if (!min && !max)
1870         p = true_predicate ();
1871       else if (!max)
1872         p = add_condition (summary, index, &aggpos, EQ_EXPR,
1873                            unshare_expr_without_location (min));
1874       else
1875         {
1876           struct predicate p1, p2;
1877           p1 = add_condition (summary, index, &aggpos, GE_EXPR,
1878                               unshare_expr_without_location (min));
1879           p2 = add_condition (summary, index, &aggpos, LE_EXPR,
1880                               unshare_expr_without_location (max));
1881           p = and_predicates (summary->conds, &p1, &p2);
1882         }
           /* Several labels may lead to the same edge, hence OR rather than
              assignment.  */
1883       *(struct predicate *) e->aux
1884         = or_predicates (summary->conds, &p, (struct predicate *) e->aux);
1885     }
1886 }
1887
1888
1889 /* For each BB in NODE attach to its AUX pointer the predicate under
1890    which it is executable.

        First the edge predicates are computed by
        set_cond_stmt_execution_predicate and
        set_switch_stmt_execution_predicate (FBI and SUMMARY are handed on to
        them).  The entry block gets the true predicate.  Then the block
        predicates are iterated until nothing changes: the predicate of a block
        is the OR, over its incoming edges whose source already has a
        predicate, of the source predicate ANDed with the edge predicate (when
        the edge has one).  Blocks for which this yields the false predicate
        keep a NULL AUX.  */
1891
1892 static void
1893 compute_bb_predicates (struct ipa_func_body_info *fbi,
1894                        struct cgraph_node *node,
1895                        struct inline_summary *summary)
1896 {
1897   struct function *my_function = DECL_STRUCT_FUNCTION (node->decl);
1898   bool done = false;
1899   basic_block bb;
1900
1901   FOR_EACH_BB_FN (bb, my_function)
1902     {
1903       set_cond_stmt_execution_predicate (fbi, summary, bb);
1904       set_switch_stmt_execution_predicate (fbi, summary, bb);
1905     }
1906
1907   /* Entry block is always executable.  */
1908   ENTRY_BLOCK_PTR_FOR_FN (my_function)->aux
1909     = edge_predicate_pool.allocate ();
1910   *(struct predicate *) ENTRY_BLOCK_PTR_FOR_FN (my_function)->aux
1911     = true_predicate ();
1912
1913   /* A simple dataflow propagation of predicates forward in the CFG.
1914      TODO: work in reverse postorder.  */
1915   while (!done)
1916     {
1917       done = true;
1918       FOR_EACH_BB_FN (bb, my_function)
1919         {
1920           struct predicate p = false_predicate ();
1921           edge e;
1922           edge_iterator ei;
1923           FOR_EACH_EDGE (e, ei, bb->preds)
1924             {
                   /* Predecessors without a predicate so far contribute
                      nothing in this round.  */
1925               if (e->src->aux)
1926                 {
1927                   struct predicate this_bb_predicate
1928                     = *(struct predicate *) e->src->aux;
1929                   if (e->aux)
1930                     this_bb_predicate
1931                       = and_predicates (summary->conds, &this_bb_predicate,
1932                                         (struct predicate *) e->aux);
1933                   p = or_predicates (summary->conds, &p, &this_bb_predicate);
                       /* Once the predicate is true, further edges cannot
                          change it.  */
1934                   if (true_predicate_p (&p))
1935                     break;
1936                 }
1937             }
1938           if (false_predicate_p (&p))
1939             gcc_assert (!bb->aux);
1940           else
1941             {
1942               if (!bb->aux)
1943                 {
1944                   done = false;
1945                   bb->aux = edge_predicate_pool.allocate ();
1946                   *((struct predicate *) bb->aux) = p;
1947                 }
1948               else if (!predicates_equal_p (&p, (struct predicate *) bb->aux))
1949                 {
1950                   /* This OR operation is needed to ensure monotonic data flow
1951                      in the case we hit the limit on the number of clauses and
1952                      the and/or operations above give approximate answers.  */
1953                   p = or_predicates (summary->conds, &p, (struct predicate *)bb->aux);
1954                   if (!predicates_equal_p (&p, (struct predicate *) bb->aux))
1955                     {
1956                       done = false;
1957                       *((struct predicate *) bb->aux) = p;
1958                     }
1959                 }
1960             }
1961         }
1962     }
1963 }
1964
1965
1966 /* We keep info about constantness of SSA names.  predicate_t is the element
        type of the NONCONSTANT_NAMES vectors used by the functions below, which
        index them by SSA_NAME_VERSION.  */
1967
1968 typedef struct predicate predicate_t;
1969 /* Return predicate specifying when the expression EXPR might have a result
1970    that is not a compile time constant.

        Unary operations are looked through first.  Then:
          - an expression that unmodified_parm maps to a parameter with a
            non-negative index in INFO yields a CHANGED condition on that
            parameter (recorded in SUMMARY);
          - an expression satisfying is_gimple_min_invariant yields the false
            predicate;
          - an SSA name yields its entry in NONCONSTANT_NAMES;
          - binary and comparison expressions yield the OR of the predicates of
            both operands, a COND_EXPR the OR of the predicates of all three.
        Any other expression is dumped with debug_tree and hits
        gcc_unreachable.  */
1971
1972 static struct predicate
1973 will_be_nonconstant_expr_predicate (struct ipa_node_params *info,
1974                                     struct inline_summary *summary,
1975                                     tree expr,
1976                                     vec<predicate_t> nonconstant_names)
1977 {
1978   tree parm;
1979   int index;
1980
1981   while (UNARY_CLASS_P (expr))
1982     expr = TREE_OPERAND (expr, 0);
1983
1984   parm = unmodified_parm (NULL, expr);
1985   if (parm && (index = ipa_get_param_decl_index (info, parm)) >= 0)
1986     return add_condition (summary, index, NULL, CHANGED, NULL_TREE);
1987   if (is_gimple_min_invariant (expr))
1988     return false_predicate ();
1989   if (TREE_CODE (expr) == SSA_NAME)
1990     return nonconstant_names[SSA_NAME_VERSION (expr)];
1991   if (BINARY_CLASS_P (expr) || COMPARISON_CLASS_P (expr))
1992     {
1993       struct predicate p1 = will_be_nonconstant_expr_predicate
1994         (info, summary, TREE_OPERAND (expr, 0),
1995          nonconstant_names);
1996       struct predicate p2;
           /* The OR with a true predicate is true; skip the second operand.  */
1997       if (true_predicate_p (&p1))
1998         return p1;
1999       p2 = will_be_nonconstant_expr_predicate (info, summary,
2000                                                TREE_OPERAND (expr, 1),
2001                                                nonconstant_names);
2002       return or_predicates (summary->conds, &p1, &p2);
2003     }
2004   else if (TREE_CODE (expr) == COND_EXPR)
2005     {
2006       struct predicate p1 = will_be_nonconstant_expr_predicate
2007         (info, summary, TREE_OPERAND (expr, 0),
2008          nonconstant_names);
2009       struct predicate p2;
2010       if (true_predicate_p (&p1))
2011         return p1;
2012       p2 = will_be_nonconstant_expr_predicate (info, summary,
2013                                                TREE_OPERAND (expr, 1),
2014                                                nonconstant_names);
2015       if (true_predicate_p (&p2))
2016         return p2;
2017       p1 = or_predicates (summary->conds, &p1, &p2);
2018       p2 = will_be_nonconstant_expr_predicate (info, summary,
2019                                                TREE_OPERAND (expr, 2),
2020                                                nonconstant_names);
2021       return or_predicates (summary->conds, &p1, &p2);
2022     }
2023   else
2024     {
2025       debug_tree (expr);
2026       gcc_unreachable ();
2027     }
2028   return false_predicate ();
2029 }
2030
2031
2032 /* Return predicate specifying when the STMT might have result that is not
2033    a compile time constant.

        The true predicate is returned when
          - STMT is not an assignment, a condition, a switch or a call with
            ECF_CONST set in its call flags,
          - STMT is a store,
          - STMT is a load whose source is not accepted by
            unmodified_parm_or_parm_agg_item, or
          - some SSA use operand of STMT is neither a parameter with a
            non-negative index in FBI->info nor an SSA name whose entry in
            NONCONSTANT_NAMES differs from the true predicate.

        Otherwise the result is the OR of: for a load, the CHANGED condition on
        the loaded parameter (or aggregate position); for every other parameter
        used, a CHANGED condition on it; and for every remaining SSA use, its
        entry in NONCONSTANT_NAMES.  Conditions are recorded in SUMMARY.  When
        STMT is an assignment or a call whose first operand is an SSA name, the
        result is also stored in NONCONSTANT_NAMES for that name.  */
2034
2035 static struct predicate
2036 will_be_nonconstant_predicate (struct ipa_func_body_info *fbi,
2037                                struct inline_summary *summary,
2038                                gimple *stmt,
2039                                vec<predicate_t> nonconstant_names)
2040 {
2041   struct predicate p = true_predicate ();
2042   ssa_op_iter iter;
2043   tree use;
2044   struct predicate op_non_const;
2045   bool is_load;
2046   int base_index;
2047   struct agg_position_info aggpos;
2048
2049   /* What statements might be optimized away
2050      when their arguments are constant.  */
2051   if (gimple_code (stmt) != GIMPLE_ASSIGN
2052       && gimple_code (stmt) != GIMPLE_COND
2053       && gimple_code (stmt) != GIMPLE_SWITCH
2054       && (gimple_code (stmt) != GIMPLE_CALL
2055           || !(gimple_call_flags (stmt) & ECF_CONST)))
2056     return p;
2057
2058   /* Stores will stay anyway.  */
2059   if (gimple_store_p (stmt))
2060     return p;
2061
2062   is_load = gimple_assign_load_p (stmt);
2063
2064   /* Loads can be optimized when the value is known.  */
2065   if (is_load)
2066     {
2067       tree op;
2068       gcc_assert (gimple_assign_single_p (stmt));
2069       op = gimple_assign_rhs1 (stmt);
2070       if (!unmodified_parm_or_parm_agg_item (fbi, stmt, op, &base_index,
2071                                              &aggpos))
2072         return p;
2073     }
2074   else
2075     base_index = -1;
2076
2077   /* See if we understand all operands before we start
2078      adding conditionals.  */
2079   FOR_EACH_SSA_TREE_OPERAND (use, stmt, iter, SSA_OP_USE)
2080     {
2081       tree parm = unmodified_parm (stmt, use);
2082       /* For arguments we can build a condition.  */
2083       if (parm && ipa_get_param_decl_index (fbi->info, parm) >= 0)
2084         continue;
2085       if (TREE_CODE (use) != SSA_NAME)
2086         return p;
2087       /* If we know when operand is constant,
2088          we still can say something useful.  */
2089       if (!true_predicate_p (&nonconstant_names[SSA_NAME_VERSION (use)]))
2090         continue;
2091       return p;
2092     }
2093
2094   if (is_load)
2095     op_non_const =
2096       add_condition (summary, base_index, &aggpos, CHANGED, NULL);
2097   else
2098     op_non_const = false_predicate ();
2099   FOR_EACH_SSA_TREE_OPERAND (use, stmt, iter, SSA_OP_USE)
2100     {
2101       tree parm = unmodified_parm (stmt, use);
2102       int index;
2103
2104       if (parm && (index = ipa_get_param_decl_index (fbi->info, parm)) >= 0)
2105         {
               /* The parameter a load is based on is already covered by the
                  condition OP_NON_CONST was initialized with.  */
2106           if (index != base_index)
2107             p = add_condition (summary, index, NULL, CHANGED, NULL_TREE);
2108           else
2109             continue;
2110         }
2111       else
2112         p = nonconstant_names[SSA_NAME_VERSION (use)];
2113       op_non_const = or_predicates (summary->conds, &p, &op_non_const);
2114     }
       /* Remember the predicate for the SSA name defined by STMT, if any.  */
2115   if ((gimple_code (stmt) == GIMPLE_ASSIGN || gimple_code (stmt) == GIMPLE_CALL)
2116       && gimple_op (stmt, 0)
2117       && TREE_CODE (gimple_op (stmt, 0)) == SSA_NAME)
2118     nonconstant_names[SSA_NAME_VERSION (gimple_op (stmt, 0))]
2119       = op_non_const;
2120   return op_non_const;
2121 }
2122
2123 struct record_modified_bb_info
2124 {
       /* Data handed to the record_modified callback.  BB_SET collects the
          indexes of the basic blocks recorded by the callback.  */
2125   bitmap bb_set;
       /* Statement whose own virtual definition the callback ignores.  */
2126   gimple *stmt;
2127 };
2128
2129 /* Callback of walk_aliased_vdefs.  Records basic blocks where the value may be
2130    set except for info->stmt.

        DATA points to a record_modified_bb_info.  Unless VDEF is defined by
        info->stmt, the index of the block containing the definition of VDEF is
        set in info->bb_set; for a default definition the index of the entry
        block of cfun is used instead.  AO is unused.  Always returns false
        (NOTE(review): presumably this keeps the walk going; confirm against
        walk_aliased_vdefs).  */
2131
2132 static bool
2133 record_modified (ao_ref *ao ATTRIBUTE_UNUSED, tree vdef, void *data)
2134 {
2135   struct record_modified_bb_info *info =
2136     (struct record_modified_bb_info *) data;
2137   if (SSA_NAME_DEF_STMT (vdef) == info->stmt)
2138     return false;
2139   bitmap_set_bit (info->bb_set,
2140                   SSA_NAME_IS_DEFAULT_DEF (vdef)
2141                   ? ENTRY_BLOCK_PTR_FOR_FN (cfun)->index
2142                   : gimple_bb (SSA_NAME_DEF_STMT (vdef))->index);
2143   return false;
2144 }
2145
2146 /* Return probability (based on REG_BR_PROB_BASE) that the I-th argument of
2147    the call STMT will change since the last invocation of STMT.
2148
2149    Value 0 is reserved for compile time invariants.
2150    For common parameters it is REG_BR_PROB_BASE.  For loop invariants it
2151    ought to be REG_BR_PROB_BASE / estimated_iters.

        The estimate compares block frequencies: when the block of STMT is
        executed more often than the block(s) where the argument may be set,
        the ratio of the two frequencies (scaled by GCOV_COMPUTE_SCALE, but at
        least 1) is returned; otherwise REG_BR_PROB_BASE.  */
2152
2153 static int
2154 param_change_prob (gimple *stmt, int i)
2155 {
2156   tree op = gimple_call_arg (stmt, i);
2157   basic_block bb = gimple_bb (stmt);
2158   tree base;
2159
2160   /* Global invariants never change.  */
2161   if (is_gimple_min_invariant (op))
2162     return 0;
2163   /* We would have to do non-trivial analysis to really work out what
2164      is the probability of value to change (i.e. when init statement
2165      is in a sibling loop of the call).
2166
2167      We do a conservative estimate: when call is executed N times more often
2168      than the statement defining value, we take the frequency 1/N.  */
2169   if (TREE_CODE (op) == SSA_NAME)
2170     {
2171       int init_freq;
2172
2173       if (!bb->frequency)
2174         return REG_BR_PROB_BASE;
2175
2176       if (SSA_NAME_IS_DEFAULT_DEF (op))
2177         init_freq = ENTRY_BLOCK_PTR_FOR_FN (cfun)->frequency;
2178       else
2179         init_freq = gimple_bb (SSA_NAME_DEF_STMT (op))->frequency;
2180
           /* A zero frequency is bumped to 1 so that the scaled result below
              is computed from a nonzero value.  */
2181       if (!init_freq)
2182         init_freq = 1;
2183       if (init_freq < bb->frequency)
2184         return MAX (GCOV_COMPUTE_SCALE (init_freq, bb->frequency), 1);
2185       else
2186         return REG_BR_PROB_BASE;
2187     }
2188
       /* OP is neither an invariant nor an SSA name; look at the object it
          is based on.  */
2189   base = get_base_address (op);
2190   if (base)
2191     {
2192       ao_ref refd;
2193       int max;
2194       struct record_modified_bb_info info;
2195       bitmap_iterator bi;
2196       unsigned index;
2197       tree init = ctor_for_folding (base);
2198
           /* Anything but error_mark_node from ctor_for_folding is treated
              as a compile time invariant.  */
2199       if (init != error_mark_node)
2200         return 0;
2201       if (!bb->frequency)
2202         return REG_BR_PROB_BASE;
2203       ao_ref_init (&refd, op);
2204       info.stmt = stmt;
2205       info.bb_set = BITMAP_ALLOC (NULL);
2206       walk_aliased_vdefs (&refd, gimple_vuse (stmt), record_modified, &info,
2207                           NULL);
           /* The value may be set in the very block of the call.  */
2208       if (bitmap_bit_p (info.bb_set, bb->index))
2209         {
2210           BITMAP_FREE (info.bb_set);
2211           return REG_BR_PROB_BASE;
2212         }
2213
2214       /* Assume that every memory is initialized at entry.
2215          TODO: Can we easily determine if value is always defined
2216          and thus we may skip entry block?  */
2217       if (ENTRY_BLOCK_PTR_FOR_FN (cfun)->frequency)
2218         max = ENTRY_BLOCK_PTR_FOR_FN (cfun)->frequency;
2219       else
2220         max = 1;
2221
           /* Despite its name, MAX ends up holding the smallest frequency
              among the entry block and the recorded blocks.  */
2222       EXECUTE_IF_SET_IN_BITMAP (info.bb_set, 0, index, bi)
2223         max = MIN (max, BASIC_BLOCK_FOR_FN (cfun, index)->frequency);
2224
2225       BITMAP_FREE (info.bb_set);
2226       if (max < bb->frequency)
2227         return MAX (GCOV_COMPUTE_SCALE (max, bb->frequency), 1);
2228       else
2229         return REG_BR_PROB_BASE;
2230     }
2231   return REG_BR_PROB_BASE;
2232 }
2233
2234 /* Find whether a basic block BB is the final block of a (half) diamond CFG
2235    sub-graph and if the predicate the condition depends on is known.  If so,
2236    return true and store the predicate in *P.

        A BB with a single predecessor is accepted right away with the false
        predicate.  Otherwise every predecessor of BB must either be one common
        block, or have a single successor and a single predecessor that is that
        common block.  The common block must end with a GIMPLE_COND whose
        right-hand side satisfies is_gimple_ip_invariant.  *P is then computed
        by will_be_nonconstant_expr_predicate (to which INFO, SUMMARY and
        NONCONSTANT_NAMES are handed on) from the left-hand side of that
        condition; when the result is the true predicate, false is returned
        although *P has been overwritten.  */
2237
2238 static bool
2239 phi_result_unknown_predicate (struct ipa_node_params *info,
2240                               inline_summary *summary, basic_block bb,
2241                               struct predicate *p,
2242                               vec<predicate_t> nonconstant_names)
2243 {
2244   edge e;
2245   edge_iterator ei;
2246   basic_block first_bb = NULL;
2247   gimple *stmt;
2248
2249   if (single_pred_p (bb))
2250     {
2251       *p = false_predicate ();
2252       return true;
2253     }
2254
2255   FOR_EACH_EDGE (e, ei, bb->preds)
2256     {
           /* A predecessor with a single successor is an arm of the diamond;
              the block above it must be the common block.  */
2257       if (single_succ_p (e->src))
2258         {
2259           if (!single_pred_p (e->src))
2260             return false;
2261           if (!first_bb)
2262             first_bb = single_pred (e->src);
2263           else if (single_pred (e->src) != first_bb)
2264             return false;
2265         }
           /* Otherwise the predecessor itself must be the common block.  */
2266       else
2267         {
2268           if (!first_bb)
2269             first_bb = e->src;
2270           else if (e->src != first_bb)
2271             return false;
2272         }
2273     }
2274
2275   if (!first_bb)
2276     return false;
2277
2278   stmt = last_stmt (first_bb);
2279   if (!stmt
2280       || gimple_code (stmt) != GIMPLE_COND
2281       || !is_gimple_ip_invariant (gimple_cond_rhs (stmt)))
2282     return false;
2283
2284   *p = will_be_nonconstant_expr_predicate (info, summary,
2285                                            gimple_cond_lhs (stmt),
2286                                            nonconstant_names);
2287   if (true_predicate_p (p))
2288     return false;
2289   else
2290     return true;
2291 }
2292
2293 /* Given a PHI statement in a function described by inline properties SUMMARY
2294    and *P being the predicate describing whether the selected PHI argument is
2295    known, store a predicate for the result of the PHI statement into
2296    NONCONSTANT_NAMES, if possible.

        *P is updated in place: the NONCONSTANT_NAMES entry of every PHI
        argument that does not satisfy is_gimple_min_invariant is ORed into it.
        If *P becomes the true predicate the function returns early and leaves
        NONCONSTANT_NAMES untouched.  */
2297
2298 static void
2299 predicate_for_phi_result (struct inline_summary *summary, gphi *phi,
2300                           struct predicate *p,
2301                           vec<predicate_t> nonconstant_names)
2302 {
2303   unsigned i;
2304
2305   for (i = 0; i < gimple_phi_num_args (phi); i++)
2306     {
2307       tree arg = gimple_phi_arg (phi, i)->def;
2308       if (!is_gimple_min_invariant (arg))
2309         {
2310           gcc_assert (TREE_CODE (arg) == SSA_NAME);
2311           *p = or_predicates (summary->conds, p,
2312                               &nonconstant_names[SSA_NAME_VERSION (arg)]);
2313           if (true_predicate_p (p))
2314             return;
2315         }
2316     }
2317
2318   if (dump_file && (dump_flags & TDF_DETAILS))
2319     {
2320       fprintf (dump_file, "\t\tphi predicate: ");
2321       dump_predicate (dump_file, summary->conds, p);
2322     }
2323   nonconstant_names[SSA_NAME_VERSION (gimple_phi_result (phi))] = *p;
2324 }
2325
2326 /* Return predicate specifying when array index in access OP becomes non-constant.

        OP is walked down through its handled components; for every ARRAY_REF
        or ARRAY_RANGE_REF whose index operand is an SSA name, the entry of that
        name in NONCONSTANT_NAMES is ORed into the result (using INFO->conds).
        The false predicate is returned when no such index is found.  */
2327
2328 static struct predicate
2329 array_index_predicate (inline_summary *info,
2330                        vec< predicate_t> nonconstant_names, tree op)
2331 {
2332   struct predicate p = false_predicate ();
2333   while (handled_component_p (op))
2334     {
2335       if (TREE_CODE (op) == ARRAY_REF || TREE_CODE (op) == ARRAY_RANGE_REF)
2336         {
2337           if (TREE_CODE (TREE_OPERAND (op, 1)) == SSA_NAME)
2338             p = or_predicates (info->conds, &p,
2339                                &nonconstant_names[SSA_NAME_VERSION
2340                                                   (TREE_OPERAND (op, 1))]);
2341         }
2342       op = TREE_OPERAND (op, 0);
2343     }
2344   return p;
2345 }
2346
2347 /* For a typical usage of __builtin_expect (a<b, 1), we
2348    may introduce an extra relation stmt:
2349    With the builtin, we have
2350      t1 = a <= b;
2351      t2 = (long int) t1;
2352      t3 = __builtin_expect (t2, 1);
2353      if (t3 != 0)
2354        goto ...
2355    Without the builtin, we have
2356      if (a<=b)
2357        goto...
2358    This affects the size/time estimation and may have
2359    an impact on the earlier inlining.
2360    Here find this pattern and fix it up later.

        BB is scanned for a call to BUILT_IN_EXPECT or the internal function
        IFN_BUILTIN_EXPECT whose first argument is, possibly through a chain of
        conversions, the result of a comparison.  If the result of such a call
        has a single immediate use and that use is a GIMPLE_COND, that
        GIMPLE_COND is returned.  NULL is returned when BB contains no such
        pattern.  */
2361
2362 static gimple *
2363 find_foldable_builtin_expect (basic_block bb)
2364 {
2365   gimple_stmt_iterator bsi;
2366
2367   for (bsi = gsi_start_bb (bb); !gsi_end_p (bsi); gsi_next (&bsi))
2368     {
2369       gimple *stmt = gsi_stmt (bsi);
2370       if (gimple_call_builtin_p (stmt, BUILT_IN_EXPECT)
2371           || (is_gimple_call (stmt)
2372               && gimple_call_internal_p (stmt)
2373               && gimple_call_internal_fn (stmt) == IFN_BUILTIN_EXPECT))
2374         {
2375           tree var = gimple_call_lhs (stmt);
2376           tree arg = gimple_call_arg (stmt, 0);
2377           use_operand_p use_p;
2378           gimple *use_stmt;
2379           bool match = false;
2380           bool done = false;
2381
2382           if (!var || !arg)
2383             continue;
2384           gcc_assert (TREE_CODE (var) == SSA_NAME);
2385
               /* Follow the definition chain of ARG: conversions are looked
                  through, a comparison is a match, anything else ends the
                  search.  */
2386           while (TREE_CODE (arg) == SSA_NAME)
2387             {
2388               gimple *stmt_tmp = SSA_NAME_DEF_STMT (arg);
2389               if (!is_gimple_assign (stmt_tmp))
2390                 break;
2391               switch (gimple_assign_rhs_code (stmt_tmp))
2392                 {
2393                   case LT_EXPR:
2394                   case LE_EXPR:
2395                   case GT_EXPR:
2396                   case GE_EXPR:
2397                   case EQ_EXPR:
2398                   case NE_EXPR:
2399                     match = true;
2400                     done = true;
2401                     break;
2402                   CASE_CONVERT:
2403                     break;
2404                   default:
2405                     done = true;
2406                     break;
2407                 }
2408               if (done)
2409                 break;
2410               arg = gimple_assign_rhs1 (stmt_tmp);
2411             }
2412
2413           if (match && single_imm_use (var, &use_p, &use_stmt)
2414               && gimple_code (use_stmt) == GIMPLE_COND)
2415             return use_stmt;
2416         }
2417     }
2418   return NULL;
2419 }
2420
2421 /* Return true when the basic block BB contains only clobbers followed by RESX.
2422    Such BBs are kept around to make removal of dead stores possible with
2423    presence of EH and will be optimized out by optimize_clobbers later in the
2424    game.
2425
2426    NEED_EH is used to recurse in case the clobber has non-EH predecessors
2427    that can be clobber only, too.  When it is false, the RESX is not necessary
2428    on the end of basic block; BB must then have a single successor instead.

        Debug statements are ignored, and the backward scan of BB stops at the
        first label.  In addition every incoming edge of BB must either be an EH
        edge or come from a block for which this function returns true with
        NEED_EH false.  */
2429
2430 static bool
2431 clobber_only_eh_bb_p (basic_block bb, bool need_eh = true)
2432 {
2433   gimple_stmt_iterator gsi = gsi_last_bb (bb);
2434   edge_iterator ei;
2435   edge e;
2436
2437   if (need_eh)
2438     {
2439       if (gsi_end_p (gsi))
2440         return false;
2441       if (gimple_code (gsi_stmt (gsi)) != GIMPLE_RESX)
2442         return false;
2443       gsi_prev (&gsi);
2444     }
2445   else if (!single_succ_p (bb))
2446     return false;
2447
       /* Walk the remaining statements backwards.  */
2448   for (; !gsi_end_p (gsi); gsi_prev (&gsi))
2449     {
2450       gimple *stmt = gsi_stmt (gsi);
2451       if (is_gimple_debug (stmt))
2452         continue;
2453       if (gimple_clobber_p (stmt))
2454         continue;
2455       if (gimple_code (stmt) == GIMPLE_LABEL)
2456         break;
2457       return false;
2458     }
2459
2460   /* See if all predecessors are either throws or clobber only BBs.  */
2461   FOR_EACH_EDGE (e, ei, bb->preds)
2462     if (!(e->flags & EDGE_EH)
2463         && !clobber_only_eh_bb_p (e->src, false))
2464       return false;
2465
2466   return true;
2467 }
2468
2469 /* Return true if STMT computes a floating point expression that may be
2470    affected by -ffast-math and similar flags.

        The test is whether any SSA operand of STMT, defined or used, has a type
        satisfying FLOAT_TYPE_P.  */
2471
2472 static bool
2473 fp_expression_p (gimple *stmt)
2474 {
2475   ssa_op_iter i;
2476   tree op;
2477
2478   FOR_EACH_SSA_TREE_OPERAND (op, stmt, i, SSA_OP_DEF|SSA_OP_USE)
2479     if (FLOAT_TYPE_P (TREE_TYPE (op)))
2480       return true;
2481   return false;
2482 }
2483
2484 /* Compute function body size parameters for NODE.
2485    When EARLY is true, we compute only simple summaries without
2486    non-trivial predicates to drive the early inliner.  */
2487
2488 static void
2489 estimate_function_body_sizes (struct cgraph_node *node, bool early)
2490 {
2491   gcov_type time = 0;
2492   /* Estimate static overhead for function prologue/epilogue and alignment. */
2493   int size = 2;
2494   /* Benefits are scaled by probability of elimination that is in range
2495      <0,2>.  */
2496   basic_block bb;
2497   struct function *my_function = DECL_STRUCT_FUNCTION (node->decl);
2498   int freq;
2499   struct inline_summary *info = inline_summaries->get (node);
2500   struct predicate bb_predicate;
2501   struct ipa_func_body_info fbi;
2502   vec<predicate_t> nonconstant_names = vNULL;
2503   int nblocks, n;
2504   int *order;
2505   predicate array_index = true_predicate ();
2506   gimple *fix_builtin_expect_stmt;
2507
2508   gcc_assert (my_function && my_function->cfg);
2509   gcc_assert (cfun == my_function);
2510
2511   memset(&fbi, 0, sizeof(fbi));
2512   info->conds = NULL;
2513   info->entry = NULL;
2514
2515   /* When optimizing and analyzing for IPA inliner, initialize loop optimizer
2516      so we can produce proper inline hints.
2517
2518      When optimizing and analyzing for early inliner, initialize node params
2519      so we can produce correct BB predicates.  */
2520
2521   if (opt_for_fn (node->decl, optimize))
2522     {
2523       calculate_dominance_info (CDI_DOMINATORS);
2524       if (!early)
2525         loop_optimizer_init (LOOPS_NORMAL | LOOPS_HAVE_RECORDED_EXITS);
2526       else
2527         {
2528           ipa_check_create_node_params ();
2529           ipa_initialize_node_params (node);
2530         }
2531
2532       if (ipa_node_params_sum)
2533         {
2534           fbi.node = node;
2535           fbi.info = IPA_NODE_REF (node);
2536           fbi.bb_infos = vNULL;
2537           fbi.bb_infos.safe_grow_cleared (last_basic_block_for_fn (cfun));
2538           fbi.param_count = count_formal_params(node->decl);
2539           nonconstant_names.safe_grow_cleared
2540             (SSANAMES (my_function)->length ());
2541         }
2542     }
2543
2544   if (dump_file)
2545     fprintf (dump_file, "\nAnalyzing function body size: %s\n",
2546              node->name ());
2547
2548   /* When we run into maximal number of entries, we assign everything to the
2549      constant truth case.  Be sure to have it in list. */
2550   bb_predicate = true_predicate ();
2551   account_size_time (info, 0, 0, &bb_predicate);
2552
2553   bb_predicate = not_inlined_predicate ();
2554   account_size_time (info, 2 * INLINE_SIZE_SCALE, 0, &bb_predicate);
2555
2556   if (fbi.info)
2557     compute_bb_predicates (&fbi, node, info);
2558   order = XNEWVEC (int, n_basic_blocks_for_fn (cfun));
2559   nblocks = pre_and_rev_post_order_compute (NULL, order, false);
2560   for (n = 0; n < nblocks; n++)
2561     {
2562       bb = BASIC_BLOCK_FOR_FN (cfun, order[n]);
2563       freq = compute_call_stmt_bb_frequency (node->decl, bb);
2564       if (clobber_only_eh_bb_p (bb))
2565         {
2566           if (dump_file && (dump_flags & TDF_DETAILS))
2567             fprintf (dump_file, "\n Ignoring BB %i;"
2568                      " it will be optimized away by cleanup_clobbers\n",
2569                      bb->index);
2570           continue;
2571         }
2572
2573       /* TODO: Obviously predicates can be propagated down across CFG.  */
2574       if (fbi.info)
2575         {
2576           if (bb->aux)
2577             bb_predicate = *(struct predicate *) bb->aux;
2578           else
2579             bb_predicate = false_predicate ();
2580         }
2581       else
2582         bb_predicate = true_predicate ();
2583
2584       if (dump_file && (dump_flags & TDF_DETAILS))
2585         {
2586           fprintf (dump_file, "\n BB %i predicate:", bb->index);
2587           dump_predicate (dump_file, info->conds, &bb_predicate);
2588         }
2589
2590       if (fbi.info && nonconstant_names.exists ())
2591         {
2592           struct predicate phi_predicate;
2593           bool first_phi = true;
2594
2595           for (gphi_iterator bsi = gsi_start_phis (bb); !gsi_end_p (bsi);
2596                gsi_next (&bsi))
2597             {
2598               if (first_phi
2599                   && !phi_result_unknown_predicate (fbi.info, info, bb,
2600                                                     &phi_predicate,
2601                                                     nonconstant_names))
2602                 break;
2603               first_phi = false;
2604               if (dump_file && (dump_flags & TDF_DETAILS))
2605                 {
2606                   fprintf (dump_file, "  ");
2607                   print_gimple_stmt (dump_file, gsi_stmt (bsi), 0, 0);
2608                 }
2609               predicate_for_phi_result (info, bsi.phi (), &phi_predicate,
2610                                         nonconstant_names);
2611             }
2612         }
2613
2614       fix_builtin_expect_stmt = find_foldable_builtin_expect (bb);
2615
2616       for (gimple_stmt_iterator bsi = gsi_start_bb (bb); !gsi_end_p (bsi);
2617            gsi_next (&bsi))
2618         {
2619           gimple *stmt = gsi_stmt (bsi);
2620           int this_size = estimate_num_insns (stmt, &eni_size_weights);
2621           int this_time = estimate_num_insns (stmt, &eni_time_weights);
2622           int prob;
2623           struct predicate will_be_nonconstant;
2624
2625           /* This relation stmt should be folded after we remove
2626              buildin_expect call. Adjust the cost here.  */
2627           if (stmt == fix_builtin_expect_stmt)
2628             {
2629               this_size--;
2630               this_time--;
2631             }
2632
2633           if (dump_file && (dump_flags & TDF_DETAILS))
2634             {
2635               fprintf (dump_file, "  ");
2636               print_gimple_stmt (dump_file, stmt, 0, 0);
2637               fprintf (dump_file, "\t\tfreq:%3.2f size:%3i time:%3i\n",
2638                        ((double) freq) / CGRAPH_FREQ_BASE, this_size,
2639                        this_time);
2640             }
2641
2642           if (gimple_assign_load_p (stmt) && nonconstant_names.exists ())
2643             {
2644               struct predicate this_array_index;
2645               this_array_index =
2646                 array_index_predicate (info, nonconstant_names,
2647                                        gimple_assign_rhs1 (stmt));
2648               if (!false_predicate_p (&this_array_index))
2649                 array_index =
2650                   and_predicates (info->conds, &array_index,
2651                                   &this_array_index);
2652             }
2653           if (gimple_store_p (stmt) && nonconstant_names.exists ())
2654             {
2655               struct predicate this_array_index;
2656               this_array_index =
2657                 array_index_predicate (info, nonconstant_names,
2658                                        gimple_get_lhs (stmt));
2659               if (!false_predicate_p (&this_array_index))
2660                 array_index =
2661                   and_predicates (info->conds, &array_index,
2662                                   &this_array_index);
2663             }
2664
2665
2666           if (is_gimple_call (stmt)
2667               && !gimple_call_internal_p (stmt))
2668             {
2669               struct cgraph_edge *edge = node->get_edge (stmt);
2670               struct inline_edge_summary *es = inline_edge_summary (edge);
2671
2672               /* Special case: results of BUILT_IN_CONSTANT_P will be always
2673                  resolved as constant.  We however don't want to optimize
2674                  out the cgraph edges.  */
2675               if (nonconstant_names.exists ()
2676                   && gimple_call_builtin_p (stmt, BUILT_IN_CONSTANT_P)
2677                   && gimple_call_lhs (stmt)
2678                   && TREE_CODE (gimple_call_lhs (stmt)) == SSA_NAME)
2679                 {
2680                   struct predicate false_p = false_predicate ();
2681                   nonconstant_names[SSA_NAME_VERSION (gimple_call_lhs (stmt))]
2682                     = false_p;
2683                 }
2684               if (ipa_node_params_sum)
2685                 {
2686                   int count = gimple_call_num_args (stmt);
2687                   int i;
2688
2689                   if (count)
2690                     es->param.safe_grow_cleared (count);
2691                   for (i = 0; i < count; i++)
2692                     {
2693                       int prob = param_change_prob (stmt, i);
2694                       gcc_assert (prob >= 0 && prob <= REG_BR_PROB_BASE);
2695                       es->param[i].change_prob = prob;
2696                     }
2697                 }
2698
2699               es->call_stmt_size = this_size;
2700               es->call_stmt_time = this_time;
2701               es->loop_depth = bb_loop_depth (bb);
2702               edge_set_predicate (edge, &bb_predicate);
2703             }
2704
2705           /* TODO: When conditional jump or swithc is known to be constant, but
2706              we did not translate it into the predicates, we really can account
2707              just maximum of the possible paths.  */
2708           if (fbi.info)
2709             will_be_nonconstant
2710               = will_be_nonconstant_predicate (&fbi, info,
2711                                                stmt, nonconstant_names);
2712           if (this_time || this_size)
2713             {
2714               struct predicate p;
2715
2716               this_time *= freq;
2717
2718               prob = eliminated_by_inlining_prob (stmt);
2719               if (prob == 1 && dump_file && (dump_flags & TDF_DETAILS))
2720                 fprintf (dump_file,
2721                          "\t\t50%% will be eliminated by inlining\n");
2722               if (prob == 2 && dump_file && (dump_flags & TDF_DETAILS))
2723                 fprintf (dump_file, "\t\tWill be eliminated by inlining\n");
2724
2725               if (fbi.info)
2726                 p = and_predicates (info->conds, &bb_predicate,
2727                                     &will_be_nonconstant);
2728               else
2729                 p = true_predicate ();
2730
2731               if (!false_predicate_p (&p)
2732                   || (is_gimple_call (stmt)
2733                       && !false_predicate_p (&bb_predicate)))
2734                 {
2735                   time += this_time;
2736                   size += this_size;
2737                   if (time > MAX_TIME * INLINE_TIME_SCALE)
2738                     time = MAX_TIME * INLINE_TIME_SCALE;
2739                 }
2740
2741               /* We account everything but the calls.  Calls have their own
2742                  size/time info attached to cgraph edges.  This is necessary
2743                  in order to make the cost disappear after inlining.  */
2744               if (!is_gimple_call (stmt))
2745                 {
2746                   if (prob)
2747                     {
2748                       struct predicate ip = not_inlined_predicate ();
2749                       ip = and_predicates (info->conds, &ip, &p);
2750                       account_size_time (info, this_size * prob,
2751                                          this_time * prob, &ip);
2752                     }
2753                   if (prob != 2)
2754                     account_size_time (info, this_size * (2 - prob),
2755                                        this_time * (2 - prob), &p);
2756                 }
2757
2758               if (!info->fp_expressions && fp_expression_p (stmt))
2759                 {
2760                   info->fp_expressions = true;
2761                   if (dump_file)
2762                     fprintf (dump_file, "   fp_expression set\n");
2763                 }
2764
2765               gcc_assert (time >= 0);
2766               gcc_assert (size >= 0);
2767             }
2768         }
2769     }
2770   set_hint_predicate (&inline_summaries->get (node)->array_index, array_index);
2771   time = (time + CGRAPH_FREQ_BASE / 2) / CGRAPH_FREQ_BASE;
2772   if (time > MAX_TIME)
2773     time = MAX_TIME;
2774   free (order);
2775
2776   if (nonconstant_names.exists () && !early)
2777     {
2778       struct loop *loop;
2779       predicate loop_iterations = true_predicate ();
2780       predicate loop_stride = true_predicate ();
2781
2782       if (dump_file && (dump_flags & TDF_DETAILS))
2783         flow_loops_dump (dump_file, NULL, 0);
2784       scev_initialize ();
2785       FOR_EACH_LOOP (loop, 0)
2786         {
2787           vec<edge> exits;
2788           edge ex;
2789           unsigned int j;
2790           struct tree_niter_desc niter_desc;
2791           bb_predicate = *(struct predicate *) loop->header->aux;
2792
2793           exits = get_loop_exit_edges (loop);
2794           FOR_EACH_VEC_ELT (exits, j, ex)
2795             if (number_of_iterations_exit (loop, ex, &niter_desc, false)
2796                 && !is_gimple_min_invariant (niter_desc.niter))
2797             {
2798               predicate will_be_nonconstant
2799                 = will_be_nonconstant_expr_predicate (fbi.info, info,
2800                                                       niter_desc.niter,
2801                                                       nonconstant_names);
2802               if (!true_predicate_p (&will_be_nonconstant))
2803                 will_be_nonconstant = and_predicates (info->conds,
2804                                                       &bb_predicate,
2805                                                       &will_be_nonconstant);
2806               if (!true_predicate_p (&will_be_nonconstant)
2807                   && !false_predicate_p (&will_be_nonconstant))
2808                 /* This is slightly inprecise.  We may want to represent each
2809                    loop with independent predicate.  */
2810                 loop_iterations =
2811                   and_predicates (info->conds, &loop_iterations,
2812                                   &will_be_nonconstant);
2813             }
2814           exits.release ();
2815         }
2816
2817       /* To avoid quadratic behavior we analyze stride predicates only
2818          with respect to the containing loop.  Thus we simply iterate
2819          over all defs in the outermost loop body.  */
2820       for (loop = loops_for_fn (cfun)->tree_root->inner;
2821            loop != NULL; loop = loop->next)
2822         {
2823           basic_block *body = get_loop_body (loop);
2824           for (unsigned i = 0; i < loop->num_nodes; i++)
2825             {
2826               gimple_stmt_iterator gsi;
2827               bb_predicate = *(struct predicate *) body[i]->aux;
2828               for (gsi = gsi_start_bb (body[i]); !gsi_end_p (gsi);
2829                    gsi_next (&gsi))
2830                 {
2831                   gimple *stmt = gsi_stmt (gsi);
2832
2833                   if (!is_gimple_assign (stmt))
2834                     continue;
2835
2836                   tree def = gimple_assign_lhs (stmt);
2837                   if (TREE_CODE (def) != SSA_NAME)
2838                     continue;
2839
2840                   affine_iv iv;
2841                   if (!simple_iv (loop_containing_stmt (stmt),
2842                                   loop_containing_stmt (stmt),
2843                                   def, &iv, true)
2844                       || is_gimple_min_invariant (iv.step))
2845                     continue;
2846
2847                   predicate will_be_nonconstant
2848                     = will_be_nonconstant_expr_predicate (fbi.info, info,
2849                                                           iv.step,
2850                                                           nonconstant_names);
2851                   if (!true_predicate_p (&will_be_nonconstant))
2852                     will_be_nonconstant
2853                       = and_predicates (info->conds, &bb_predicate,
2854                                         &will_be_nonconstant);
2855                   if (!true_predicate_p (&will_be_nonconstant)
2856                       && !false_predicate_p (&will_be_nonconstant))
2857                     /* This is slightly inprecise.  We may want to represent
2858                        each loop with independent predicate.  */
2859                     loop_stride = and_predicates (info->conds, &loop_stride,
2860                                                   &will_be_nonconstant);
2861                 }
2862             }
2863           free (body);
2864         }
2865       set_hint_predicate (&inline_summaries->get (node)->loop_iterations,
2866                           loop_iterations);
2867       set_hint_predicate (&inline_summaries->get (node)->loop_stride,
2868                           loop_stride);
2869       scev_finalize ();
2870     }
2871   FOR_ALL_BB_FN (bb, my_function)
2872     {
2873       edge e;
2874       edge_iterator ei;
2875
2876       if (bb->aux)
2877         edge_predicate_pool.remove ((predicate *)bb->aux);
2878       bb->aux = NULL;
2879       FOR_EACH_EDGE (e, ei, bb->succs)
2880         {
2881           if (e->aux)
2882             edge_predicate_pool.remove ((predicate *) e->aux);
2883           e->aux = NULL;
2884         }
2885     }
2886   inline_summaries->get (node)->self_time = time;
2887   inline_summaries->get (node)->self_size = size;
2888   nonconstant_names.release ();
2889   ipa_release_body_info (&fbi);
2890   if (opt_for_fn (node->decl, optimize))
2891     {
2892       if (!early)
2893         loop_optimizer_finalize ();
2894       else if (!ipa_edge_args_vector)
2895         ipa_free_all_node_params ();
2896       free_dominance_info (CDI_DOMINATORS);
2897     }
2898   if (dump_file)
2899     {
2900       fprintf (dump_file, "\n");
2901       dump_inline_summary (dump_file, node);
2902     }
2903 }
2904
2905
2906 /* Compute parameters of functions used by inliner.
2907    EARLY is true when we compute parameters for the early inliner  */
2908
2909 void
2910 compute_inline_parameters (struct cgraph_node *node, bool early)
2911 {
2912   HOST_WIDE_INT self_stack_size;
2913   struct cgraph_edge *e;
2914   struct inline_summary *info;
2915
2916   gcc_assert (!node->global.inlined_to);
2917
2918   inline_summary_alloc ();
2919
2920   info = inline_summaries->get (node);
2921   reset_inline_summary (node, info);
2922
2923   /* FIXME: Thunks are inlinable, but tree-inline don't know how to do that.
2924      Once this happen, we will need to more curefully predict call
2925      statement size.  */
2926   if (node->thunk.thunk_p)
2927     {
2928       struct inline_edge_summary *es = inline_edge_summary (node->callees);
2929       struct predicate t = true_predicate ();
2930
2931       info->inlinable = 0;
2932       node->callees->inline_failed = CIF_THUNK;
2933       node->local.can_change_signature = false;
2934       es->call_stmt_time = 1;
2935       es->call_stmt_size = 1;
2936       account_size_time (info, 0, 0, &t);
2937       return;
2938     }
2939
2940   /* Even is_gimple_min_invariant rely on current_function_decl.  */
2941   push_cfun (DECL_STRUCT_FUNCTION (node->decl));
2942
2943   /* Estimate the stack size for the function if we're optimizing.  */
2944   self_stack_size = optimize ? estimated_stack_frame_size (node) : 0;
2945   info->estimated_self_stack_size = self_stack_size;
2946   info->estimated_stack_size = self_stack_size;
2947   info->stack_frame_offset = 0;
2948
2949   /* Can this function be inlined at all?  */
2950   if (!opt_for_fn (node->decl, optimize)
2951       && !lookup_attribute ("always_inline",
2952                             DECL_ATTRIBUTES (node->decl)))
2953     info->inlinable = false;
2954   else
2955     info->inlinable = tree_inlinable_function_p (node->decl);
2956
2957   info->contains_cilk_spawn = fn_contains_cilk_spawn_p (cfun);
2958
2959   /* Type attributes can use parameter indices to describe them.  */
2960   if (TYPE_ATTRIBUTES (TREE_TYPE (node->decl)))
2961     node->local.can_change_signature = false;
2962   else
2963     {
2964       /* Otherwise, inlinable functions always can change signature.  */
2965       if (info->inlinable)
2966         node->local.can_change_signature = true;
2967       else
2968         {
2969           /* Functions calling builtin_apply can not change signature.  */
2970           for (e = node->callees; e; e = e->next_callee)
2971             {
2972               tree cdecl = e->callee->decl;
2973               if (DECL_BUILT_IN (cdecl)
2974                   && DECL_BUILT_IN_CLASS (cdecl) == BUILT_IN_NORMAL
2975                   && (DECL_FUNCTION_CODE (cdecl) == BUILT_IN_APPLY_ARGS
2976                       || DECL_FUNCTION_CODE (cdecl) == BUILT_IN_VA_START))
2977                 break;
2978             }
2979           node->local.can_change_signature = !e;
2980         }
2981     }
2982   estimate_function_body_sizes (node, early);
2983
2984   for (e = node->callees; e; e = e->next_callee)
2985     if (e->callee->comdat_local_p ())
2986       break;
2987   node->calls_comdat_local = (e != NULL);
2988
2989   /* Inlining characteristics are maintained by the cgraph_mark_inline.  */
2990   info->time = info->self_time;
2991   info->size = info->self_size;
2992   info->stack_frame_offset = 0;
2993   info->estimated_stack_size = info->estimated_self_stack_size;
2994   if (flag_checking)
2995     {
2996       inline_update_overall_summary (node);
2997       gcc_assert (info->time == info->self_time
2998                   && info->size == info->self_size);
2999     }
3000
3001   pop_cfun ();
3002 }
3003
3004
3005 /* Compute parameters of functions used by inliner using
3006    current_function_decl.  */
3007
3008 static unsigned int
3009 compute_inline_parameters_for_current (void)
3010 {
3011   compute_inline_parameters (cgraph_node::get (current_function_decl), true);
3012   return 0;
3013 }
3014
3015 namespace {
3016
3017 const pass_data pass_data_inline_parameters =
3018 {
3019   GIMPLE_PASS, /* type */
3020   "inline_param", /* name */
3021   OPTGROUP_INLINE, /* optinfo_flags */
3022   TV_INLINE_PARAMETERS, /* tv_id */
3023   0, /* properties_required */
3024   0, /* properties_provided */
3025   0, /* properties_destroyed */
3026   0, /* todo_flags_start */
3027   0, /* todo_flags_finish */
3028 };
3029
3030 class pass_inline_parameters : public gimple_opt_pass
3031 {
3032 public:
3033   pass_inline_parameters (gcc::context *ctxt)
3034     : gimple_opt_pass (pass_data_inline_parameters, ctxt)
3035   {}
3036
3037   /* opt_pass methods: */
3038   opt_pass * clone () { return new pass_inline_parameters (m_ctxt); }
3039   virtual unsigned int execute (function *)
3040     {
3041       return compute_inline_parameters_for_current ();
3042     }
3043
3044 }; // class pass_inline_parameters
3045
3046 } // anon namespace
3047
3048 gimple_opt_pass *
3049 make_pass_inline_parameters (gcc::context *ctxt)
3050 {
3051   return new pass_inline_parameters (ctxt);
3052 }
3053
3054
3055 /* Estimate benefit devirtualizing indirect edge IE, provided KNOWN_VALS,
3056    KNOWN_CONTEXTS and KNOWN_AGGS.  */
3057
3058 static bool
3059 estimate_edge_devirt_benefit (struct cgraph_edge *ie,
3060                               int *size, int *time,
3061                               vec<tree> known_vals,
3062                               vec<ipa_polymorphic_call_context> known_contexts,
3063                               vec<ipa_agg_jump_function_p> known_aggs)
3064 {
3065   tree target;
3066   struct cgraph_node *callee;
3067   struct inline_summary *isummary;
3068   enum availability avail;
3069   bool speculative;
3070
3071   if (!known_vals.exists () && !known_contexts.exists ())
3072     return false;
3073   if (!opt_for_fn (ie->caller->decl, flag_indirect_inlining))
3074     return false;
3075
3076   target = ipa_get_indirect_edge_target (ie, known_vals, known_contexts,
3077                                          known_aggs, &speculative);
3078   if (!target || speculative)
3079     return false;
3080
3081   /* Account for difference in cost between indirect and direct calls.  */
3082   *size -= (eni_size_weights.indirect_call_cost - eni_size_weights.call_cost);
3083   *time -= (eni_time_weights.indirect_call_cost - eni_time_weights.call_cost);
3084   gcc_checking_assert (*time >= 0);
3085   gcc_checking_assert (*size >= 0);
3086
3087   callee = cgraph_node::get (target);
3088   if (!callee || !callee->definition)
3089     return false;
3090   callee = callee->function_symbol (&avail);
3091   if (avail < AVAIL_AVAILABLE)
3092     return false;
3093   isummary = inline_summaries->get (callee);
3094   return isummary->inlinable;
3095 }
3096
3097 /* Increase SIZE, MIN_SIZE (if non-NULL) and TIME for size and time needed to
3098    handle edge E with probability PROB.
3099    Set HINTS if edge may be devirtualized.
3100    KNOWN_VALS, KNOWN_AGGS and KNOWN_CONTEXTS describe context of the call
3101    site.  */
3102
3103 static inline void
3104 estimate_edge_size_and_time (struct cgraph_edge *e, int *size, int *min_size,
3105                              int *time,
3106                              int prob,
3107                              vec<tree> known_vals,
3108                              vec<ipa_polymorphic_call_context> known_contexts,
3109                              vec<ipa_agg_jump_function_p> known_aggs,
3110                              inline_hints *hints)
3111 {
3112   struct inline_edge_summary *es = inline_edge_summary (e);
3113   int call_size = es->call_stmt_size;
3114   int call_time = es->call_stmt_time;
3115   int cur_size;
3116   if (!e->callee
3117       && estimate_edge_devirt_benefit (e, &call_size, &call_time,
3118                                        known_vals, known_contexts, known_aggs)
3119       && hints && e->maybe_hot_p ())
3120     *hints |= INLINE_HINT_indirect_call;
3121   cur_size = call_size * INLINE_SIZE_SCALE;
3122   *size += cur_size;
3123   if (min_size)
3124     *min_size += cur_size;
3125   *time += apply_probability ((gcov_type) call_time, prob)
3126     * e->frequency * (INLINE_TIME_SCALE / CGRAPH_FREQ_BASE);
3127   if (*time > MAX_TIME * INLINE_TIME_SCALE)
3128     *time = MAX_TIME * INLINE_TIME_SCALE;
3129 }
3130
3131
3132
3133 /* Increase SIZE, MIN_SIZE and TIME for size and time needed to handle all
3134    calls in NODE.  POSSIBLE_TRUTHS, KNOWN_VALS, KNOWN_AGGS and KNOWN_CONTEXTS
3135    describe context of the call site.  */
3136
3137 static void
3138 estimate_calls_size_and_time (struct cgraph_node *node, int *size,
3139                               int *min_size, int *time,
3140                               inline_hints *hints,
3141                               clause_t possible_truths,
3142                               vec<tree> known_vals,
3143                               vec<ipa_polymorphic_call_context> known_contexts,
3144                               vec<ipa_agg_jump_function_p> known_aggs)
3145 {
3146   struct cgraph_edge *e;
3147   for (e = node->callees; e; e = e->next_callee)
3148     {
3149       if (inline_edge_summary_vec.length () <= (unsigned) e->uid)
3150         continue;
3151
3152       struct inline_edge_summary *es = inline_edge_summary (e);
3153
3154       /* Do not care about zero sized builtins.  */
3155       if (e->inline_failed && !es->call_stmt_size)
3156         {
3157           gcc_checking_assert (!es->call_stmt_time);
3158           continue;
3159         }
3160       if (!es->predicate
3161           || evaluate_predicate (es->predicate, possible_truths))
3162         {
3163           if (e->inline_failed)
3164             {
3165               /* Predicates of calls shall not use NOT_CHANGED codes,
3166                  sowe do not need to compute probabilities.  */
3167               estimate_edge_size_and_time (e, size,
3168                                            es->predicate ? NULL : min_size,
3169                                            time, REG_BR_PROB_BASE,
3170                                            known_vals, known_contexts,
3171                                            known_aggs, hints);
3172             }
3173           else
3174             estimate_calls_size_and_time (e->callee, size, min_size, time,
3175                                           hints,
3176                                           possible_truths,
3177                                           known_vals, known_contexts,
3178                                           known_aggs);
3179         }
3180     }
3181   for (e = node->indirect_calls; e; e = e->next_callee)
3182     {
3183       if (inline_edge_summary_vec.length () <= (unsigned) e->uid)
3184         continue;
3185
3186       struct inline_edge_summary *es = inline_edge_summary (e);
3187       if (!es->predicate
3188           || evaluate_predicate (es->predicate, possible_truths))
3189         estimate_edge_size_and_time (e, size,
3190                                      es->predicate ? NULL : min_size,
3191                                      time, REG_BR_PROB_BASE,
3192                                      known_vals, known_contexts, known_aggs,
3193                                      hints);
3194     }
3195 }
3196
3197
3198 /* Estimate size and time needed to execute NODE assuming
3199    POSSIBLE_TRUTHS clause, and KNOWN_VALS, KNOWN_AGGS and KNOWN_CONTEXTS
3200    information about NODE's arguments.  If non-NULL use also probability
3201    information present in INLINE_PARAM_SUMMARY vector.
3202    Additionally detemine hints determined by the context.  Finally compute
3203    minimal size needed for the call that is independent on the call context and
3204    can be used for fast estimates.  Return the values in RET_SIZE,
3205    RET_MIN_SIZE, RET_TIME and RET_HINTS.  */
3206
3207 static void
3208 estimate_node_size_and_time (struct cgraph_node *node,
3209                              clause_t possible_truths,
3210                              vec<tree> known_vals,
3211                              vec<ipa_polymorphic_call_context> known_contexts,
3212                              vec<ipa_agg_jump_function_p> known_aggs,
3213                              int *ret_size, int *ret_min_size, int *ret_time,
3214                              inline_hints *ret_hints,
3215                              vec<inline_param_summary>
3216                              inline_param_summary)
3217 {
3218   struct inline_summary *info = inline_summaries->get (node);
3219   size_time_entry *e;
3220   int size = 0;
3221   int time = 0;
3222   int min_size = 0;
3223   inline_hints hints = 0;
3224   int i;
3225
3226   if (dump_file && (dump_flags & TDF_DETAILS))
3227     {
3228       bool found = false;
3229       fprintf (dump_file, "   Estimating body: %s/%i\n"
3230                "   Known to be false: ", node->name (),
3231                node->order);
3232
3233       for (i = predicate_not_inlined_condition;
3234            i < (predicate_first_dynamic_condition
3235                 + (int) vec_safe_length (info->conds)); i++)
3236         if (!(possible_truths & (1 << i)))
3237           {
3238             if (found)
3239               fprintf (dump_file, ", ");
3240             found = true;
3241             dump_condition (dump_file, info->conds, i);
3242           }
3243     }
3244
3245   for (i = 0; vec_safe_iterate (info->entry, i, &e); i++)
3246     if (evaluate_predicate (&e->predicate, possible_truths))
3247       {
3248         size += e->size;
3249         gcc_checking_assert (e->time >= 0);
3250         gcc_checking_assert (time >= 0);
3251         if (!inline_param_summary.exists ())
3252           time += e->time;
3253         else
3254           {
3255             int prob = predicate_probability (info->conds,
3256                                               &e->predicate,
3257                                               possible_truths,
3258                                               inline_param_summary);
3259             gcc_checking_assert (prob >= 0);
3260             gcc_checking_assert (prob <= REG_BR_PROB_BASE);
3261             time += apply_probability ((gcov_type) e->time, prob);
3262           }
3263         if (time > MAX_TIME * INLINE_TIME_SCALE)
3264           time = MAX_TIME * INLINE_TIME_SCALE;
3265         gcc_checking_assert (time >= 0);
3266
3267       }
3268   gcc_checking_assert (true_predicate_p (&(*info->entry)[0].predicate));
3269   min_size = (*info->entry)[0].size;
3270   gcc_checking_assert (size >= 0);
3271   gcc_checking_assert (time >= 0);
3272
3273   if (info->loop_iterations
3274       && !evaluate_predicate (info->loop_iterations, possible_truths))
3275     hints |= INLINE_HINT_loop_iterations;
3276   if (info->loop_stride
3277       && !evaluate_predicate (info->loop_stride, possible_truths))
3278     hints |= INLINE_HINT_loop_stride;
3279   if (info->array_index
3280       && !evaluate_predicate (info->array_index, possible_truths))
3281     hints |= INLINE_HINT_array_index;
3282   if (info->scc_no)
3283     hints |= INLINE_HINT_in_scc;
3284   if (DECL_DECLARED_INLINE_P (node->decl))
3285     hints |= INLINE_HINT_declared_inline;
3286
3287   estimate_calls_size_and_time (node, &size, &min_size, &time, &hints, possible_truths,
3288                                 known_vals, known_contexts, known_aggs);
3289   gcc_checking_assert (size >= 0);
3290   gcc_checking_assert (time >= 0);
3291   time = RDIV (time, INLINE_TIME_SCALE);
3292   size = RDIV (size, INLINE_SIZE_SCALE);
3293   min_size = RDIV (min_size, INLINE_SIZE_SCALE);
3294
3295   if (dump_file && (dump_flags & TDF_DETAILS))
3296     fprintf (dump_file, "\n   size:%i time:%i\n", (int) size, (int) time);
3297   if (ret_time)
3298     *ret_time = time;
3299   if (ret_size)
3300     *ret_size = size;
3301   if (ret_min_size)
3302     *ret_min_size = min_size;
3303   if (ret_hints)
3304     *ret_hints = hints;
3305   return;
3306 }
3307
3308
3309 /* Estimate size and time needed to execute callee of EDGE assuming that
3310    parameters known to be constant at caller of EDGE are propagated.
3311    KNOWN_VALS and KNOWN_CONTEXTS are vectors of assumed known constant values
3312    and types for parameters.  */
3313
3314 void
3315 estimate_ipcp_clone_size_and_time (struct cgraph_node *node,
3316                                    vec<tree> known_vals,
3317                                    vec<ipa_polymorphic_call_context>
3318                                    known_contexts,
3319                                    vec<ipa_agg_jump_function_p> known_aggs,
3320                                    int *ret_size, int *ret_time,
3321                                    inline_hints *hints)
3322 {
3323   clause_t clause;
3324
3325   clause = evaluate_conditions_for_known_args (node, false, known_vals,
3326                                                known_aggs);
3327   estimate_node_size_and_time (node, clause, known_vals, known_contexts,
3328                                known_aggs, ret_size, NULL, ret_time, hints, vNULL);
3329 }
3330
/* Translate all conditions from callee representation into caller
   representation and symbolically evaluate predicate P into new predicate.

   INFO is inline_summary of function we are adding predicate into, CALLEE_INFO
   is summary of function predicate P is from.  OPERAND_MAP is array mapping
   callee formal IDs to the caller formal IDs.  POSSIBLE_TRUTHS is clause of
   all callee conditions that may be true in caller context.  TOPLEV_PREDICATE
   is predicate under which callee is executed.  OFFSET_MAP is an array of
   offsets that need to be added to conditions; a negative offset means that
   conditions relying on values passed by reference have to be discarded
   because they might not be preserved (and should be considered offset zero
   for other purposes).  */
3343
3344 static struct predicate
3345 remap_predicate (struct inline_summary *info,
3346                  struct inline_summary *callee_info,
3347                  struct predicate *p,
3348                  vec<int> operand_map,
3349                  vec<int> offset_map,
3350                  clause_t possible_truths, struct predicate *toplev_predicate)
3351 {
3352   int i;
3353   struct predicate out = true_predicate ();
3354
3355   /* True predicate is easy.  */
3356   if (true_predicate_p (p))
3357     return *toplev_predicate;
3358   for (i = 0; p->clause[i]; i++)
3359     {
3360       clause_t clause = p->clause[i];
3361       int cond;
3362       struct predicate clause_predicate = false_predicate ();
3363
3364       gcc_assert (i < MAX_CLAUSES);
3365
3366       for (cond = 0; cond < NUM_CONDITIONS; cond++)
3367         /* Do we have condition we can't disprove?   */
3368         if (clause & possible_truths & (1 << cond))
3369           {
3370             struct predicate cond_predicate;
3371             /* Work out if the condition can translate to predicate in the
3372                inlined function.  */
3373             if (cond >= predicate_first_dynamic_condition)
3374               {
3375                 struct condition *c;
3376
3377                 c = &(*callee_info->conds)[cond
3378                                            -
3379                                            predicate_first_dynamic_condition];
3380                 /* See if we can remap condition operand to caller's operand.
3381                    Otherwise give up.  */
3382                 if (!operand_map.exists ()
3383                     || (int) operand_map.length () <= c->operand_num
3384                     || operand_map[c->operand_num] == -1
3385                     /* TODO: For non-aggregate conditions, adding an offset is
3386                        basically an arithmetic jump function processing which
3387                        we should support in future.  */
3388                     || ((!c->agg_contents || !c->by_ref)
3389                         && offset_map[c->operand_num] > 0)
3390                     || (c->agg_contents && c->by_ref
3391                         && offset_map[c->operand_num] < 0))
3392                   cond_predicate = true_predicate ();
3393                 else
3394                   {
3395                     struct agg_position_info ap;
3396                     HOST_WIDE_INT offset_delta = offset_map[c->operand_num];
3397                     if (offset_delta < 0)
3398                       {
3399                         gcc_checking_assert (!c->agg_contents || !c->by_ref);
3400                         offset_delta = 0;
3401                       }
3402                     gcc_assert (!c->agg_contents
3403                                 || c->by_ref || offset_delta == 0);
3404                     ap.offset = c->offset + offset_delta;
3405                     ap.agg_contents = c->agg_contents;
3406                     ap.by_ref = c->by_ref;
3407                     cond_predicate = add_condition (info,
3408                                                     operand_map[c->operand_num],
3409                                                     &ap, c->code, c->val);
3410                   }
3411               }
3412             /* Fixed conditions remains same, construct single
3413                condition predicate.  */
3414             else
3415               {
3416                 cond_predicate.clause[0] = 1 << cond;
3417                 cond_predicate.clause[1] = 0;
3418               }
3419             clause_predicate = or_predicates (info->conds, &clause_predicate,
3420                                               &cond_predicate);
3421           }
3422       out = and_predicates (info->conds, &out, &clause_predicate);
3423     }
3424   return and_predicates (info->conds, &out, toplev_predicate);
3425 }
3426
3427
3428 /* Update summary information of inline clones after inlining.
3429    Compute peak stack usage.  */
3430
3431 static void
3432 inline_update_callee_summaries (struct cgraph_node *node, int depth)
3433 {
3434   struct cgraph_edge *e;
3435   struct inline_summary *callee_info = inline_summaries->get (node);
3436   struct inline_summary *caller_info = inline_summaries->get (node->callers->caller);
3437   HOST_WIDE_INT peak;
3438
3439   callee_info->stack_frame_offset
3440     = caller_info->stack_frame_offset
3441     + caller_info->estimated_self_stack_size;
3442   peak = callee_info->stack_frame_offset
3443     + callee_info->estimated_self_stack_size;
3444   if (inline_summaries->get (node->global.inlined_to)->estimated_stack_size < peak)
3445       inline_summaries->get (node->global.inlined_to)->estimated_stack_size = peak;
3446   ipa_propagate_frequency (node);
3447   for (e = node->callees; e; e = e->next_callee)
3448     {
3449       if (!e->inline_failed)
3450         inline_update_callee_summaries (e->callee, depth);
3451       inline_edge_summary (e)->loop_depth += depth;
3452     }
3453   for (e = node->indirect_calls; e; e = e->next_callee)
3454     inline_edge_summary (e)->loop_depth += depth;
3455 }
3456
3457 /* Update change_prob of EDGE after INLINED_EDGE has been inlined.
3458    When functoin A is inlined in B and A calls C with parameter that
3459    changes with probability PROB1 and C is known to be passthroug
3460    of argument if B that change with probability PROB2, the probability
3461    of change is now PROB1*PROB2.  */
3462
3463 static void
3464 remap_edge_change_prob (struct cgraph_edge *inlined_edge,
3465                         struct cgraph_edge *edge)
3466 {
3467   if (ipa_node_params_sum)
3468     {
3469       int i;
3470       struct ipa_edge_args *args = IPA_EDGE_REF (edge);
3471       struct inline_edge_summary *es = inline_edge_summary (edge);
3472       struct inline_edge_summary *inlined_es
3473         = inline_edge_summary (inlined_edge);
3474
3475       for (i = 0; i < ipa_get_cs_argument_count (args); i++)
3476         {
3477           struct ipa_jump_func *jfunc = ipa_get_ith_jump_func (args, i);
3478           if (jfunc->type == IPA_JF_PASS_THROUGH
3479               && (ipa_get_jf_pass_through_formal_id (jfunc)
3480                   < (int) inlined_es->param.length ()))
3481             {
3482               int jf_formal_id = ipa_get_jf_pass_through_formal_id (jfunc);
3483               int prob1 = es->param[i].change_prob;
3484               int prob2 = inlined_es->param[jf_formal_id].change_prob;
3485               int prob = combine_probabilities (prob1, prob2);
3486
3487               if (prob1 && prob2 && !prob)
3488                 prob = 1;
3489
3490               es->param[i].change_prob = prob;
3491             }
3492         }
3493     }
3494 }
3495
3496 /* Update edge summaries of NODE after INLINED_EDGE has been inlined.
3497
3498    Remap predicates of callees of NODE.  Rest of arguments match
3499    remap_predicate.
3500
3501    Also update change probabilities.  */
3502
3503 static void
3504 remap_edge_summaries (struct cgraph_edge *inlined_edge,
3505                       struct cgraph_node *node,
3506                       struct inline_summary *info,
3507                       struct inline_summary *callee_info,
3508                       vec<int> operand_map,
3509                       vec<int> offset_map,
3510                       clause_t possible_truths,
3511                       struct predicate *toplev_predicate)
3512 {
3513   struct cgraph_edge *e, *next;
3514   for (e = node->callees; e; e = next)
3515     {
3516       struct inline_edge_summary *es = inline_edge_summary (e);
3517       struct predicate p;
3518       next = e->next_callee;
3519
3520       if (e->inline_failed)
3521         {
3522           remap_edge_change_prob (inlined_edge, e);
3523
3524           if (es->predicate)
3525             {
3526               p = remap_predicate (info, callee_info,
3527                                    es->predicate, operand_map, offset_map,
3528                                    possible_truths, toplev_predicate);
3529               edge_set_predicate (e, &p);
3530             }
3531           else
3532             edge_set_predicate (e, toplev_predicate);
3533         }
3534       else
3535         remap_edge_summaries (inlined_edge, e->callee, info, callee_info,
3536                               operand_map, offset_map, possible_truths,
3537                               toplev_predicate);
3538     }
3539   for (e = node->indirect_calls; e; e = next)
3540     {
3541       struct inline_edge_summary *es = inline_edge_summary (e);
3542       struct predicate p;
3543       next = e->next_callee;
3544
3545       remap_edge_change_prob (inlined_edge, e);
3546       if (es->predicate)
3547         {
3548           p = remap_predicate (info, callee_info,
3549                                es->predicate, operand_map, offset_map,
3550                                possible_truths, toplev_predicate);
3551           edge_set_predicate (e, &p);
3552         }
3553       else
3554         edge_set_predicate (e, toplev_predicate);
3555     }
3556 }
3557
3558 /* Same as remap_predicate, but set result into hint *HINT.  */
3559
3560 static void
3561 remap_hint_predicate (struct inline_summary *info,
3562                       struct inline_summary *callee_info,
3563                       struct predicate **hint,
3564                       vec<int> operand_map,
3565                       vec<int> offset_map,
3566                       clause_t possible_truths,
3567                       struct predicate *toplev_predicate)
3568 {
3569   predicate p;
3570
3571   if (!*hint)
3572     return;
3573   p = remap_predicate (info, callee_info,
3574                        *hint,
3575                        operand_map, offset_map,
3576                        possible_truths, toplev_predicate);
3577   if (!false_predicate_p (&p) && !true_predicate_p (&p))
3578     {
3579       if (!*hint)
3580         set_hint_predicate (hint, p);
3581       else
3582         **hint = and_predicates (info->conds, *hint, &p);
3583     }
3584 }
3585
3586 /* We inlined EDGE.  Update summary of the function we inlined into.  */
3587
3588 void
3589 inline_merge_summary (struct cgraph_edge *edge)
3590 {
3591   struct inline_summary *callee_info = inline_summaries->get (edge->callee);
3592   struct cgraph_node *to = (edge->caller->global.inlined_to
3593                             ? edge->caller->global.inlined_to : edge->caller);
3594   struct inline_summary *info = inline_summaries->get (to);
3595   clause_t clause = 0;          /* not_inline is known to be false.  */
3596   size_time_entry *e;
3597   vec<int> operand_map = vNULL;
3598   vec<int> offset_map = vNULL;
3599   int i;
3600   struct predicate toplev_predicate;
3601   struct predicate true_p = true_predicate ();
3602   struct inline_edge_summary *es = inline_edge_summary (edge);
3603
3604   if (es->predicate)
3605     toplev_predicate = *es->predicate;
3606   else
3607     toplev_predicate = true_predicate ();
3608
3609   info->fp_expressions |= callee_info->fp_expressions;
3610
3611   if (callee_info->conds)
3612     evaluate_properties_for_edge (edge, true, &clause, NULL, NULL, NULL);
3613   if (ipa_node_params_sum && callee_info->conds)
3614     {
3615       struct ipa_edge_args *args = IPA_EDGE_REF (edge);
3616       int count = ipa_get_cs_argument_count (args);
3617       int i;
3618
3619       if (count)
3620         {
3621           operand_map.safe_grow_cleared (count);
3622           offset_map.safe_grow_cleared (count);
3623         }
3624       for (i = 0; i < count; i++)
3625         {
3626           struct ipa_jump_func *jfunc = ipa_get_ith_jump_func (args, i);
3627           int map = -1;
3628
3629           /* TODO: handle non-NOPs when merging.  */
3630           if (jfunc->type == IPA_JF_PASS_THROUGH)
3631             {
3632               if (ipa_get_jf_pass_through_operation (jfunc) == NOP_EXPR)
3633                 map = ipa_get_jf_pass_through_formal_id (jfunc);
3634               if (!ipa_get_jf_pass_through_agg_preserved (jfunc))
3635                 offset_map[i] = -1;
3636             }
3637           else if (jfunc->type == IPA_JF_ANCESTOR)
3638             {
3639               HOST_WIDE_INT offset = ipa_get_jf_ancestor_offset (jfunc);
3640               if (offset >= 0 && offset < INT_MAX)
3641                 {
3642                   map = ipa_get_jf_ancestor_formal_id (jfunc);
3643                   if (!ipa_get_jf_ancestor_agg_preserved (jfunc))
3644                     offset = -1;
3645                   offset_map[i] = offset;
3646                 }
3647             }
3648           operand_map[i] = map;
3649           gcc_assert (map < ipa_get_param_count (IPA_NODE_REF (to)));
3650         }
3651     }
3652   for (i = 0; vec_safe_iterate (callee_info->entry, i, &e); i++)
3653     {
3654       struct predicate p = remap_predicate (info, callee_info,
3655                                             &e->predicate, operand_map,
3656                                             offset_map, clause,
3657                                             &toplev_predicate);
3658       if (!false_predicate_p (&p))
3659         {
3660           gcov_type add_time = ((gcov_type) e->time * edge->frequency
3661                                 + CGRAPH_FREQ_BASE / 2) / CGRAPH_FREQ_BASE;
3662           int prob = predicate_probability (callee_info->conds,
3663                                             &e->predicate,
3664                                             clause, es->param);
3665           add_time = apply_probability ((gcov_type) add_time, prob);
3666           if (add_time > MAX_TIME * INLINE_TIME_SCALE)
3667             add_time = MAX_TIME * INLINE_TIME_SCALE;
3668           if (prob != REG_BR_PROB_BASE
3669               && dump_file && (dump_flags & TDF_DETAILS))
3670             {
3671               fprintf (dump_file, "\t\tScaling time by probability:%f\n",
3672                        (double) prob / REG_BR_PROB_BASE);
3673             }
3674           account_size_time (info, e->size, add_time, &p);
3675         }
3676     }
3677   remap_edge_summaries (edge, edge->callee, info, callee_info, operand_map,
3678                         offset_map, clause, &toplev_predicate);
3679   remap_hint_predicate (info, callee_info,
3680                         &callee_info->loop_iterations,
3681                         operand_map, offset_map, clause, &toplev_predicate);
3682   remap_hint_predicate (info, callee_info,
3683                         &callee_info->loop_stride,
3684                         operand_map, offset_map, clause, &toplev_predicate);
3685   remap_hint_predicate (info, callee_info,
3686                         &callee_info->array_index,
3687                         operand_map, offset_map, clause, &toplev_predicate);
3688
3689   inline_update_callee_summaries (edge->callee,
3690                                   inline_edge_summary (edge)->loop_depth);
3691
3692   /* We do not maintain predicates of inlined edges, free it.  */
3693   edge_set_predicate (edge, &true_p);
3694   /* Similarly remove param summaries.  */
3695   es->param.release ();
3696   operand_map.release ();
3697   offset_map.release ();
3698 }
3699
3700 /* For performance reasons inline_merge_summary is not updating overall size
3701    and time.  Recompute it.  */
3702
3703 void
3704 inline_update_overall_summary (struct cgraph_node *node)
3705 {
3706   struct inline_summary *info = inline_summaries->get (node);
3707   size_time_entry *e;
3708   int i;
3709
3710   info->size = 0;
3711   info->time = 0;
3712   for (i = 0; vec_safe_iterate (info->entry, i, &e); i++)
3713     {
3714       info->size += e->size, info->time += e->time;
3715       if (info->time > MAX_TIME * INLINE_TIME_SCALE)
3716         info->time = MAX_TIME * INLINE_TIME_SCALE;
3717     }
3718   estimate_calls_size_and_time (node, &info->size, &info->min_size,
3719                                 &info->time, NULL,
3720                                 ~(clause_t) (1 << predicate_false_condition),
3721                                 vNULL, vNULL, vNULL);
3722   info->time = (info->time + INLINE_TIME_SCALE / 2) / INLINE_TIME_SCALE;
3723   info->size = (info->size + INLINE_SIZE_SCALE / 2) / INLINE_SIZE_SCALE;
3724 }
3725
3726 /* Return hints derrived from EDGE.   */
3727 int
3728 simple_edge_hints (struct cgraph_edge *edge)
3729 {
3730   int hints = 0;
3731   struct cgraph_node *to = (edge->caller->global.inlined_to
3732                             ? edge->caller->global.inlined_to : edge->caller);
3733   struct cgraph_node *callee = edge->callee->ultimate_alias_target ();
3734   if (inline_summaries->get (to)->scc_no
3735       && inline_summaries->get (to)->scc_no
3736          == inline_summaries->get (callee)->scc_no
3737       && !edge->recursive_p ())
3738     hints |= INLINE_HINT_same_scc;
3739
3740   if (callee->lto_file_data && edge->caller->lto_file_data
3741       && edge->caller->lto_file_data != callee->lto_file_data
3742       && !callee->merged_comdat && !callee->icf_merged)
3743     hints |= INLINE_HINT_cross_module;
3744
3745   return hints;
3746 }
3747
3748 /* Estimate the time cost for the caller when inlining EDGE.
3749    Only to be called via estimate_edge_time, that handles the
3750    caching mechanism.
3751
3752    When caching, also update the cache entry.  Compute both time and
3753    size, since we always need both metrics eventually.  */
3754
3755 int
3756 do_estimate_edge_time (struct cgraph_edge *edge)
3757 {
3758   int time;
3759   int size;
3760   inline_hints hints;
3761   struct cgraph_node *callee;
3762   clause_t clause;
3763   vec<tree> known_vals;
3764   vec<ipa_polymorphic_call_context> known_contexts;
3765   vec<ipa_agg_jump_function_p> known_aggs;
3766   struct inline_edge_summary *es = inline_edge_summary (edge);
3767   int min_size;
3768
3769   callee = edge->callee->ultimate_alias_target ();
3770
3771   gcc_checking_assert (edge->inline_failed);
3772   evaluate_properties_for_edge (edge, true,
3773                                 &clause, &known_vals, &known_contexts,
3774                                 &known_aggs);
3775   estimate_node_size_and_time (callee, clause, known_vals, known_contexts,
3776                                known_aggs, &size, &min_size, &time, &hints, es->param);
3777
3778   /* When we have profile feedback, we can quite safely identify hot
3779      edges and for those we disable size limits.  Don't do that when
3780      probability that caller will call the callee is low however, since it
3781      may hurt optimization of the caller's hot path.  */
3782   if (edge->count && edge->maybe_hot_p ()
3783       && (edge->count * 2
3784           > (edge->caller->global.inlined_to
3785              ? edge->caller->global.inlined_to->count : edge->caller->count)))
3786     hints |= INLINE_HINT_known_hot;
3787
3788   known_vals.release ();
3789   known_contexts.release ();
3790   known_aggs.release ();
3791   gcc_checking_assert (size >= 0);
3792   gcc_checking_assert (time >= 0);
3793
3794   /* When caching, update the cache entry.  */
3795   if (edge_growth_cache.exists ())
3796     {
3797       inline_summaries->get (edge->callee)->min_size = min_size;
3798       if ((int) edge_growth_cache.length () <= edge->uid)
3799         edge_growth_cache.safe_grow_cleared (symtab->edges_max_uid);
3800       edge_growth_cache[edge->uid].time = time + (time >= 0);
3801
3802       edge_growth_cache[edge->uid].size = size + (size >= 0);
3803       hints |= simple_edge_hints (edge);
3804       edge_growth_cache[edge->uid].hints = hints + 1;
3805     }
3806   return time;
3807 }
3808
3809
3810 /* Return estimated callee growth after inlining EDGE.
3811    Only to be called via estimate_edge_size.  */
3812
3813 int
3814 do_estimate_edge_size (struct cgraph_edge *edge)
3815 {
3816   int size;
3817   struct cgraph_node *callee;
3818   clause_t clause;
3819   vec<tree> known_vals;
3820   vec<ipa_polymorphic_call_context> known_contexts;
3821   vec<ipa_agg_jump_function_p> known_aggs;
3822
3823   /* When we do caching, use do_estimate_edge_time to populate the entry.  */
3824
3825   if (edge_growth_cache.exists ())
3826     {
3827       do_estimate_edge_time (edge);
3828       size = edge_growth_cache[edge->uid].size;
3829       gcc_checking_assert (size);
3830       return size - (size > 0);
3831     }
3832
3833   callee = edge->callee->ultimate_alias_target ();
3834
3835   /* Early inliner runs without caching, go ahead and do the dirty work.  */
3836   gcc_checking_assert (edge->inline_failed);
3837   evaluate_properties_for_edge (edge, true,
3838                                 &clause, &known_vals, &known_contexts,
3839                                 &known_aggs);
3840   estimate_node_size_and_time (callee, clause, known_vals, known_contexts,
3841                                known_aggs, &size, NULL, NULL, NULL, vNULL);
3842   known_vals.release ();
3843   known_contexts.release ();
3844   known_aggs.release ();
3845   return size;
3846 }
3847
3848
3849 /* Estimate the growth of the caller when inlining EDGE.
3850    Only to be called via estimate_edge_size.  */
3851
3852 inline_hints
3853 do_estimate_edge_hints (struct cgraph_edge *edge)
3854 {
3855   inline_hints hints;
3856   struct cgraph_node *callee;
3857   clause_t clause;
3858   vec<tree> known_vals;
3859   vec<ipa_polymorphic_call_context> known_contexts;
3860   vec<ipa_agg_jump_function_p> known_aggs;
3861
3862   /* When we do caching, use do_estimate_edge_time to populate the entry.  */
3863
3864   if (edge_growth_cache.exists ())
3865     {
3866       do_estimate_edge_time (edge);
3867       hints = edge_growth_cache[edge->uid].hints;
3868       gcc_checking_assert (hints);
3869       return hints - 1;
3870     }
3871
3872   callee = edge->callee->ultimate_alias_target ();
3873
3874   /* Early inliner runs without caching, go ahead and do the dirty work.  */
3875   gcc_checking_assert (edge->inline_failed);
3876   evaluate_properties_for_edge (edge, true,
3877                                 &clause, &known_vals, &known_contexts,
3878                                 &known_aggs);
3879   estimate_node_size_and_time (callee, clause, known_vals, known_contexts,
3880                                known_aggs, NULL, NULL, NULL, &hints, vNULL);
3881   known_vals.release ();
3882   known_contexts.release ();
3883   known_aggs.release ();
3884   hints |= simple_edge_hints (edge);
3885   return hints;
3886 }
3887
3888
3889 /* Estimate self time of the function NODE after inlining EDGE.  */
3890
3891 int
3892 estimate_time_after_inlining (struct cgraph_node *node,
3893                               struct cgraph_edge *edge)
3894 {
3895   struct inline_edge_summary *es = inline_edge_summary (edge);
3896   if (!es->predicate || !false_predicate_p (es->predicate))
3897     {
3898       gcov_type time =
3899         inline_summaries->get (node)->time + estimate_edge_time (edge);
3900       if (time < 0)
3901         time = 0;
3902       if (time > MAX_TIME)
3903         time = MAX_TIME;
3904       return time;
3905     }
3906   return inline_summaries->get (node)->time;
3907 }
3908
3909
3910 /* Estimate the size of NODE after inlining EDGE which should be an
3911    edge to either NODE or a call inlined into NODE.  */
3912
3913 int
3914 estimate_size_after_inlining (struct cgraph_node *node,
3915                               struct cgraph_edge *edge)
3916 {
3917   struct inline_edge_summary *es = inline_edge_summary (edge);
3918   if (!es->predicate || !false_predicate_p (es->predicate))
3919     {
3920       int size = inline_summaries->get (node)->size + estimate_edge_growth (edge);
3921       gcc_assert (size >= 0);
3922       return size;
3923     }
3924   return inline_summaries->get (node)->size;
3925 }
3926
3927
3928 struct growth_data
3929 {
3930   struct cgraph_node *node;
3931   bool self_recursive;
3932   bool uninlinable;
3933   int growth;
3934 };
3935
3936
3937 /* Worker for do_estimate_growth.  Collect growth for all callers.  */
3938
3939 static bool
3940 do_estimate_growth_1 (struct cgraph_node *node, void *data)
3941 {
3942   struct cgraph_edge *e;
3943   struct growth_data *d = (struct growth_data *) data;
3944
3945   for (e = node->callers; e; e = e->next_caller)
3946     {
3947       gcc_checking_assert (e->inline_failed);
3948
3949       if (cgraph_inline_failed_type (e->inline_failed) == CIF_FINAL_ERROR)
3950         {
3951           d->uninlinable = true;
3952           continue;
3953         }
3954
3955       if (e->recursive_p ())
3956         {
3957           d->self_recursive = true;
3958           continue;
3959         }
3960       d->growth += estimate_edge_growth (e);
3961     }
3962   return false;
3963 }
3964
3965
3966 /* Estimate the growth caused by inlining NODE into all callees.  */
3967
3968 int
3969 estimate_growth (struct cgraph_node *node)
3970 {
3971   struct growth_data d = { node, false, false, 0 };
3972   struct inline_summary *info = inline_summaries->get (node);
3973
3974   node->call_for_symbol_and_aliases (do_estimate_growth_1, &d, true);
3975
3976   /* For self recursive functions the growth estimation really should be
3977      infinity.  We don't want to return very large values because the growth
3978      plays various roles in badness computation fractions.  Be sure to not
3979      return zero or negative growths. */
3980   if (d.self_recursive)
3981     d.growth = d.growth < info->size ? info->size : d.growth;
3982   else if (DECL_EXTERNAL (node->decl) || d.uninlinable)
3983     ;
3984   else
3985     {
3986       if (node->will_be_removed_from_program_if_no_direct_calls_p ())
3987         d.growth -= info->size;
3988       /* COMDAT functions are very often not shared across multiple units
3989          since they come from various template instantiations.
3990          Take this into account.  */
3991       else if (DECL_COMDAT (node->decl)
3992                && node->can_remove_if_no_direct_calls_p ())
3993         d.growth -= (info->size
3994                      * (100 - PARAM_VALUE (PARAM_COMDAT_SHARING_PROBABILITY))
3995                      + 50) / 100;
3996     }
3997
3998   return d.growth;
3999 }
4000
4001 /* Verify if there are fewer than MAX_CALLERS.  */
4002
4003 static bool
4004 check_callers (cgraph_node *node, int *max_callers)
4005 {
4006   ipa_ref *ref;
4007
4008   if (!node->can_remove_if_no_direct_calls_and_refs_p ())
4009     return true;
4010
4011   for (cgraph_edge *e = node->callers; e; e = e->next_caller)
4012     {
4013       (*max_callers)--;
4014       if (!*max_callers
4015           || cgraph_inline_failed_type (e->inline_failed) == CIF_FINAL_ERROR)
4016         return true;
4017     }
4018
4019   FOR_EACH_ALIAS (node, ref)
4020     if (check_callers (dyn_cast <cgraph_node *> (ref->referring), max_callers))
4021       return true;
4022
4023   return false;
4024 }
4025
4026
4027 /* Make cheap estimation if growth of NODE is likely positive knowing
4028    EDGE_GROWTH of one particular edge.
4029    We assume that most of other edges will have similar growth
4030    and skip computation if there are too many callers.  */
4031
4032 bool
4033 growth_likely_positive (struct cgraph_node *node,
4034                         int edge_growth)
4035 {
4036   int max_callers;
4037   struct cgraph_edge *e;
4038   gcc_checking_assert (edge_growth > 0);
4039
4040   /* First quickly check if NODE is removable at all.  */
4041   if (DECL_EXTERNAL (node->decl))
4042     return true;
4043   if (!node->can_remove_if_no_direct_calls_and_refs_p ()
4044       || node->address_taken)
4045     return true;
4046
4047   max_callers = inline_summaries->get (node)->size * 4 / edge_growth + 2;
4048
4049   for (e = node->callers; e; e = e->next_caller)
4050     {
4051       max_callers--;
4052       if (!max_callers
4053           || cgraph_inline_failed_type (e->inline_failed) == CIF_FINAL_ERROR)
4054         return true;
4055     }
4056
4057   ipa_ref *ref;
4058   FOR_EACH_ALIAS (node, ref)
4059     if (check_callers (dyn_cast <cgraph_node *> (ref->referring), &max_callers))
4060       return true;
4061
4062   /* Unlike for functions called once, we play unsafe with
4063      COMDATs.  We can allow that since we know functions
4064      in consideration are small (and thus risk is small) and
4065      moreover grow estimates already accounts that COMDAT
4066      functions may or may not disappear when eliminated from
4067      current unit. With good probability making aggressive
4068      choice in all units is going to make overall program
4069      smaller.  */
4070   if (DECL_COMDAT (node->decl))
4071     {
4072       if (!node->can_remove_if_no_direct_calls_p ())
4073         return true;
4074     }
4075   else if (!node->will_be_removed_from_program_if_no_direct_calls_p ())
4076     return true;
4077
4078   return estimate_growth (node) > 0;
4079 }
4080
4081
4082 /* This function performs intraprocedural analysis in NODE that is required to
4083    inline indirect calls.  */
4084
4085 static void
4086 inline_indirect_intraprocedural_analysis (struct cgraph_node *node)
4087 {
4088   ipa_analyze_node (node);
4089   if (dump_file && (dump_flags & TDF_DETAILS))
4090     {
4091       ipa_print_node_params (dump_file, node);
4092       ipa_print_node_jump_functions (dump_file, node);
4093     }
4094 }
4095
4096
4097 /* Note function body size.  */
4098
4099 void
4100 inline_analyze_function (struct cgraph_node *node)
4101 {
4102   push_cfun (DECL_STRUCT_FUNCTION (node->decl));
4103
4104   if (dump_file)
4105     fprintf (dump_file, "\nAnalyzing function: %s/%u\n",
4106              node->name (), node->order);
4107   if (opt_for_fn (node->decl, optimize) && !node->thunk.thunk_p)
4108     inline_indirect_intraprocedural_analysis (node);
4109   compute_inline_parameters (node, false);
4110   if (!optimize)
4111     {
4112       struct cgraph_edge *e;
4113       for (e = node->callees; e; e = e->next_callee)
4114         e->inline_failed = CIF_FUNCTION_NOT_OPTIMIZED;
4115       for (e = node->indirect_calls; e; e = e->next_callee)
4116         e->inline_failed = CIF_FUNCTION_NOT_OPTIMIZED;
4117     }
4118
4119   pop_cfun ();
4120 }
4121
4122
4123 /* Called when new function is inserted to callgraph late.  */
4124
4125 void
4126 inline_summary_t::insert (struct cgraph_node *node, inline_summary *)
4127 {
4128   inline_analyze_function (node);
4129 }
4130
4131 /* Note function body size.  */
4132
4133 void
4134 inline_generate_summary (void)
4135 {
4136   struct cgraph_node *node;
4137
4138   FOR_EACH_DEFINED_FUNCTION (node)
4139     if (DECL_STRUCT_FUNCTION (node->decl))
4140       node->local.versionable = tree_versionable_function_p (node->decl);
4141
4142   /* When not optimizing, do not bother to analyze.  Inlining is still done
4143      because edge redirection needs to happen there.  */
4144   if (!optimize && !flag_generate_lto && !flag_generate_offload && !flag_wpa)
4145     return;
4146
4147   if (!inline_summaries)
4148     inline_summaries = (inline_summary_t*) inline_summary_t::create_ggc (symtab);
4149
4150   inline_summaries->enable_insertion_hook ();
4151
4152   ipa_register_cgraph_hooks ();
4153   inline_free_summary ();
4154
4155   FOR_EACH_DEFINED_FUNCTION (node)
4156     if (!node->alias)
4157       inline_analyze_function (node);
4158 }
4159
4160
4161 /* Read predicate from IB.  */
4162
4163 static struct predicate
4164 read_predicate (struct lto_input_block *ib)
4165 {
4166   struct predicate out;
4167   clause_t clause;
4168   int k = 0;
4169
4170   do
4171     {
4172       gcc_assert (k <= MAX_CLAUSES);
4173       clause = out.clause[k++] = streamer_read_uhwi (ib);
4174     }
4175   while (clause);
4176
4177   /* Zero-initialize the remaining clauses in OUT.  */
4178   while (k <= MAX_CLAUSES)
4179     out.clause[k++] = 0;
4180
4181   return out;
4182 }
4183
4184
4185 /* Write inline summary for edge E to OB.  */
4186
4187 static void
4188 read_inline_edge_summary (struct lto_input_block *ib, struct cgraph_edge *e)
4189 {
4190   struct inline_edge_summary *es = inline_edge_summary (e);
4191   struct predicate p;
4192   int length, i;
4193
4194   es->call_stmt_size = streamer_read_uhwi (ib);
4195   es->call_stmt_time = streamer_read_uhwi (ib);
4196   es->loop_depth = streamer_read_uhwi (ib);
4197   p = read_predicate (ib);
4198   edge_set_predicate (e, &p);
4199   length = streamer_read_uhwi (ib);
4200   if (length)
4201     {
4202       es->param.safe_grow_cleared (length);
4203       for (i = 0; i < length; i++)
4204         es->param[i].change_prob = streamer_read_uhwi (ib);
4205     }
4206 }
4207
4208
4209 /* Stream in inline summaries from the section.  */
4210
4211 static void
4212 inline_read_section (struct lto_file_decl_data *file_data, const char *data,
4213                      size_t len)
4214 {
4215   const struct lto_function_header *header =
4216     (const struct lto_function_header *) data;
4217   const int cfg_offset = sizeof (struct lto_function_header);
4218   const int main_offset = cfg_offset + header->cfg_size;
4219   const int string_offset = main_offset + header->main_size;
4220   struct data_in *data_in;
4221   unsigned int i, count2, j;
4222   unsigned int f_count;
4223
4224   lto_input_block ib ((const char *) data + main_offset, header->main_size,
4225                       file_data->mode_table);
4226
4227   data_in =
4228     lto_data_in_create (file_data, (const char *) data + string_offset,
4229                         header->string_size, vNULL);
4230   f_count = streamer_read_uhwi (&ib);
4231   for (i = 0; i < f_count; i++)
4232     {
4233       unsigned int index;
4234       struct cgraph_node *node;
4235       struct inline_summary *info;
4236       lto_symtab_encoder_t encoder;
4237       struct bitpack_d bp;
4238       struct cgraph_edge *e;
4239       predicate p;
4240
4241       index = streamer_read_uhwi (&ib);
4242       encoder = file_data->symtab_node_encoder;
4243       node = dyn_cast<cgraph_node *> (lto_symtab_encoder_deref (encoder,
4244                                                                 index));
4245       info = inline_summaries->get (node);
4246
4247       info->estimated_stack_size
4248         = info->estimated_self_stack_size = streamer_read_uhwi (&ib);
4249       info->size = info->self_size = streamer_read_uhwi (&ib);
4250       info->time = info->self_time = streamer_read_uhwi (&ib);
4251
4252       bp = streamer_read_bitpack (&ib);
4253       info->inlinable = bp_unpack_value (&bp, 1);
4254       info->contains_cilk_spawn = bp_unpack_value (&bp, 1);
4255       info->fp_expressions = bp_unpack_value (&bp, 1);
4256
4257       count2 = streamer_read_uhwi (&ib);
4258       gcc_assert (!info->conds);
4259       for (j = 0; j < count2; j++)
4260         {
4261           struct condition c;
4262           c.operand_num = streamer_read_uhwi (&ib);
4263           c.code = (enum tree_code) streamer_read_uhwi (&ib);
4264           c.val = stream_read_tree (&ib, data_in);
4265           bp = streamer_read_bitpack (&ib);
4266           c.agg_contents = bp_unpack_value (&bp, 1);
4267           c.by_ref = bp_unpack_value (&bp, 1);
4268           if (c.agg_contents)
4269             c.offset = streamer_read_uhwi (&ib);
4270           vec_safe_push (info->conds, c);
4271         }
4272       count2 = streamer_read_uhwi (&ib);
4273       gcc_assert (!info->entry);
4274       for (j = 0; j < count2; j++)
4275         {
4276           struct size_time_entry e;
4277
4278           e.size = streamer_read_uhwi (&ib);
4279           e.time = streamer_read_uhwi (&ib);
4280           e.predicate = read_predicate (&ib);
4281
4282           vec_safe_push (info->entry, e);
4283         }
4284
4285       p = read_predicate (&ib);
4286       set_hint_predicate (&info->loop_iterations, p);
4287       p = read_predicate (&ib);
4288       set_hint_predicate (&info->loop_stride, p);
4289       p = read_predicate (&ib);
4290       set_hint_predicate (&info->array_index, p);
4291       for (e = node->callees; e; e = e->next_callee)
4292         read_inline_edge_summary (&ib, e);
4293       for (e = node->indirect_calls; e; e = e->next_callee)
4294         read_inline_edge_summary (&ib, e);
4295     }
4296
4297   lto_free_section_data (file_data, LTO_section_inline_summary, NULL, data,
4298                          len);
4299   lto_data_in_delete (data_in);
4300 }
4301
4302
4303 /* Read inline summary.  Jump functions are shared among ipa-cp
4304    and inliner, so when ipa-cp is active, we don't need to write them
4305    twice.  */
4306
4307 void
4308 inline_read_summary (void)
4309 {
4310   struct lto_file_decl_data **file_data_vec = lto_get_file_decl_data ();
4311   struct lto_file_decl_data *file_data;
4312   unsigned int j = 0;
4313
4314   inline_summary_alloc ();
4315
4316   while ((file_data = file_data_vec[j++]))
4317     {
4318       size_t len;
4319       const char *data = lto_get_section_data (file_data,
4320                                                LTO_section_inline_summary,
4321                                                NULL, &len);
4322       if (data)
4323         inline_read_section (file_data, data, len);
4324       else
4325         /* Fatal error here.  We do not want to support compiling ltrans units
4326            with different version of compiler or different flags than the WPA
4327            unit, so this should never happen.  */
4328         fatal_error (input_location,
4329                      "ipa inline summary is missing in input file");
4330     }
4331   if (optimize)
4332     {
4333       ipa_register_cgraph_hooks ();
4334       if (!flag_ipa_cp)
4335         ipa_prop_read_jump_functions ();
4336     }
4337
4338   gcc_assert (inline_summaries);
4339   inline_summaries->enable_insertion_hook ();
4340 }
4341
4342
4343 /* Write predicate P to OB.  */
4344
4345 static void
4346 write_predicate (struct output_block *ob, struct predicate *p)
4347 {
4348   int j;
4349   if (p)
4350     for (j = 0; p->clause[j]; j++)
4351       {
4352         gcc_assert (j < MAX_CLAUSES);
4353         streamer_write_uhwi (ob, p->clause[j]);
4354       }
4355   streamer_write_uhwi (ob, 0);
4356 }
4357
4358
4359 /* Write inline summary for edge E to OB.  */
4360
4361 static void
4362 write_inline_edge_summary (struct output_block *ob, struct cgraph_edge *e)
4363 {
4364   struct inline_edge_summary *es = inline_edge_summary (e);
4365   int i;
4366
4367   streamer_write_uhwi (ob, es->call_stmt_size);
4368   streamer_write_uhwi (ob, es->call_stmt_time);
4369   streamer_write_uhwi (ob, es->loop_depth);
4370   write_predicate (ob, es->predicate);
4371   streamer_write_uhwi (ob, es->param.length ());
4372   for (i = 0; i < (int) es->param.length (); i++)
4373     streamer_write_uhwi (ob, es->param[i].change_prob);
4374 }
4375
4376
4377 /* Write inline summary for node in SET.
4378    Jump functions are shared among ipa-cp and inliner, so when ipa-cp is
4379    active, we don't need to write them twice.  */
4380
4381 void
4382 inline_write_summary (void)
4383 {
4384   struct cgraph_node *node;
4385   struct output_block *ob = create_output_block (LTO_section_inline_summary);
4386   lto_symtab_encoder_t encoder = ob->decl_state->symtab_node_encoder;
4387   unsigned int count = 0;
4388   int i;
4389
4390   for (i = 0; i < lto_symtab_encoder_size (encoder); i++)
4391     {
4392       symtab_node *snode = lto_symtab_encoder_deref (encoder, i);
4393       cgraph_node *cnode = dyn_cast <cgraph_node *> (snode);
4394       if (cnode && cnode->definition && !cnode->alias)
4395         count++;
4396     }
4397   streamer_write_uhwi (ob, count);
4398
4399   for (i = 0; i < lto_symtab_encoder_size (encoder); i++)
4400     {
4401       symtab_node *snode = lto_symtab_encoder_deref (encoder, i);
4402       cgraph_node *cnode = dyn_cast <cgraph_node *> (snode);
4403       if (cnode && (node = cnode)->definition && !node->alias)
4404         {
4405           struct inline_summary *info = inline_summaries->get (node);
4406           struct bitpack_d bp;
4407           struct cgraph_edge *edge;
4408           int i;
4409           size_time_entry *e;
4410           struct condition *c;
4411
4412           streamer_write_uhwi (ob,
4413                                lto_symtab_encoder_encode (encoder,
4414
4415                                                           node));
4416           streamer_write_hwi (ob, info->estimated_self_stack_size);
4417           streamer_write_hwi (ob, info->self_size);
4418           streamer_write_hwi (ob, info->self_time);
4419           bp = bitpack_create (ob->main_stream);
4420           bp_pack_value (&bp, info->inlinable, 1);
4421           bp_pack_value (&bp, info->contains_cilk_spawn, 1);
4422           bp_pack_value (&bp, info->fp_expressions, 1);
4423           streamer_write_bitpack (&bp);
4424           streamer_write_uhwi (ob, vec_safe_length (info->conds));
4425           for (i = 0; vec_safe_iterate (info->conds, i, &c); i++)
4426             {
4427               streamer_write_uhwi (ob, c->operand_num);
4428               streamer_write_uhwi (ob, c->code);
4429               stream_write_tree (ob, c->val, true);
4430               bp = bitpack_create (ob->main_stream);
4431               bp_pack_value (&bp, c->agg_contents, 1);
4432               bp_pack_value (&bp, c->by_ref, 1);
4433               streamer_write_bitpack (&bp);
4434               if (c->agg_contents)
4435                 streamer_write_uhwi (ob, c->offset);
4436             }
4437           streamer_write_uhwi (ob, vec_safe_length (info->entry));
4438           for (i = 0; vec_safe_iterate (info->entry, i, &e); i++)
4439             {
4440               streamer_write_uhwi (ob, e->size);
4441               streamer_write_uhwi (ob, e->time);
4442               write_predicate (ob, &e->predicate);
4443             }
4444           write_predicate (ob, info->loop_iterations);
4445           write_predicate (ob, info->loop_stride);
4446           write_predicate (ob, info->array_index);
4447           for (edge = node->callees; edge; edge = edge->next_callee)
4448             write_inline_edge_summary (ob, edge);
4449           for (edge = node->indirect_calls; edge; edge = edge->next_callee)
4450             write_inline_edge_summary (ob, edge);
4451         }
4452     }
4453   streamer_write_char_stream (ob->main_stream, 0);
4454   produce_asm (ob, NULL);
4455   destroy_output_block (ob);
4456
4457   if (optimize && !flag_ipa_cp)
4458     ipa_prop_write_jump_functions ();
4459 }
4460
4461
4462 /* Release inline summary.  */
4463
4464 void
4465 inline_free_summary (void)
4466 {
4467   struct cgraph_node *node;
4468   if (edge_removal_hook_holder)
4469     symtab->remove_edge_removal_hook (edge_removal_hook_holder);
4470   edge_removal_hook_holder = NULL;
4471   if (edge_duplication_hook_holder)
4472     symtab->remove_edge_duplication_hook (edge_duplication_hook_holder);
4473   edge_duplication_hook_holder = NULL;
4474   if (!inline_edge_summary_vec.exists ())
4475     return;
4476   FOR_EACH_DEFINED_FUNCTION (node)
4477     if (!node->alias)
4478       reset_inline_summary (node, inline_summaries->get (node));
4479   inline_summaries->release ();
4480   inline_summaries = NULL;
4481   inline_edge_summary_vec.release ();
4482   edge_predicate_pool.release ();
4483 }