gcc/ipa-inline-analysis.c

   1 /* Inlining decision heuristics.
   2    Copyright (C) 2003-2013 Free Software Foundation, Inc.
   3    Contributed by Jan Hubicka
   4
   5 This file is part of GCC.
   6
   7 GCC is free software; you can redistribute it and/or modify it under
   8 the terms of the GNU General Public License as published by the Free
   9 Software Foundation; either version 3, or (at your option) any later
  10 version.
  11
  12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  14 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  15 for more details.
  16
  17 You should have received a copy of the GNU General Public License
  18 along with GCC; see the file COPYING3.  If not see
  19 <http://www.gnu.org/licenses/>.  */
  20
  21 /* Analysis used by the inliner and other passes limiting code size growth.
  22
  23    We estimate for each function
  24      - function body size
  25      - average function execution time
  26      - inlining size benefit (that is how much of function body size
  27        and its call sequence is expected to disappear by inlining)
  28      - inlining time benefit
  29      - function frame size
  30    For each call
  31      - call statement size and time
  32
  33    inlinie_summary datastructures store above information locally (i.e.
  34    parameters of the function itself) and globally (i.e. parameters of
  35    the function created by applying all the inline decisions already
  36    present in the callgraph).
  37
  38    We provide accestor to the inline_summary datastructure and
  39    basic logic updating the parameters when inlining is performed.
  40
  41    The summaries are context sensitive.  Context means
  42      1) partial assignment of known constant values of operands
  43      2) whether function is inlined into the call or not.
  44    It is easy to add more variants.  To represent function size and time
  45    that depends on context (i.e. it is known to be optimized away when
  46    context is known either by inlining or from IP-CP and clonning),
  47    we use predicates. Predicates are logical formulas in
  48    conjunctive-disjunctive form consisting of clauses. Clauses are bitmaps
  49    specifying what conditions must be true. Conditions are simple test
  50    of the form described above.
  51
  52    In order to make predicate (possibly) true, all of its clauses must
  53    be (possibly) true. To make clause (possibly) true, one of conditions
  54    it mentions must be (possibly) true.  There are fixed bounds on
  55    number of clauses and conditions and all the manipulation functions
  56    are conservative in positive direction. I.e. we may lose precision
  57    by thinking that predicate may be true even when it is not.
  58
  59    estimate_edge_size and estimate_edge_growth can be used to query
  60    function size/time in the given context.  inline_merge_summary merges
  61    properties of caller and callee after inlining.
  62
  63    Finally pass_inline_parameters is exported.  This is used to drive
  64    computation of function parameters used by the early inliner. IPA
  65    inlined performs analysis via its analyze_function method. */
  66
  67 #include "config.h"
  68 #include "system.h"
  69 #include "coretypes.h"
  70 #include "tm.h"
  71 #include "tree.h"
  72 #include "tree-inline.h"
  73 #include "langhooks.h"
  74 #include "flags.h"
  75 #include "diagnostic.h"
  76 #include "gimple-pretty-print.h"
  77 #include "params.h"
  78 #include "tree-pass.h"
  79 #include "coverage.h"
  80 #include "ggc.h"
  81 #include "gimple.h"
  82 #include "gimple-ssa.h"
  83 #include "tree-cfg.h"
  84 #include "tree-phinodes.h"
  85 #include "ssa-iterators.h"
  86 #include "tree-ssanames.h"
  87 #include "tree-ssa-loop-niter.h"
  88 #include "tree-ssa-loop.h"
  89 #include "ipa-prop.h"
  90 #include "lto-streamer.h"
  91 #include "data-streamer.h"
  92 #include "tree-streamer.h"
  93 #include "ipa-inline.h"
  94 #include "alloc-pool.h"
  95 #include "cfgloop.h"
  96 #include "tree-scalar-evolution.h"
  97 #include "ipa-utils.h"
  98
  99 /* Estimate runtime of function can easilly run into huge numbers with many
 100    nested loops.  Be sure we can compute time * INLINE_SIZE_SCALE * 2 in an
 101    integer.  For anything larger we use gcov_type.  */
 102 #define MAX_TIME 500000
 103
 104 /* Number of bits in integer, but we really want to be stable across different
 105    hosts.  */
 106 #define NUM_CONDITIONS 32
 107
 108 enum predicate_conditions
 109 {
 110   predicate_false_condition = 0,
 111   predicate_not_inlined_condition = 1,
 112   predicate_first_dynamic_condition = 2
 113 };
 114
 115 /* Special condition code we use to represent test that operand is compile time
 116    constant.  */
 117 #define IS_NOT_CONSTANT ERROR_MARK
 118 /* Special condition code we use to represent test that operand is not changed
 119    across invocation of the function.  When operand IS_NOT_CONSTANT it is always
 120    CHANGED, however i.e. loop invariants can be NOT_CHANGED given percentage
 121    of executions even when they are not compile time constants.  */
 122 #define CHANGED IDENTIFIER_NODE
 123
 124 /* Holders of ipa cgraph hooks: */
 125 static struct cgraph_node_hook_list *function_insertion_hook_holder;
 126 static struct cgraph_node_hook_list *node_removal_hook_holder;
 127 static struct cgraph_2node_hook_list *node_duplication_hook_holder;
 128 static struct cgraph_2edge_hook_list *edge_duplication_hook_holder;
 129 static struct cgraph_edge_hook_list *edge_removal_hook_holder;
 130 static void inline_node_removal_hook (struct cgraph_node *, void *);
 131 static void inline_node_duplication_hook (struct cgraph_node *,
 132                                           struct cgraph_node *, void *);
 133 static void inline_edge_removal_hook (struct cgraph_edge *, void *);
 134 static void inline_edge_duplication_hook (struct cgraph_edge *,
 135                                           struct cgraph_edge *, void *);
 136
 137 /* VECtor holding inline summaries.
 138    In GGC memory because conditions might point to constant trees.  */
 139 vec<inline_summary_t, va_gc> *inline_summary_vec;
 140 vec<inline_edge_summary_t> inline_edge_summary_vec;
 141
 142 /* Cached node/edge growths.  */
 143 vec<int> node_growth_cache;
 144 vec<edge_growth_cache_entry> edge_growth_cache;
 145
 146 /* Edge predicates goes here.  */
 147 static alloc_pool edge_predicate_pool;
 148
 149 /* Return true predicate (tautology).
 150    We represent it by empty list of clauses.  */
 151
 152 static inline struct predicate
 153 true_predicate (void)
 154 {
 155   struct predicate p;
 156   p.clause[0] = 0;
 157   return p;
 158 }
 159
 160
 161 /* Return predicate testing single condition number COND.  */
 162
 163 static inline struct predicate
 164 single_cond_predicate (int cond)
 165 {
 166   struct predicate p;
 167   p.clause[0] = 1 << cond;
 168   p.clause[1] = 0;
 169   return p;
 170 }
 171
 172
 173 /* Return false predicate.  First clause require false condition.  */
 174
 175 static inline struct predicate
 176 false_predicate (void)
 177 {
 178   return single_cond_predicate (predicate_false_condition);
 179 }
 180
 181
 182 /* Return true if P is (false).  */
 183
 184 static inline bool
 185 true_predicate_p (struct predicate *p)
 186 {
 187   return !p->clause[0];
 188 }
 189
 190
 191 /* Return true if P is (false).  */
 192
 193 static inline bool
 194 false_predicate_p (struct predicate *p)
 195 {
 196   if (p->clause[0] == (1 << predicate_false_condition))
 197     {
 198       gcc_checking_assert (!p->clause[1]
 199                            && p->clause[0] == 1 << predicate_false_condition);
 200       return true;
 201     }
 202   return false;
 203 }
 204
 205
 206 /* Return predicate that is set true when function is not inlined.  */
 207
 208 static inline struct predicate
 209 not_inlined_predicate (void)
 210 {
 211   return single_cond_predicate (predicate_not_inlined_condition);
 212 }
 213
 214 /* Simple description of whether a memory load or a condition refers to a load
 215    from an aggregate and if so, how and where from in the aggregate.
 216    Individual fields have the same meaning like fields with the same name in
 217    struct condition.  */
 218
 219 struct agg_position_info
 220 {
 221   HOST_WIDE_INT offset;
 222   bool agg_contents;
 223   bool by_ref;
 224 };
 225
 226 /* Add condition to condition list CONDS.  AGGPOS describes whether the used
 227    oprand is loaded from an aggregate and where in the aggregate it is.  It can
 228    be NULL, which means this not a load from an aggregate.  */
 229
 230 static struct predicate
 231 add_condition (struct inline_summary *summary, int operand_num,
 232                struct agg_position_info *aggpos,
 233                enum tree_code code, tree val)
 234 {
 235   int i;
 236   struct condition *c;
 237   struct condition new_cond;
 238   HOST_WIDE_INT offset;
 239   bool agg_contents, by_ref;
 240
 241   if (aggpos)
 242     {
 243       offset = aggpos->offset;
 244       agg_contents = aggpos->agg_contents;
 245       by_ref = aggpos->by_ref;
 246     }
 247   else
 248     {
 249       offset = 0;
 250       agg_contents = false;
 251       by_ref = false;
 252     }
 253
 254   gcc_checking_assert (operand_num >= 0);
 255   for (i = 0; vec_safe_iterate (summary->conds, i, &c); i++)
 256     {
 257       if (c->operand_num == operand_num
 258           && c->code == code
 259           && c->val == val
 260           && c->agg_contents == agg_contents
 261           && (!agg_contents || (c->offset == offset && c->by_ref == by_ref)))
 262         return single_cond_predicate (i + predicate_first_dynamic_condition);
 263     }
 264   /* Too many conditions.  Give up and return constant true.  */
 265   if (i == NUM_CONDITIONS - predicate_first_dynamic_condition)
 266     return true_predicate ();
 267
 268   new_cond.operand_num = operand_num;
 269   new_cond.code = code;
 270   new_cond.val = val;
 271   new_cond.agg_contents = agg_contents;
 272   new_cond.by_ref = by_ref;
 273   new_cond.offset = offset;
 274   vec_safe_push (summary->conds, new_cond);
 275   return single_cond_predicate (i + predicate_first_dynamic_condition);
 276 }
 277
 278
 279 /* Add clause CLAUSE into the predicate P.  */
 280
 281 static inline void
 282 add_clause (conditions conditions, struct predicate *p, clause_t clause)
 283 {
 284   int i;
 285   int i2;
 286   int insert_here = -1;
 287   int c1, c2;
 288
 289   /* True clause.  */
 290   if (!clause)
 291     return;
 292
 293   /* False clause makes the whole predicate false.  Kill the other variants.  */
 294   if (clause == (1 << predicate_false_condition))
 295     {
 296       p->clause[0] = (1 << predicate_false_condition);
 297       p->clause[1] = 0;
 298       return;
 299     }
 300   if (false_predicate_p (p))
 301     return;
 302
 303   /* No one should be sily enough to add false into nontrivial clauses.  */
 304   gcc_checking_assert (!(clause & (1 << predicate_false_condition)));
 305
 306   /* Look where to insert the clause.  At the same time prune out
 307      clauses of P that are implied by the new clause and thus
 308      redundant.  */
 309   for (i = 0, i2 = 0; i <= MAX_CLAUSES; i++)
 310     {
 311       p->clause[i2] = p->clause[i];
 312
 313       if (!p->clause[i])
 314         break;
 315
 316       /* If p->clause[i] implies clause, there is nothing to add.  */
 317       if ((p->clause[i] & clause) == p->clause[i])
 318         {
 319           /* We had nothing to add, none of clauses should've become
 320              redundant.  */
 321           gcc_checking_assert (i == i2);
 322           return;
 323         }
 324
 325       if (p->clause[i] < clause && insert_here < 0)
 326         insert_here = i2;
 327
 328       /* If clause implies p->clause[i], then p->clause[i] becomes redundant.
 329          Otherwise the p->clause[i] has to stay.  */
 330       if ((p->clause[i] & clause) != clause)
 331         i2++;
 332     }
 333
 334   /* Look for clauses that are obviously true.  I.e.
 335      op0 == 5 || op0 != 5.  */
 336   for (c1 = predicate_first_dynamic_condition; c1 < NUM_CONDITIONS; c1++)
 337     {
 338       condition *cc1;
 339       if (!(clause & (1 << c1)))
 340         continue;
 341       cc1 = &(*conditions)[c1 - predicate_first_dynamic_condition];
 342       /* We have no way to represent !CHANGED and !IS_NOT_CONSTANT
 343          and thus there is no point for looking for them.  */
 344       if (cc1->code == CHANGED || cc1->code == IS_NOT_CONSTANT)
 345         continue;
 346       for (c2 = c1 + 1; c2 < NUM_CONDITIONS; c2++)
 347         if (clause & (1 << c2))
 348           {
 349             condition *cc1 =
 350               &(*conditions)[c1 - predicate_first_dynamic_condition];
 351             condition *cc2 =
 352               &(*conditions)[c2 - predicate_first_dynamic_condition];
 353             if (cc1->operand_num == cc2->operand_num
 354                 && cc1->val == cc2->val
 355                 && cc2->code != IS_NOT_CONSTANT
 356                 && cc2->code != CHANGED
 357                 && cc1->code == invert_tree_comparison
 358                                 (cc2->code,
 359                                  HONOR_NANS (TYPE_MODE (TREE_TYPE (cc1->val)))))
 360               return;
 361           }
 362     }
 363
 364
 365   /* We run out of variants.  Be conservative in positive direction.  */
 366   if (i2 == MAX_CLAUSES)
 367     return;
 368   /* Keep clauses in decreasing order. This makes equivalence testing easy.  */
 369   p->clause[i2 + 1] = 0;
 370   if (insert_here >= 0)
 371     for (; i2 > insert_here; i2--)
 372       p->clause[i2] = p->clause[i2 - 1];
 373   else
 374     insert_here = i2;
 375   p->clause[insert_here] = clause;
 376 }
 377
 378
 379 /* Return P & P2.  */
 380
 381 static struct predicate
 382 and_predicates (conditions conditions,
 383                 struct predicate *p, struct predicate *p2)
 384 {
 385   struct predicate out = *p;
 386   int i;
 387
 388   /* Avoid busy work.  */
 389   if (false_predicate_p (p2) || true_predicate_p (p))
 390     return *p2;
 391   if (false_predicate_p (p) || true_predicate_p (p2))
 392     return *p;
 393
 394   /* See how far predicates match.  */
 395   for (i = 0; p->clause[i] && p->clause[i] == p2->clause[i]; i++)
 396     {
 397       gcc_checking_assert (i < MAX_CLAUSES);
 398     }
 399
 400   /* Combine the predicates rest.  */
 401   for (; p2->clause[i]; i++)
 402     {
 403       gcc_checking_assert (i < MAX_CLAUSES);
 404       add_clause (conditions, &out, p2->clause[i]);
 405     }
 406   return out;
 407 }
 408
 409
 410 /* Return true if predicates are obviously equal.  */
 411
 412 static inline bool
 413 predicates_equal_p (struct predicate *p, struct predicate *p2)
 414 {
 415   int i;
 416   for (i = 0; p->clause[i]; i++)
 417     {
 418       gcc_checking_assert (i < MAX_CLAUSES);
 419       gcc_checking_assert (p->clause[i] > p->clause[i + 1]);
 420       gcc_checking_assert (!p2->clause[i]
 421                            || p2->clause[i] > p2->clause[i + 1]);
 422       if (p->clause[i] != p2->clause[i])
 423         return false;
 424     }
 425   return !p2->clause[i];
 426 }
 427
 428
 429 /* Return P | P2.  */
 430
 431 static struct predicate
 432 or_predicates (conditions conditions,
 433                struct predicate *p, struct predicate *p2)
 434 {
 435   struct predicate out = true_predicate ();
 436   int i, j;
 437
 438   /* Avoid busy work.  */
 439   if (false_predicate_p (p2) || true_predicate_p (p))
 440     return *p;
 441   if (false_predicate_p (p) || true_predicate_p (p2))
 442     return *p2;
 443   if (predicates_equal_p (p, p2))
 444     return *p;
 445
 446   /* OK, combine the predicates.  */
 447   for (i = 0; p->clause[i]; i++)
 448     for (j = 0; p2->clause[j]; j++)
 449       {
 450         gcc_checking_assert (i < MAX_CLAUSES && j < MAX_CLAUSES);
 451         add_clause (conditions, &out, p->clause[i] | p2->clause[j]);
 452       }
 453   return out;
 454 }
 455
 456
 457 /* Having partial truth assignment in POSSIBLE_TRUTHS, return false
 458    if predicate P is known to be false.  */
 459
 460 static bool
 461 evaluate_predicate (struct predicate *p, clause_t possible_truths)
 462 {
 463   int i;
 464
 465   /* True remains true.  */
 466   if (true_predicate_p (p))
 467     return true;
 468
 469   gcc_assert (!(possible_truths & (1 << predicate_false_condition)));
 470
 471   /* See if we can find clause we can disprove.  */
 472   for (i = 0; p->clause[i]; i++)
 473     {
 474       gcc_checking_assert (i < MAX_CLAUSES);
 475       if (!(p->clause[i] & possible_truths))
 476         return false;
 477     }
 478   return true;
 479 }
 480
 481 /* Return the probability in range 0...REG_BR_PROB_BASE that the predicated
 482    instruction will be recomputed per invocation of the inlined call.  */
 483
 484 static int
 485 predicate_probability (conditions conds,
 486                        struct predicate *p, clause_t possible_truths,
 487                        vec<inline_param_summary_t> inline_param_summary)
 488 {
 489   int i;
 490   int combined_prob = REG_BR_PROB_BASE;
 491
 492   /* True remains true.  */
 493   if (true_predicate_p (p))
 494     return REG_BR_PROB_BASE;
 495
 496   if (false_predicate_p (p))
 497     return 0;
 498
 499   gcc_assert (!(possible_truths & (1 << predicate_false_condition)));
 500
 501   /* See if we can find clause we can disprove.  */
 502   for (i = 0; p->clause[i]; i++)
 503     {
 504       gcc_checking_assert (i < MAX_CLAUSES);
 505       if (!(p->clause[i] & possible_truths))
 506         return 0;
 507       else
 508         {
 509           int this_prob = 0;
 510           int i2;
 511           if (!inline_param_summary.exists ())
 512             return REG_BR_PROB_BASE;
 513           for (i2 = 0; i2 < NUM_CONDITIONS; i2++)
 514             if ((p->clause[i] & possible_truths) & (1 << i2))
 515               {
 516                 if (i2 >= predicate_first_dynamic_condition)
 517                   {
 518                     condition *c =
 519                       &(*conds)[i2 - predicate_first_dynamic_condition];
 520                     if (c->code == CHANGED
 521                         && (c->operand_num <
 522                             (int) inline_param_summary.length ()))
 523                       {
 524                         int iprob =
 525                           inline_param_summary[c->operand_num].change_prob;
 526                         this_prob = MAX (this_prob, iprob);
 527                       }
 528                     else
 529                       this_prob = REG_BR_PROB_BASE;
 530                   }
 531                 else
 532                   this_prob = REG_BR_PROB_BASE;
 533               }
 534           combined_prob = MIN (this_prob, combined_prob);
 535           if (!combined_prob)
 536             return 0;
 537         }
 538     }
 539   return combined_prob;
 540 }
 541
 542
 543 /* Dump conditional COND.  */
 544
 545 static void
 546 dump_condition (FILE *f, conditions conditions, int cond)
 547 {
 548   condition *c;
 549   if (cond == predicate_false_condition)
 550     fprintf (f, "false");
 551   else if (cond == predicate_not_inlined_condition)
 552     fprintf (f, "not inlined");
 553   else
 554     {
 555       c = &(*conditions)[cond - predicate_first_dynamic_condition];
 556       fprintf (f, "op%i", c->operand_num);
 557       if (c->agg_contents)
 558         fprintf (f, "[%soffset: " HOST_WIDE_INT_PRINT_DEC "]",
 559                  c->by_ref ? "ref " : "", c->offset);
 560       if (c->code == IS_NOT_CONSTANT)
 561         {
 562           fprintf (f, " not constant");
 563           return;
 564         }
 565       if (c->code == CHANGED)
 566         {
 567           fprintf (f, " changed");
 568           return;
 569         }
 570       fprintf (f, " %s ", op_symbol_code (c->code));
 571       print_generic_expr (f, c->val, 1);
 572     }
 573 }
 574
 575
 576 /* Dump clause CLAUSE.  */
 577
 578 static void
 579 dump_clause (FILE *f, conditions conds, clause_t clause)
 580 {
 581   int i;
 582   bool found = false;
 583   fprintf (f, "(");
 584   if (!clause)
 585     fprintf (f, "true");
 586   for (i = 0; i < NUM_CONDITIONS; i++)
 587     if (clause & (1 << i))
 588       {
 589         if (found)
 590           fprintf (f, " || ");
 591         found = true;
 592         dump_condition (f, conds, i);
 593       }
 594   fprintf (f, ")");
 595 }
 596
 597
 598 /* Dump predicate PREDICATE.  */
 599
 600 static void
 601 dump_predicate (FILE *f, conditions conds, struct predicate *pred)
 602 {
 603   int i;
 604   if (true_predicate_p (pred))
 605     dump_clause (f, conds, 0);
 606   else
 607     for (i = 0; pred->clause[i]; i++)
 608       {
 609         if (i)
 610           fprintf (f, " && ");
 611         dump_clause (f, conds, pred->clause[i]);
 612       }
 613   fprintf (f, "\n");
 614 }
 615
 616
 617 /* Dump inline hints.  */
 618 void
 619 dump_inline_hints (FILE *f, inline_hints hints)
 620 {
 621   if (!hints)
 622     return;
 623   fprintf (f, "inline hints:");
 624   if (hints & INLINE_HINT_indirect_call)
 625     {
 626       hints &= ~INLINE_HINT_indirect_call;
 627       fprintf (f, " indirect_call");
 628     }
 629   if (hints & INLINE_HINT_loop_iterations)
 630     {
 631       hints &= ~INLINE_HINT_loop_iterations;
 632       fprintf (f, " loop_iterations");
 633     }
 634   if (hints & INLINE_HINT_loop_stride)
 635     {
 636       hints &= ~INLINE_HINT_loop_stride;
 637       fprintf (f, " loop_stride");
 638     }
 639   if (hints & INLINE_HINT_same_scc)
 640     {
 641       hints &= ~INLINE_HINT_same_scc;
 642       fprintf (f, " same_scc");
 643     }
 644   if (hints & INLINE_HINT_in_scc)
 645     {
 646       hints &= ~INLINE_HINT_in_scc;
 647       fprintf (f, " in_scc");
 648     }
 649   if (hints & INLINE_HINT_cross_module)
 650     {
 651       hints &= ~INLINE_HINT_cross_module;
 652       fprintf (f, " cross_module");
 653     }
 654   if (hints & INLINE_HINT_declared_inline)
 655     {
 656       hints &= ~INLINE_HINT_declared_inline;
 657       fprintf (f, " declared_inline");
 658     }
 659   if (hints & INLINE_HINT_array_index)
 660     {
 661       hints &= ~INLINE_HINT_array_index;
 662       fprintf (f, " array_index");
 663     }
 664   gcc_assert (!hints);
 665 }
 666
 667
 668 /* Record SIZE and TIME under condition PRED into the inline summary.  */
 669
 670 static void
 671 account_size_time (struct inline_summary *summary, int size, int time,
 672                    struct predicate *pred)
 673 {
 674   size_time_entry *e;
 675   bool found = false;
 676   int i;
 677
 678   if (false_predicate_p (pred))
 679     return;
 680
 681   /* We need to create initial empty unconitional clause, but otherwie
 682      we don't need to account empty times and sizes.  */
 683   if (!size && !time && summary->entry)
 684     return;
 685
 686   /* Watch overflow that might result from insane profiles.  */
 687   if (time > MAX_TIME * INLINE_TIME_SCALE)
 688     time = MAX_TIME * INLINE_TIME_SCALE;
 689   gcc_assert (time >= 0);
 690
 691   for (i = 0; vec_safe_iterate (summary->entry, i, &e); i++)
 692     if (predicates_equal_p (&e->predicate, pred))
 693       {
 694         found = true;
 695         break;
 696       }
 697   if (i == 256)
 698     {
 699       i = 0;
 700       found = true;
 701       e = &(*summary->entry)[0];
 702       gcc_assert (!e->predicate.clause[0]);
 703       if (dump_file && (dump_flags & TDF_DETAILS))
 704         fprintf (dump_file,
 705                  "\t\tReached limit on number of entries, "
 706                  "ignoring the predicate.");
 707     }
 708   if (dump_file && (dump_flags & TDF_DETAILS) && (time || size))
 709     {
 710       fprintf (dump_file,
 711                "\t\tAccounting size:%3.2f, time:%3.2f on %spredicate:",
 712                ((double) size) / INLINE_SIZE_SCALE,
 713                ((double) time) / INLINE_TIME_SCALE, found ? "" : "new ");
 714       dump_predicate (dump_file, summary->conds, pred);
 715     }
 716   if (!found)
 717     {
 718       struct size_time_entry new_entry;
 719       new_entry.size = size;
 720       new_entry.time = time;
 721       new_entry.predicate = *pred;
 722       vec_safe_push (summary->entry, new_entry);
 723     }
 724   else
 725     {
 726       e->size += size;
 727       e->time += time;
 728       if (e->time > MAX_TIME * INLINE_TIME_SCALE)
 729         e->time = MAX_TIME * INLINE_TIME_SCALE;
 730     }
 731 }
 732
 733 /* Set predicate for edge E.  */
 734
 735 static void
 736 edge_set_predicate (struct cgraph_edge *e, struct predicate *predicate)
 737 {
 738   struct inline_edge_summary *es = inline_edge_summary (e);
 739   if (predicate && !true_predicate_p (predicate))
 740     {
 741       if (!es->predicate)
 742         es->predicate = (struct predicate *) pool_alloc (edge_predicate_pool);
 743       *es->predicate = *predicate;
 744     }
 745   else
 746     {
 747       if (es->predicate)
 748         pool_free (edge_predicate_pool, es->predicate);
 749       es->predicate = NULL;
 750     }
 751 }
 752
 753 /* Set predicate for hint *P.  */
 754
 755 static void
 756 set_hint_predicate (struct predicate **p, struct predicate new_predicate)
 757 {
 758   if (false_predicate_p (&new_predicate) || true_predicate_p (&new_predicate))
 759     {
 760       if (*p)
 761         pool_free (edge_predicate_pool, *p);
 762       *p = NULL;
 763     }
 764   else
 765     {
 766       if (!*p)
 767         *p = (struct predicate *) pool_alloc (edge_predicate_pool);
 768       **p = new_predicate;
 769     }
 770 }
 771
 772
 773 /* KNOWN_VALS is partial mapping of parameters of NODE to constant values.
 774    KNOWN_AGGS is a vector of aggreggate jump functions for each parameter.
 775    Return clause of possible truths. When INLINE_P is true, assume that we are
 776    inlining.
 777
 778    ERROR_MARK means compile time invariant.  */
 779
 780 static clause_t
 781 evaluate_conditions_for_known_args (struct cgraph_node *node,
 782                                     bool inline_p,
 783                                     vec<tree> known_vals,
 784                                     vec<ipa_agg_jump_function_p>
 785                                     known_aggs)
 786 {
 787   clause_t clause = inline_p ? 0 : 1 << predicate_not_inlined_condition;
 788   struct inline_summary *info = inline_summary (node);
 789   int i;
 790   struct condition *c;
 791
 792   for (i = 0; vec_safe_iterate (info->conds, i, &c); i++)
 793     {
 794       tree val;
 795       tree res;
 796
 797       /* We allow call stmt to have fewer arguments than the callee function
 798          (especially for K&R style programs).  So bound check here (we assume
 799          known_aggs vector, if non-NULL, has the same length as
 800          known_vals).  */
 801       gcc_checking_assert (!known_aggs.exists ()
 802                            || (known_vals.length () == known_aggs.length ()));
 803       if (c->operand_num >= (int) known_vals.length ())
 804         {
 805           clause |= 1 << (i + predicate_first_dynamic_condition);
 806           continue;
 807         }
 808
 809       if (c->agg_contents)
 810         {
 811           struct ipa_agg_jump_function *agg;
 812
 813           if (c->code == CHANGED
 814               && !c->by_ref
 815               && (known_vals[c->operand_num] == error_mark_node))
 816             continue;
 817
 818           if (known_aggs.exists ())
 819             {
 820               agg = known_aggs[c->operand_num];
 821               val = ipa_find_agg_cst_for_param (agg, c->offset, c->by_ref);
 822             }
 823           else
 824             val = NULL_TREE;
 825         }
 826       else
 827         {
 828           val = known_vals[c->operand_num];
 829           if (val == error_mark_node && c->code != CHANGED)
 830             val = NULL_TREE;
 831         }
 832
 833       if (!val)
 834         {
 835           clause |= 1 << (i + predicate_first_dynamic_condition);
 836           continue;
 837         }
 838       if (c->code == IS_NOT_CONSTANT || c->code == CHANGED)
 839         continue;
 840       res = fold_binary_to_constant (c->code, boolean_type_node, val, c->val);
 841       if (res && integer_zerop (res))
 842         continue;
 843       clause |= 1 << (i + predicate_first_dynamic_condition);
 844     }
 845   return clause;
 846 }
 847
 848
 849 /* Work out what conditions might be true at invocation of E.  */
 850
 851 static void
 852 evaluate_properties_for_edge (struct cgraph_edge *e, bool inline_p,
 853                               clause_t *clause_ptr,
 854                               vec<tree> *known_vals_ptr,
 855                               vec<tree> *known_binfos_ptr,
 856                               vec<ipa_agg_jump_function_p> *known_aggs_ptr)
 857 {
 858   struct cgraph_node *callee =
 859     cgraph_function_or_thunk_node (e->callee, NULL);
 860   struct inline_summary *info = inline_summary (callee);
 861   vec<tree> known_vals = vNULL;
 862   vec<ipa_agg_jump_function_p> known_aggs = vNULL;
 863
 864   if (clause_ptr)
 865     *clause_ptr = inline_p ? 0 : 1 << predicate_not_inlined_condition;
 866   if (known_vals_ptr)
 867     known_vals_ptr->create (0);
 868   if (known_binfos_ptr)
 869     known_binfos_ptr->create (0);
 870
 871   if (ipa_node_params_vector.exists ()
 872       && !e->call_stmt_cannot_inline_p
 873       && ((clause_ptr && info->conds) || known_vals_ptr || known_binfos_ptr))
 874     {
 875       struct ipa_node_params *parms_info;
 876       struct ipa_edge_args *args = IPA_EDGE_REF (e);
 877       struct inline_edge_summary *es = inline_edge_summary (e);
 878       int i, count = ipa_get_cs_argument_count (args);
 879
 880       if (e->caller->global.inlined_to)
 881         parms_info = IPA_NODE_REF (e->caller->global.inlined_to);
 882       else
 883         parms_info = IPA_NODE_REF (e->caller);
 884
 885       if (count && (info->conds || known_vals_ptr))
 886         known_vals.safe_grow_cleared (count);
 887       if (count && (info->conds || known_aggs_ptr))
 888         known_aggs.safe_grow_cleared (count);
 889       if (count && known_binfos_ptr)
 890         known_binfos_ptr->safe_grow_cleared (count);
 891
 892       for (i = 0; i < count; i++)
 893         {
 894           struct ipa_jump_func *jf = ipa_get_ith_jump_func (args, i);
 895           tree cst = ipa_value_from_jfunc (parms_info, jf);
 896           if (cst)
 897             {
 898               if (known_vals.exists () && TREE_CODE (cst) != TREE_BINFO)
 899                 known_vals[i] = cst;
 900               else if (known_binfos_ptr != NULL
 901                        && TREE_CODE (cst) == TREE_BINFO)
 902                 (*known_binfos_ptr)[i] = cst;
 903             }
 904           else if (inline_p && !es->param[i].change_prob)
 905             known_vals[i] = error_mark_node;
 906           /* TODO: When IPA-CP starts propagating and merging aggregate jump
 907              functions, use its knowledge of the caller too, just like the
 908              scalar case above.  */
 909           known_aggs[i] = &jf->agg;
 910         }
 911     }
 912
 913   if (clause_ptr)
 914     *clause_ptr = evaluate_conditions_for_known_args (callee, inline_p,
 915                                                       known_vals, known_aggs);
 916
 917   if (known_vals_ptr)
 918     *known_vals_ptr = known_vals;
 919   else
 920     known_vals.release ();
 921
 922   if (known_aggs_ptr)
 923     *known_aggs_ptr = known_aggs;
 924   else
 925     known_aggs.release ();
 926 }
 927
 928
 929 /* Allocate the inline summary vector or resize it to cover all cgraph nodes. */
 930
 931 static void
 932 inline_summary_alloc (void)
 933 {
 934   if (!node_removal_hook_holder)
 935     node_removal_hook_holder =
 936       cgraph_add_node_removal_hook (&inline_node_removal_hook, NULL);
 937   if (!edge_removal_hook_holder)
 938     edge_removal_hook_holder =
 939       cgraph_add_edge_removal_hook (&inline_edge_removal_hook, NULL);
 940   if (!node_duplication_hook_holder)
 941     node_duplication_hook_holder =
 942       cgraph_add_node_duplication_hook (&inline_node_duplication_hook, NULL);
 943   if (!edge_duplication_hook_holder)
 944     edge_duplication_hook_holder =
 945       cgraph_add_edge_duplication_hook (&inline_edge_duplication_hook, NULL);
 946
 947   if (vec_safe_length (inline_summary_vec) <= (unsigned) cgraph_max_uid)
 948     vec_safe_grow_cleared (inline_summary_vec, cgraph_max_uid + 1);
 949   if (inline_edge_summary_vec.length () <= (unsigned) cgraph_edge_max_uid)
 950     inline_edge_summary_vec.safe_grow_cleared (cgraph_edge_max_uid + 1);
 951   if (!edge_predicate_pool)
 952     edge_predicate_pool = create_alloc_pool ("edge predicates",
 953                                              sizeof (struct predicate), 10);
 954 }
 955
 956 /* We are called multiple time for given function; clear
 957    data from previous run so they are not cumulated.  */
 958
 959 static void
 960 reset_inline_edge_summary (struct cgraph_edge *e)
 961 {
 962   if (e->uid < (int) inline_edge_summary_vec.length ())
 963     {
 964       struct inline_edge_summary *es = inline_edge_summary (e);
 965
 966       es->call_stmt_size = es->call_stmt_time = 0;
 967       if (es->predicate)
 968         pool_free (edge_predicate_pool, es->predicate);
 969       es->predicate = NULL;
 970       es->param.release ();
 971     }
 972 }
 973
 974 /* We are called multiple time for given function; clear
 975    data from previous run so they are not cumulated.  */
 976
 977 static void
 978 reset_inline_summary (struct cgraph_node *node)
 979 {
 980   struct inline_summary *info = inline_summary (node);
 981   struct cgraph_edge *e;
 982
 983   info->self_size = info->self_time = 0;
 984   info->estimated_stack_size = 0;
 985   info->estimated_self_stack_size = 0;
 986   info->stack_frame_offset = 0;
 987   info->size = 0;
 988   info->time = 0;
 989   info->growth = 0;
 990   info->scc_no = 0;
 991   if (info->loop_iterations)
 992     {
 993       pool_free (edge_predicate_pool, info->loop_iterations);
 994       info->loop_iterations = NULL;
 995     }
 996   if (info->loop_stride)
 997     {
 998       pool_free (edge_predicate_pool, info->loop_stride);
 999       info->loop_stride = NULL;
1000     }
1001   if (info->array_index)
1002     {
1003       pool_free (edge_predicate_pool, info->array_index);
1004       info->array_index = NULL;
1005     }
1006   vec_free (info->conds);
1007   vec_free (info->entry);
1008   for (e = node->callees; e; e = e->next_callee)
1009     reset_inline_edge_summary (e);
1010   for (e = node->indirect_calls; e; e = e->next_callee)
1011     reset_inline_edge_summary (e);
1012 }
1013
1014 /* Hook that is called by cgraph.c when a node is removed.  */
1015
1016 static void
1017 inline_node_removal_hook (struct cgraph_node *node,
1018                           void *data ATTRIBUTE_UNUSED)
1019 {
1020   struct inline_summary *info;
1021   if (vec_safe_length (inline_summary_vec) <= (unsigned) node->uid)
1022     return;
1023   info = inline_summary (node);
1024   reset_inline_summary (node);
1025   memset (info, 0, sizeof (inline_summary_t));
1026 }
1027
1028 /* Remap predicate P of former function to be predicate of duplicated functoin.
1029    POSSIBLE_TRUTHS is clause of possible truths in the duplicated node,
1030    INFO is inline summary of the duplicated node.  */
1031
1032 static struct predicate
1033 remap_predicate_after_duplication (struct predicate *p,
1034                                    clause_t possible_truths,
1035                                    struct inline_summary *info)
1036 {
1037   struct predicate new_predicate = true_predicate ();
1038   int j;
1039   for (j = 0; p->clause[j]; j++)
1040     if (!(possible_truths & p->clause[j]))
1041       {
1042         new_predicate = false_predicate ();
1043         break;
1044       }
1045     else
1046       add_clause (info->conds, &new_predicate,
1047                   possible_truths & p->clause[j]);
1048   return new_predicate;
1049 }
1050
1051 /* Same as remap_predicate_after_duplication but handle hint predicate *P.
1052    Additionally care about allocating new memory slot for updated predicate
1053    and set it to NULL when it becomes true or false (and thus uninteresting).
1054  */
1055
1056 static void
1057 remap_hint_predicate_after_duplication (struct predicate **p,
1058                                         clause_t possible_truths,
1059                                         struct inline_summary *info)
1060 {
1061   struct predicate new_predicate;
1062
1063   if (!*p)
1064     return;
1065
1066   new_predicate = remap_predicate_after_duplication (*p,
1067                                                      possible_truths, info);
1068   /* We do not want to free previous predicate; it is used by node origin.  */
1069   *p = NULL;
1070   set_hint_predicate (p, new_predicate);
1071 }
1072
1073
1074 /* Hook that is called by cgraph.c when a node is duplicated.  */
1075
1076 static void
1077 inline_node_duplication_hook (struct cgraph_node *src,
1078                               struct cgraph_node *dst,
1079                               ATTRIBUTE_UNUSED void *data)
1080 {
1081   struct inline_summary *info;
1082   inline_summary_alloc ();
1083   info = inline_summary (dst);
1084   memcpy (info, inline_summary (src), sizeof (struct inline_summary));
1085   /* TODO: as an optimization, we may avoid copying conditions
1086      that are known to be false or true.  */
1087   info->conds = vec_safe_copy (info->conds);
1088
1089   /* When there are any replacements in the function body, see if we can figure
1090      out that something was optimized out.  */
1091   if (ipa_node_params_vector.exists () && dst->clone.tree_map)
1092     {
1093       vec<size_time_entry, va_gc> *entry = info->entry;
1094       /* Use SRC parm info since it may not be copied yet.  */
1095       struct ipa_node_params *parms_info = IPA_NODE_REF (src);
1096       vec<tree> known_vals = vNULL;
1097       int count = ipa_get_param_count (parms_info);
1098       int i, j;
1099       clause_t possible_truths;
1100       struct predicate true_pred = true_predicate ();
1101       size_time_entry *e;
1102       int optimized_out_size = 0;
1103       bool inlined_to_p = false;
1104       struct cgraph_edge *edge;
1105
1106       info->entry = 0;
1107       known_vals.safe_grow_cleared (count);
1108       for (i = 0; i < count; i++)
1109         {
1110           struct ipa_replace_map *r;
1111
1112           for (j = 0; vec_safe_iterate (dst->clone.tree_map, j, &r); j++)
1113             {
1114               if (((!r->old_tree && r->parm_num == i)
1115                    || (r->old_tree && r->old_tree == ipa_get_param (parms_info, i)))
1116                    && r->replace_p && !r->ref_p)
1117                 {
1118                   known_vals[i] = r->new_tree;
1119                   break;
1120                 }
1121             }
1122         }
1123       possible_truths = evaluate_conditions_for_known_args (dst, false,
1124                                                             known_vals,
1125                                                             vNULL);
1126       known_vals.release ();
1127
1128       account_size_time (info, 0, 0, &true_pred);
1129
1130       /* Remap size_time vectors.
1131          Simplify the predicate by prunning out alternatives that are known
1132          to be false.
1133          TODO: as on optimization, we can also eliminate conditions known
1134          to be true.  */
1135       for (i = 0; vec_safe_iterate (entry, i, &e); i++)
1136         {
1137           struct predicate new_predicate;
1138           new_predicate = remap_predicate_after_duplication (&e->predicate,
1139                                                              possible_truths,
1140                                                              info);
1141           if (false_predicate_p (&new_predicate))
1142             optimized_out_size += e->size;
1143           else
1144             account_size_time (info, e->size, e->time, &new_predicate);
1145         }
1146
1147       /* Remap edge predicates with the same simplification as above.
1148          Also copy constantness arrays.   */
1149       for (edge = dst->callees; edge; edge = edge->next_callee)
1150         {
1151           struct predicate new_predicate;
1152           struct inline_edge_summary *es = inline_edge_summary (edge);
1153
1154           if (!edge->inline_failed)
1155             inlined_to_p = true;
1156           if (!es->predicate)
1157             continue;
1158           new_predicate = remap_predicate_after_duplication (es->predicate,
1159                                                              possible_truths,
1160                                                              info);
1161           if (false_predicate_p (&new_predicate)
1162               && !false_predicate_p (es->predicate))
1163             {
1164               optimized_out_size += es->call_stmt_size * INLINE_SIZE_SCALE;
1165               edge->frequency = 0;
1166             }
1167           edge_set_predicate (edge, &new_predicate);
1168         }
1169
1170       /* Remap indirect edge predicates with the same simplificaiton as above.
1171          Also copy constantness arrays.   */
1172       for (edge = dst->indirect_calls; edge; edge = edge->next_callee)
1173         {
1174           struct predicate new_predicate;
1175           struct inline_edge_summary *es = inline_edge_summary (edge);
1176
1177           gcc_checking_assert (edge->inline_failed);
1178           if (!es->predicate)
1179             continue;
1180           new_predicate = remap_predicate_after_duplication (es->predicate,
1181                                                              possible_truths,
1182                                                              info);
1183           if (false_predicate_p (&new_predicate)
1184               && !false_predicate_p (es->predicate))
1185             {
1186               optimized_out_size += es->call_stmt_size * INLINE_SIZE_SCALE;
1187               edge->frequency = 0;
1188             }
1189           edge_set_predicate (edge, &new_predicate);
1190         }
1191       remap_hint_predicate_after_duplication (&info->loop_iterations,
1192                                               possible_truths, info);
1193       remap_hint_predicate_after_duplication (&info->loop_stride,
1194                                               possible_truths, info);
1195       remap_hint_predicate_after_duplication (&info->array_index,
1196                                               possible_truths, info);
1197
1198       /* If inliner or someone after inliner will ever start producing
1199          non-trivial clones, we will get trouble with lack of information
1200          about updating self sizes, because size vectors already contains
1201          sizes of the calees.  */
1202       gcc_assert (!inlined_to_p || !optimized_out_size);
1203     }
1204   else
1205     {
1206       info->entry = vec_safe_copy (info->entry);
1207       if (info->loop_iterations)
1208         {
1209           predicate p = *info->loop_iterations;
1210           info->loop_iterations = NULL;
1211           set_hint_predicate (&info->loop_iterations, p);
1212         }
1213       if (info->loop_stride)
1214         {
1215           predicate p = *info->loop_stride;
1216           info->loop_stride = NULL;
1217           set_hint_predicate (&info->loop_stride, p);
1218         }
1219       if (info->array_index)
1220         {
1221           predicate p = *info->array_index;
1222           info->array_index = NULL;
1223           set_hint_predicate (&info->array_index, p);
1224         }
1225     }
1226   inline_update_overall_summary (dst);
1227 }
1228
1229
1230 /* Hook that is called by cgraph.c when a node is duplicated.  */
1231
1232 static void
1233 inline_edge_duplication_hook (struct cgraph_edge *src,
1234                               struct cgraph_edge *dst,
1235                               ATTRIBUTE_UNUSED void *data)
1236 {
1237   struct inline_edge_summary *info;
1238   struct inline_edge_summary *srcinfo;
1239   inline_summary_alloc ();
1240   info = inline_edge_summary (dst);
1241   srcinfo = inline_edge_summary (src);
1242   memcpy (info, srcinfo, sizeof (struct inline_edge_summary));
1243   info->predicate = NULL;
1244   edge_set_predicate (dst, srcinfo->predicate);
1245   info->param = srcinfo->param.copy ();
1246 }
1247
1248
1249 /* Keep edge cache consistent across edge removal.  */
1250
1251 static void
1252 inline_edge_removal_hook (struct cgraph_edge *edge,
1253                           void *data ATTRIBUTE_UNUSED)
1254 {
1255   if (edge_growth_cache.exists ())
1256     reset_edge_growth_cache (edge);
1257   reset_inline_edge_summary (edge);
1258 }
1259
1260
1261 /* Initialize growth caches.  */
1262
1263 void
1264 initialize_growth_caches (void)
1265 {
1266   if (cgraph_edge_max_uid)
1267     edge_growth_cache.safe_grow_cleared (cgraph_edge_max_uid);
1268   if (cgraph_max_uid)
1269     node_growth_cache.safe_grow_cleared (cgraph_max_uid);
1270 }
1271
1272
1273 /* Free growth caches.  */
1274
1275 void
1276 free_growth_caches (void)
1277 {
1278   edge_growth_cache.release ();
1279   node_growth_cache.release ();
1280 }
1281
1282
1283 /* Dump edge summaries associated to NODE and recursively to all clones.
1284    Indent by INDENT.  */
1285
1286 static void
1287 dump_inline_edge_summary (FILE *f, int indent, struct cgraph_node *node,
1288                           struct inline_summary *info)
1289 {
1290   struct cgraph_edge *edge;
1291   for (edge = node->callees; edge; edge = edge->next_callee)
1292     {
1293       struct inline_edge_summary *es = inline_edge_summary (edge);
1294       struct cgraph_node *callee =
1295         cgraph_function_or_thunk_node (edge->callee, NULL);
1296       int i;
1297
1298       fprintf (f,
1299                "%*s%s/%i %s\n%*s  loop depth:%2i freq:%4i size:%2i"
1300                " time: %2i callee size:%2i stack:%2i",
1301                indent, "", cgraph_node_name (callee), callee->symbol.order,
1302                !edge->inline_failed
1303                ? "inlined" : cgraph_inline_failed_string (edge-> inline_failed),
1304                indent, "", es->loop_depth, edge->frequency,
1305                es->call_stmt_size, es->call_stmt_time,
1306                (int) inline_summary (callee)->size / INLINE_SIZE_SCALE,
1307                (int) inline_summary (callee)->estimated_stack_size);
1308
1309       if (es->predicate)
1310         {
1311           fprintf (f, " predicate: ");
1312           dump_predicate (f, info->conds, es->predicate);
1313         }
1314       else
1315         fprintf (f, "\n");
1316       if (es->param.exists ())
1317         for (i = 0; i < (int) es->param.length (); i++)
1318           {
1319             int prob = es->param[i].change_prob;
1320
1321             if (!prob)
1322               fprintf (f, "%*s op%i is compile time invariant\n",
1323                        indent + 2, "", i);
1324             else if (prob != REG_BR_PROB_BASE)
1325               fprintf (f, "%*s op%i change %f%% of time\n", indent + 2, "", i,
1326                        prob * 100.0 / REG_BR_PROB_BASE);
1327           }
1328       if (!edge->inline_failed)
1329         {
1330           fprintf (f, "%*sStack frame offset %i, callee self size %i,"
1331                    " callee size %i\n",
1332                    indent + 2, "",
1333                    (int) inline_summary (callee)->stack_frame_offset,
1334                    (int) inline_summary (callee)->estimated_self_stack_size,
1335                    (int) inline_summary (callee)->estimated_stack_size);
1336           dump_inline_edge_summary (f, indent + 2, callee, info);
1337         }
1338     }
1339   for (edge = node->indirect_calls; edge; edge = edge->next_callee)
1340     {
1341       struct inline_edge_summary *es = inline_edge_summary (edge);
1342       fprintf (f, "%*sindirect call loop depth:%2i freq:%4i size:%2i"
1343                " time: %2i",
1344                indent, "",
1345                es->loop_depth,
1346                edge->frequency, es->call_stmt_size, es->call_stmt_time);
1347       if (es->predicate)
1348         {
1349           fprintf (f, "predicate: ");
1350           dump_predicate (f, info->conds, es->predicate);
1351         }
1352       else
1353         fprintf (f, "\n");
1354     }
1355 }
1356
1357
1358 void
1359 dump_inline_summary (FILE *f, struct cgraph_node *node)
1360 {
1361   if (node->symbol.definition)
1362     {
1363       struct inline_summary *s = inline_summary (node);
1364       size_time_entry *e;
1365       int i;
1366       fprintf (f, "Inline summary for %s/%i", cgraph_node_name (node),
1367                node->symbol.order);
1368       if (DECL_DISREGARD_INLINE_LIMITS (node->symbol.decl))
1369         fprintf (f, " always_inline");
1370       if (s->inlinable)
1371         fprintf (f, " inlinable");
1372       fprintf (f, "\n  self time:       %i\n", s->self_time);
1373       fprintf (f, "  global time:     %i\n", s->time);
1374       fprintf (f, "  self size:       %i\n", s->self_size);
1375       fprintf (f, "  global size:     %i\n", s->size);
1376       fprintf (f, "  self stack:      %i\n",
1377                (int) s->estimated_self_stack_size);
1378       fprintf (f, "  global stack:    %i\n", (int) s->estimated_stack_size);
1379       if (s->growth)
1380         fprintf (f, "  estimated growth:%i\n", (int) s->growth);
1381       if (s->scc_no)
1382         fprintf (f, "  In SCC:          %i\n", (int) s->scc_no);
1383       for (i = 0; vec_safe_iterate (s->entry, i, &e); i++)
1384         {
1385           fprintf (f, "    size:%f, time:%f, predicate:",
1386                    (double) e->size / INLINE_SIZE_SCALE,
1387                    (double) e->time / INLINE_TIME_SCALE);
1388           dump_predicate (f, s->conds, &e->predicate);
1389         }
1390       if (s->loop_iterations)
1391         {
1392           fprintf (f, "  loop iterations:");
1393           dump_predicate (f, s->conds, s->loop_iterations);
1394         }
1395       if (s->loop_stride)
1396         {
1397           fprintf (f, "  loop stride:");
1398           dump_predicate (f, s->conds, s->loop_stride);
1399         }
1400       if (s->array_index)
1401         {
1402           fprintf (f, "  array index:");
1403           dump_predicate (f, s->conds, s->array_index);
1404         }
1405       fprintf (f, "  calls:\n");
1406       dump_inline_edge_summary (f, 4, node, s);
1407       fprintf (f, "\n");
1408     }
1409 }
1410
1411 DEBUG_FUNCTION void
1412 debug_inline_summary (struct cgraph_node *node)
1413 {
1414   dump_inline_summary (stderr, node);
1415 }
1416
1417 void
1418 dump_inline_summaries (FILE *f)
1419 {
1420   struct cgraph_node *node;
1421
1422   FOR_EACH_DEFINED_FUNCTION (node)
1423     if (!node->global.inlined_to)
1424       dump_inline_summary (f, node);
1425 }
1426
1427 /* Give initial reasons why inlining would fail on EDGE.  This gets either
1428    nullified or usually overwritten by more precise reasons later.  */
1429
1430 void
1431 initialize_inline_failed (struct cgraph_edge *e)
1432 {
1433   struct cgraph_node *callee = e->callee;
1434
1435   if (e->indirect_unknown_callee)
1436     e->inline_failed = CIF_INDIRECT_UNKNOWN_CALL;
1437   else if (!callee->symbol.definition)
1438     e->inline_failed = CIF_BODY_NOT_AVAILABLE;
1439   else if (callee->local.redefined_extern_inline)
1440     e->inline_failed = CIF_REDEFINED_EXTERN_INLINE;
1441   else if (e->call_stmt_cannot_inline_p)
1442     e->inline_failed = CIF_MISMATCHED_ARGUMENTS;
1443   else
1444     e->inline_failed = CIF_FUNCTION_NOT_CONSIDERED;
1445 }
1446
1447 /* Callback of walk_aliased_vdefs.  Flags that it has been invoked to the
1448    boolean variable pointed to by DATA.  */
1449
1450 static bool
1451 mark_modified (ao_ref *ao ATTRIBUTE_UNUSED, tree vdef ATTRIBUTE_UNUSED,
1452                void *data)
1453 {
1454   bool *b = (bool *) data;
1455   *b = true;
1456   return true;
1457 }
1458
1459 /* If OP refers to value of function parameter, return the corresponding
1460    parameter.  */
1461
1462 static tree
1463 unmodified_parm_1 (gimple stmt, tree op)
1464 {
1465   /* SSA_NAME referring to parm default def?  */
1466   if (TREE_CODE (op) == SSA_NAME
1467       && SSA_NAME_IS_DEFAULT_DEF (op)
1468       && TREE_CODE (SSA_NAME_VAR (op)) == PARM_DECL)
1469     return SSA_NAME_VAR (op);
1470   /* Non-SSA parm reference?  */
1471   if (TREE_CODE (op) == PARM_DECL)
1472     {
1473       bool modified = false;
1474
1475       ao_ref refd;
1476       ao_ref_init (&refd, op);
1477       walk_aliased_vdefs (&refd, gimple_vuse (stmt), mark_modified, &modified,
1478                           NULL);
1479       if (!modified)
1480         return op;
1481     }
1482   return NULL_TREE;
1483 }
1484
1485 /* If OP refers to value of function parameter, return the corresponding
1486    parameter.  Also traverse chains of SSA register assignments.  */
1487
1488 static tree
1489 unmodified_parm (gimple stmt, tree op)
1490 {
1491   tree res = unmodified_parm_1 (stmt, op);
1492   if (res)
1493     return res;
1494
1495   if (TREE_CODE (op) == SSA_NAME
1496       && !SSA_NAME_IS_DEFAULT_DEF (op)
1497       && gimple_assign_single_p (SSA_NAME_DEF_STMT (op)))
1498     return unmodified_parm (SSA_NAME_DEF_STMT (op),
1499                             gimple_assign_rhs1 (SSA_NAME_DEF_STMT (op)));
1500   return NULL_TREE;
1501 }
1502
1503 /* If OP refers to a value of a function parameter or value loaded from an
1504    aggregate passed to a parameter (either by value or reference), return TRUE
1505    and store the number of the parameter to *INDEX_P and information whether
1506    and how it has been loaded from an aggregate into *AGGPOS.  INFO describes
1507    the function parameters, STMT is the statement in which OP is used or
1508    loaded.  */
1509
1510 static bool
1511 unmodified_parm_or_parm_agg_item (struct ipa_node_params *info,
1512                                   gimple stmt, tree op, int *index_p,
1513                                   struct agg_position_info *aggpos)
1514 {
1515   tree res = unmodified_parm_1 (stmt, op);
1516
1517   gcc_checking_assert (aggpos);
1518   if (res)
1519     {
1520       *index_p = ipa_get_param_decl_index (info, res);
1521       if (*index_p < 0)
1522         return false;
1523       aggpos->agg_contents = false;
1524       aggpos->by_ref = false;
1525       return true;
1526     }
1527
1528   if (TREE_CODE (op) == SSA_NAME)
1529     {
1530       if (SSA_NAME_IS_DEFAULT_DEF (op)
1531           || !gimple_assign_single_p (SSA_NAME_DEF_STMT (op)))
1532         return false;
1533       stmt = SSA_NAME_DEF_STMT (op);
1534       op = gimple_assign_rhs1 (stmt);
1535       if (!REFERENCE_CLASS_P (op))
1536         return unmodified_parm_or_parm_agg_item (info, stmt, op, index_p,
1537                                                  aggpos);
1538     }
1539
1540   aggpos->agg_contents = true;
1541   return ipa_load_from_parm_agg (info, stmt, op, index_p, &aggpos->offset,
1542                                  &aggpos->by_ref);
1543 }
1544
1545 /* See if statement might disappear after inlining.
1546    0 - means not eliminated
1547    1 - half of statements goes away
1548    2 - for sure it is eliminated.
1549    We are not terribly sophisticated, basically looking for simple abstraction
1550    penalty wrappers.  */
1551
1552 static int
1553 eliminated_by_inlining_prob (gimple stmt)
1554 {
1555   enum gimple_code code = gimple_code (stmt);
1556   enum tree_code rhs_code;
1557
1558   if (!optimize)
1559     return 0;
1560
1561   switch (code)
1562     {
1563     case GIMPLE_RETURN:
1564       return 2;
1565     case GIMPLE_ASSIGN:
1566       if (gimple_num_ops (stmt) != 2)
1567         return 0;
1568
1569       rhs_code = gimple_assign_rhs_code (stmt);
1570
1571       /* Casts of parameters, loads from parameters passed by reference
1572          and stores to return value or parameters are often free after
1573          inlining dua to SRA and further combining.
1574          Assume that half of statements goes away.  */
1575       if (rhs_code == CONVERT_EXPR
1576           || rhs_code == NOP_EXPR
1577           || rhs_code == VIEW_CONVERT_EXPR
1578           || rhs_code == ADDR_EXPR
1579           || gimple_assign_rhs_class (stmt) == GIMPLE_SINGLE_RHS)
1580         {
1581           tree rhs = gimple_assign_rhs1 (stmt);
1582           tree lhs = gimple_assign_lhs (stmt);
1583           tree inner_rhs = get_base_address (rhs);
1584           tree inner_lhs = get_base_address (lhs);
1585           bool rhs_free = false;
1586           bool lhs_free = false;
1587
1588           if (!inner_rhs)
1589             inner_rhs = rhs;
1590           if (!inner_lhs)
1591             inner_lhs = lhs;
1592
1593           /* Reads of parameter are expected to be free.  */
1594           if (unmodified_parm (stmt, inner_rhs))
1595             rhs_free = true;
1596           /* Match expressions of form &this->field. Those will most likely
1597              combine with something upstream after inlining.  */
1598           else if (TREE_CODE (inner_rhs) == ADDR_EXPR)
1599             {
1600               tree op = get_base_address (TREE_OPERAND (inner_rhs, 0));
1601               if (TREE_CODE (op) == PARM_DECL)
1602                 rhs_free = true;
1603               else if (TREE_CODE (op) == MEM_REF
1604                        && unmodified_parm (stmt, TREE_OPERAND (op, 0)))
1605                 rhs_free = true;
1606             }
1607
1608           /* When parameter is not SSA register because its address is taken
1609              and it is just copied into one, the statement will be completely
1610              free after inlining (we will copy propagate backward).   */
1611           if (rhs_free && is_gimple_reg (lhs))
1612             return 2;
1613
1614           /* Reads of parameters passed by reference
1615              expected to be free (i.e. optimized out after inlining).  */
1616           if (TREE_CODE (inner_rhs) == MEM_REF
1617               && unmodified_parm (stmt, TREE_OPERAND (inner_rhs, 0)))
1618             rhs_free = true;
1619
1620           /* Copying parameter passed by reference into gimple register is
1621              probably also going to copy propagate, but we can't be quite
1622              sure.  */
1623           if (rhs_free && is_gimple_reg (lhs))
1624             lhs_free = true;
1625
1626           /* Writes to parameters, parameters passed by value and return value
1627              (either dirrectly or passed via invisible reference) are free.
1628
1629              TODO: We ought to handle testcase like
1630              struct a {int a,b;};
1631              struct a
1632              retrurnsturct (void)
1633              {
1634              struct a a ={1,2};
1635              return a;
1636              }
1637
1638              This translate into:
1639
1640              retrurnsturct ()
1641              {
1642              int a$b;
1643              int a$a;
1644              struct a a;
1645              struct a D.2739;
1646
1647              <bb 2>:
1648              D.2739.a = 1;
1649              D.2739.b = 2;
1650              return D.2739;
1651
1652              }
1653              For that we either need to copy ipa-split logic detecting writes
1654              to return value.  */
1655           if (TREE_CODE (inner_lhs) == PARM_DECL
1656               || TREE_CODE (inner_lhs) == RESULT_DECL
1657               || (TREE_CODE (inner_lhs) == MEM_REF
1658                   && (unmodified_parm (stmt, TREE_OPERAND (inner_lhs, 0))
1659                       || (TREE_CODE (TREE_OPERAND (inner_lhs, 0)) == SSA_NAME
1660                           && SSA_NAME_VAR (TREE_OPERAND (inner_lhs, 0))
1661                           && TREE_CODE (SSA_NAME_VAR (TREE_OPERAND
1662                                                       (inner_lhs,
1663                                                        0))) == RESULT_DECL))))
1664             lhs_free = true;
1665           if (lhs_free
1666               && (is_gimple_reg (rhs) || is_gimple_min_invariant (rhs)))
1667             rhs_free = true;
1668           if (lhs_free && rhs_free)
1669             return 1;
1670         }
1671       return 0;
1672     default:
1673       return 0;
1674     }
1675 }
1676
1677
1678 /* If BB ends by a conditional we can turn into predicates, attach corresponding
1679    predicates to the CFG edges.   */
1680
1681 static void
1682 set_cond_stmt_execution_predicate (struct ipa_node_params *info,
1683                                    struct inline_summary *summary,
1684                                    basic_block bb)
1685 {
1686   gimple last;
1687   tree op;
1688   int index;
1689   struct agg_position_info aggpos;
1690   enum tree_code code, inverted_code;
1691   edge e;
1692   edge_iterator ei;
1693   gimple set_stmt;
1694   tree op2;
1695
1696   last = last_stmt (bb);
1697   if (!last || gimple_code (last) != GIMPLE_COND)
1698     return;
1699   if (!is_gimple_ip_invariant (gimple_cond_rhs (last)))
1700     return;
1701   op = gimple_cond_lhs (last);
1702   /* TODO: handle conditionals like
1703      var = op0 < 4;
1704      if (var != 0).  */
1705   if (unmodified_parm_or_parm_agg_item (info, last, op, &index, &aggpos))
1706     {
1707       code = gimple_cond_code (last);
1708       inverted_code
1709         = invert_tree_comparison (code,
1710                                   HONOR_NANS (TYPE_MODE (TREE_TYPE (op))));
1711
1712       FOR_EACH_EDGE (e, ei, bb->succs)
1713         {
1714           struct predicate p = add_condition (summary, index, &aggpos,
1715                                               e->flags & EDGE_TRUE_VALUE
1716                                               ? code : inverted_code,
1717                                               gimple_cond_rhs (last));
1718           e->aux = pool_alloc (edge_predicate_pool);
1719           *(struct predicate *) e->aux = p;
1720         }
1721     }
1722
1723   if (TREE_CODE (op) != SSA_NAME)
1724     return;
1725   /* Special case
1726      if (builtin_constant_p (op))
1727      constant_code
1728      else
1729      nonconstant_code.
1730      Here we can predicate nonconstant_code.  We can't
1731      really handle constant_code since we have no predicate
1732      for this and also the constant code is not known to be
1733      optimized away when inliner doen't see operand is constant.
1734      Other optimizers might think otherwise.  */
1735   if (gimple_cond_code (last) != NE_EXPR
1736       || !integer_zerop (gimple_cond_rhs (last)))
1737     return;
1738   set_stmt = SSA_NAME_DEF_STMT (op);
1739   if (!gimple_call_builtin_p (set_stmt, BUILT_IN_CONSTANT_P)
1740       || gimple_call_num_args (set_stmt) != 1)
1741     return;
1742   op2 = gimple_call_arg (set_stmt, 0);
1743   if (!unmodified_parm_or_parm_agg_item
1744       (info, set_stmt, op2, &index, &aggpos))
1745     return;
1746   FOR_EACH_EDGE (e, ei, bb->succs) if (e->flags & EDGE_FALSE_VALUE)
1747     {
1748       struct predicate p = add_condition (summary, index, &aggpos,
1749                                           IS_NOT_CONSTANT, NULL_TREE);
1750       e->aux = pool_alloc (edge_predicate_pool);
1751       *(struct predicate *) e->aux = p;
1752     }
1753 }
1754
1755
1756 /* If BB ends by a switch we can turn into predicates, attach corresponding
1757    predicates to the CFG edges.   */
1758
1759 static void
1760 set_switch_stmt_execution_predicate (struct ipa_node_params *info,
1761                                      struct inline_summary *summary,
1762                                      basic_block bb)
1763 {
1764   gimple last;
1765   tree op;
1766   int index;
1767   struct agg_position_info aggpos;
1768   edge e;
1769   edge_iterator ei;
1770   size_t n;
1771   size_t case_idx;
1772
1773   last = last_stmt (bb);
1774   if (!last || gimple_code (last) != GIMPLE_SWITCH)
1775     return;
1776   op = gimple_switch_index (last);
1777   if (!unmodified_parm_or_parm_agg_item (info, last, op, &index, &aggpos))
1778     return;
1779
1780   FOR_EACH_EDGE (e, ei, bb->succs)
1781     {
1782       e->aux = pool_alloc (edge_predicate_pool);
1783       *(struct predicate *) e->aux = false_predicate ();
1784     }
1785   n = gimple_switch_num_labels (last);
1786   for (case_idx = 0; case_idx < n; ++case_idx)
1787     {
1788       tree cl = gimple_switch_label (last, case_idx);
1789       tree min, max;
1790       struct predicate p;
1791
1792       e = find_edge (bb, label_to_block (CASE_LABEL (cl)));
1793       min = CASE_LOW (cl);
1794       max = CASE_HIGH (cl);
1795
1796       /* For default we might want to construct predicate that none
1797          of cases is met, but it is bit hard to do not having negations
1798          of conditionals handy.  */
1799       if (!min && !max)
1800         p = true_predicate ();
1801       else if (!max)
1802         p = add_condition (summary, index, &aggpos, EQ_EXPR, min);
1803       else
1804         {
1805           struct predicate p1, p2;
1806           p1 = add_condition (summary, index, &aggpos, GE_EXPR, min);
1807           p2 = add_condition (summary, index, &aggpos, LE_EXPR, max);
1808           p = and_predicates (summary->conds, &p1, &p2);
1809         }
1810       *(struct predicate *) e->aux
1811         = or_predicates (summary->conds, &p, (struct predicate *) e->aux);
1812     }
1813 }
1814
1815
1816 /* For each BB in NODE attach to its AUX pointer predicate under
1817    which it is executable.  */
1818
1819 static void
1820 compute_bb_predicates (struct cgraph_node *node,
1821                        struct ipa_node_params *parms_info,
1822                        struct inline_summary *summary)
1823 {
1824   struct function *my_function = DECL_STRUCT_FUNCTION (node->symbol.decl);
1825   bool done = false;
1826   basic_block bb;
1827
1828   FOR_EACH_BB_FN (bb, my_function)
1829     {
1830       set_cond_stmt_execution_predicate (parms_info, summary, bb);
1831       set_switch_stmt_execution_predicate (parms_info, summary, bb);
1832     }
1833
1834   /* Entry block is always executable.  */
1835   ENTRY_BLOCK_PTR_FOR_FUNCTION (my_function)->aux
1836     = pool_alloc (edge_predicate_pool);
1837   *(struct predicate *) ENTRY_BLOCK_PTR_FOR_FUNCTION (my_function)->aux
1838     = true_predicate ();
1839
1840   /* A simple dataflow propagation of predicates forward in the CFG.
1841      TODO: work in reverse postorder.  */
1842   while (!done)
1843     {
1844       done = true;
1845       FOR_EACH_BB_FN (bb, my_function)
1846         {
1847           struct predicate p = false_predicate ();
1848           edge e;
1849           edge_iterator ei;
1850           FOR_EACH_EDGE (e, ei, bb->preds)
1851             {
1852               if (e->src->aux)
1853                 {
1854                   struct predicate this_bb_predicate
1855                     = *(struct predicate *) e->src->aux;
1856                   if (e->aux)
1857                     this_bb_predicate
1858                       = and_predicates (summary->conds, &this_bb_predicate,
1859                                         (struct predicate *) e->aux);
1860                   p = or_predicates (summary->conds, &p, &this_bb_predicate);
1861                   if (true_predicate_p (&p))
1862                     break;
1863                 }
1864             }
1865           if (false_predicate_p (&p))
1866             gcc_assert (!bb->aux);
1867           else
1868             {
1869               if (!bb->aux)
1870                 {
1871                   done = false;
1872                   bb->aux = pool_alloc (edge_predicate_pool);
1873                   *((struct predicate *) bb->aux) = p;
1874                 }
1875               else if (!predicates_equal_p (&p, (struct predicate *) bb->aux))
1876                 {
1877                   done = false;
1878                   *((struct predicate *) bb->aux) = p;
1879                 }
1880             }
1881         }
1882     }
1883 }
1884
1885
1886 /* We keep info about constantness of SSA names.  */
1887
1888 typedef struct predicate predicate_t;
1889 /* Return predicate specifying when the STMT might have result that is not
1890    a compile time constant.  */
1891
1892 static struct predicate
1893 will_be_nonconstant_expr_predicate (struct ipa_node_params *info,
1894                                     struct inline_summary *summary,
1895                                     tree expr,
1896                                     vec<predicate_t> nonconstant_names)
1897 {
1898   tree parm;
1899   int index;
1900
1901   while (UNARY_CLASS_P (expr))
1902     expr = TREE_OPERAND (expr, 0);
1903
1904   parm = unmodified_parm (NULL, expr);
1905   if (parm && (index = ipa_get_param_decl_index (info, parm)) >= 0)
1906     return add_condition (summary, index, NULL, CHANGED, NULL_TREE);
1907   if (is_gimple_min_invariant (expr))
1908     return false_predicate ();
1909   if (TREE_CODE (expr) == SSA_NAME)
1910     return nonconstant_names[SSA_NAME_VERSION (expr)];
1911   if (BINARY_CLASS_P (expr) || COMPARISON_CLASS_P (expr))
1912     {
1913       struct predicate p1 = will_be_nonconstant_expr_predicate
1914         (info, summary, TREE_OPERAND (expr, 0),
1915          nonconstant_names);
1916       struct predicate p2;
1917       if (true_predicate_p (&p1))
1918         return p1;
1919       p2 = will_be_nonconstant_expr_predicate (info, summary,
1920                                                TREE_OPERAND (expr, 1),
1921                                                nonconstant_names);
1922       return or_predicates (summary->conds, &p1, &p2);
1923     }
1924   else if (TREE_CODE (expr) == COND_EXPR)
1925     {
1926       struct predicate p1 = will_be_nonconstant_expr_predicate
1927         (info, summary, TREE_OPERAND (expr, 0),
1928          nonconstant_names);
1929       struct predicate p2;
1930       if (true_predicate_p (&p1))
1931         return p1;
1932       p2 = will_be_nonconstant_expr_predicate (info, summary,
1933                                                TREE_OPERAND (expr, 1),
1934                                                nonconstant_names);
1935       if (true_predicate_p (&p2))
1936         return p2;
1937       p1 = or_predicates (summary->conds, &p1, &p2);
1938       p2 = will_be_nonconstant_expr_predicate (info, summary,
1939                                                TREE_OPERAND (expr, 2),
1940                                                nonconstant_names);
1941       return or_predicates (summary->conds, &p1, &p2);
1942     }
1943   else
1944     {
1945       debug_tree (expr);
1946       gcc_unreachable ();
1947     }
1948   return false_predicate ();
1949 }
1950
1951
1952 /* Return predicate specifying when the STMT might have result that is not
1953    a compile time constant.  */
1954
1955 static struct predicate
1956 will_be_nonconstant_predicate (struct ipa_node_params *info,
1957                                struct inline_summary *summary,
1958                                gimple stmt,
1959                                vec<predicate_t> nonconstant_names)
1960 {
1961   struct predicate p = true_predicate ();
1962   ssa_op_iter iter;
1963   tree use;
1964   struct predicate op_non_const;
1965   bool is_load;
1966   int base_index;
1967   struct agg_position_info aggpos;
1968
1969   /* What statments might be optimized away
1970      when their arguments are constant
1971      TODO: also trivial builtins.
1972      builtin_constant_p is already handled later.  */
1973   if (gimple_code (stmt) != GIMPLE_ASSIGN
1974       && gimple_code (stmt) != GIMPLE_COND
1975       && gimple_code (stmt) != GIMPLE_SWITCH)
1976     return p;
1977
1978   /* Stores will stay anyway.  */
1979   if (gimple_store_p (stmt))
1980     return p;
1981
1982   is_load = gimple_assign_load_p (stmt);
1983
1984   /* Loads can be optimized when the value is known.  */
1985   if (is_load)
1986     {
1987       tree op;
1988       gcc_assert (gimple_assign_single_p (stmt));
1989       op = gimple_assign_rhs1 (stmt);
1990       if (!unmodified_parm_or_parm_agg_item (info, stmt, op, &base_index,
1991                                              &aggpos))
1992         return p;
1993     }
1994   else
1995     base_index = -1;
1996
1997   /* See if we understand all operands before we start
1998      adding conditionals.  */
1999   FOR_EACH_SSA_TREE_OPERAND (use, stmt, iter, SSA_OP_USE)
2000     {
2001       tree parm = unmodified_parm (stmt, use);
2002       /* For arguments we can build a condition.  */
2003       if (parm && ipa_get_param_decl_index (info, parm) >= 0)
2004         continue;
2005       if (TREE_CODE (use) != SSA_NAME)
2006         return p;
2007       /* If we know when operand is constant,
2008          we still can say something useful.  */
2009       if (!true_predicate_p (&nonconstant_names[SSA_NAME_VERSION (use)]))
2010         continue;
2011       return p;
2012     }
2013
2014   if (is_load)
2015     op_non_const =
2016       add_condition (summary, base_index, &aggpos, CHANGED, NULL);
2017   else
2018     op_non_const = false_predicate ();
2019   FOR_EACH_SSA_TREE_OPERAND (use, stmt, iter, SSA_OP_USE)
2020     {
2021       tree parm = unmodified_parm (stmt, use);
2022       int index;
2023
2024       if (parm && (index = ipa_get_param_decl_index (info, parm)) >= 0)
2025         {
2026           if (index != base_index)
2027             p = add_condition (summary, index, NULL, CHANGED, NULL_TREE);
2028           else
2029             continue;
2030         }
2031       else
2032         p = nonconstant_names[SSA_NAME_VERSION (use)];
2033       op_non_const = or_predicates (summary->conds, &p, &op_non_const);
2034     }
2035   if (gimple_code (stmt) == GIMPLE_ASSIGN
2036       && TREE_CODE (gimple_assign_lhs (stmt)) == SSA_NAME)
2037     nonconstant_names[SSA_NAME_VERSION (gimple_assign_lhs (stmt))]
2038       = op_non_const;
2039   return op_non_const;
2040 }
2041
2042 struct record_modified_bb_info
2043 {
2044   bitmap bb_set;
2045   gimple stmt;
2046 };
2047
2048 /* Callback of walk_aliased_vdefs.  Records basic blocks where the value may be
2049    set except for info->stmt.  */
2050
2051 static bool
2052 record_modified (ao_ref *ao ATTRIBUTE_UNUSED, tree vdef, void *data)
2053 {
2054   struct record_modified_bb_info *info =
2055     (struct record_modified_bb_info *) data;
2056   if (SSA_NAME_DEF_STMT (vdef) == info->stmt)
2057     return false;
2058   bitmap_set_bit (info->bb_set,
2059                   SSA_NAME_IS_DEFAULT_DEF (vdef)
2060                   ? ENTRY_BLOCK_PTR->index
2061                   : gimple_bb (SSA_NAME_DEF_STMT (vdef))->index);
2062   return false;
2063 }
2064
2065 /* Return probability (based on REG_BR_PROB_BASE) that I-th parameter of STMT
2066    will change since last invocation of STMT.
2067
2068    Value 0 is reserved for compile time invariants.
2069    For common parameters it is REG_BR_PROB_BASE.  For loop invariants it
2070    ought to be REG_BR_PROB_BASE / estimated_iters.  */
2071
2072 static int
2073 param_change_prob (gimple stmt, int i)
2074 {
2075   tree op = gimple_call_arg (stmt, i);
2076   basic_block bb = gimple_bb (stmt);
2077   tree base;
2078
2079   /* Global invariants neve change.  */
2080   if (is_gimple_min_invariant (op))
2081     return 0;
2082   /* We would have to do non-trivial analysis to really work out what
2083      is the probability of value to change (i.e. when init statement
2084      is in a sibling loop of the call).
2085
2086      We do an conservative estimate: when call is executed N times more often
2087      than the statement defining value, we take the frequency 1/N.  */
2088   if (TREE_CODE (op) == SSA_NAME)
2089     {
2090       int init_freq;
2091
2092       if (!bb->frequency)
2093         return REG_BR_PROB_BASE;
2094
2095       if (SSA_NAME_IS_DEFAULT_DEF (op))
2096         init_freq = ENTRY_BLOCK_PTR->frequency;
2097       else
2098         init_freq = gimple_bb (SSA_NAME_DEF_STMT (op))->frequency;
2099
2100       if (!init_freq)
2101         init_freq = 1;
2102       if (init_freq < bb->frequency)
2103         return MAX (GCOV_COMPUTE_SCALE (init_freq, bb->frequency), 1);
2104       else
2105         return REG_BR_PROB_BASE;
2106     }
2107
2108   base = get_base_address (op);
2109   if (base)
2110     {
2111       ao_ref refd;
2112       int max;
2113       struct record_modified_bb_info info;
2114       bitmap_iterator bi;
2115       unsigned index;
2116       tree init = ctor_for_folding (base);
2117
2118       if (init != error_mark_node)
2119         return 0;
2120       if (!bb->frequency)
2121         return REG_BR_PROB_BASE;
2122       ao_ref_init (&refd, op);
2123       info.stmt = stmt;
2124       info.bb_set = BITMAP_ALLOC (NULL);
2125       walk_aliased_vdefs (&refd, gimple_vuse (stmt), record_modified, &info,
2126                           NULL);
2127       if (bitmap_bit_p (info.bb_set, bb->index))
2128         {
2129           BITMAP_FREE (info.bb_set);
2130           return REG_BR_PROB_BASE;
2131         }
2132
2133       /* Assume that every memory is initialized at entry.
2134          TODO: Can we easilly determine if value is always defined
2135          and thus we may skip entry block?  */
2136       if (ENTRY_BLOCK_PTR->frequency)
2137         max = ENTRY_BLOCK_PTR->frequency;
2138       else
2139         max = 1;
2140
2141       EXECUTE_IF_SET_IN_BITMAP (info.bb_set, 0, index, bi)
2142         max = MIN (max, BASIC_BLOCK (index)->frequency);
2143
2144       BITMAP_FREE (info.bb_set);
2145       if (max < bb->frequency)
2146         return MAX (GCOV_COMPUTE_SCALE (max, bb->frequency), 1);
2147       else
2148         return REG_BR_PROB_BASE;
2149     }
2150   return REG_BR_PROB_BASE;
2151 }
2152
2153 /* Find whether a basic block BB is the final block of a (half) diamond CFG
2154    sub-graph and if the predicate the condition depends on is known.  If so,
2155    return true and store the pointer the predicate in *P.  */
2156
2157 static bool
2158 phi_result_unknown_predicate (struct ipa_node_params *info,
2159                               struct inline_summary *summary, basic_block bb,
2160                               struct predicate *p,
2161                               vec<predicate_t> nonconstant_names)
2162 {
2163   edge e;
2164   edge_iterator ei;
2165   basic_block first_bb = NULL;
2166   gimple stmt;
2167
2168   if (single_pred_p (bb))
2169     {
2170       *p = false_predicate ();
2171       return true;
2172     }
2173
2174   FOR_EACH_EDGE (e, ei, bb->preds)
2175     {
2176       if (single_succ_p (e->src))
2177         {
2178           if (!single_pred_p (e->src))
2179             return false;
2180           if (!first_bb)
2181             first_bb = single_pred (e->src);
2182           else if (single_pred (e->src) != first_bb)
2183             return false;
2184         }
2185       else
2186         {
2187           if (!first_bb)
2188             first_bb = e->src;
2189           else if (e->src != first_bb)
2190             return false;
2191         }
2192     }
2193
2194   if (!first_bb)
2195     return false;
2196
2197   stmt = last_stmt (first_bb);
2198   if (!stmt
2199       || gimple_code (stmt) != GIMPLE_COND
2200       || !is_gimple_ip_invariant (gimple_cond_rhs (stmt)))
2201     return false;
2202
2203   *p = will_be_nonconstant_expr_predicate (info, summary,
2204                                            gimple_cond_lhs (stmt),
2205                                            nonconstant_names);
2206   if (true_predicate_p (p))
2207     return false;
2208   else
2209     return true;
2210 }
2211
2212 /* Given a PHI statement in a function described by inline properties SUMMARY
2213    and *P being the predicate describing whether the selected PHI argument is
2214    known, store a predicate for the result of the PHI statement into
2215    NONCONSTANT_NAMES, if possible.  */
2216
2217 static void
2218 predicate_for_phi_result (struct inline_summary *summary, gimple phi,
2219                           struct predicate *p,
2220                           vec<predicate_t> nonconstant_names)
2221 {
2222   unsigned i;
2223
2224   for (i = 0; i < gimple_phi_num_args (phi); i++)
2225     {
2226       tree arg = gimple_phi_arg (phi, i)->def;
2227       if (!is_gimple_min_invariant (arg))
2228         {
2229           gcc_assert (TREE_CODE (arg) == SSA_NAME);
2230           *p = or_predicates (summary->conds, p,
2231                               &nonconstant_names[SSA_NAME_VERSION (arg)]);
2232           if (true_predicate_p (p))
2233             return;
2234         }
2235     }
2236
2237   if (dump_file && (dump_flags & TDF_DETAILS))
2238     {
2239       fprintf (dump_file, "\t\tphi predicate: ");
2240       dump_predicate (dump_file, summary->conds, p);
2241     }
2242   nonconstant_names[SSA_NAME_VERSION (gimple_phi_result (phi))] = *p;
2243 }
2244
2245 /* Return predicate specifying when array index in access OP becomes non-constant.  */
2246
2247 static struct predicate
2248 array_index_predicate (struct inline_summary *info,
2249                        vec< predicate_t> nonconstant_names, tree op)
2250 {
2251   struct predicate p = false_predicate ();
2252   while (handled_component_p (op))
2253     {
2254       if (TREE_CODE (op) == ARRAY_REF || TREE_CODE (op) == ARRAY_RANGE_REF)
2255         {
2256           if (TREE_CODE (TREE_OPERAND (op, 1)) == SSA_NAME)
2257             p = or_predicates (info->conds, &p,
2258                                &nonconstant_names[SSA_NAME_VERSION
2259                                                   (TREE_OPERAND (op, 1))]);
2260         }
2261       op = TREE_OPERAND (op, 0);
2262     }
2263   return p;
2264 }
2265
2266 /* For a typical usage of __builtin_expect (a<b, 1), we
2267    may introduce an extra relation stmt:
2268    With the builtin, we have
2269      t1 = a <= b;
2270      t2 = (long int) t1;
2271      t3 = __builtin_expect (t2, 1);
2272      if (t3 != 0)
2273        goto ...
2274    Without the builtin, we have
2275      if (a<=b)
2276        goto...
2277    This affects the size/time estimation and may have
2278    an impact on the earlier inlining.
2279    Here find this pattern and fix it up later.  */
2280
2281 static gimple
2282 find_foldable_builtin_expect (basic_block bb)
2283 {
2284   gimple_stmt_iterator bsi;
2285
2286   for (bsi = gsi_start_bb (bb); !gsi_end_p (bsi); gsi_next (&bsi))
2287     {
2288       gimple stmt = gsi_stmt (bsi);
2289       if (gimple_call_builtin_p (stmt, BUILT_IN_EXPECT))
2290         {
2291           tree var = gimple_call_lhs (stmt);
2292           tree arg = gimple_call_arg (stmt, 0);
2293           use_operand_p use_p;
2294           gimple use_stmt;
2295           bool match = false;
2296           bool done = false;
2297
2298           if (!var || !arg)
2299             continue;
2300           gcc_assert (TREE_CODE (var) == SSA_NAME);
2301
2302           while (TREE_CODE (arg) == SSA_NAME)
2303             {
2304               gimple stmt_tmp = SSA_NAME_DEF_STMT (arg);
2305               if (!is_gimple_assign (stmt_tmp))
2306                 break;
2307               switch (gimple_assign_rhs_code (stmt_tmp))
2308                 {
2309                   case LT_EXPR:
2310                   case LE_EXPR:
2311                   case GT_EXPR:
2312                   case GE_EXPR:
2313                   case EQ_EXPR:
2314                   case NE_EXPR:
2315                     match = true;
2316                     done = true;
2317                     break;
2318                   case NOP_EXPR:
2319                     break;
2320                   default:
2321                     done = true;
2322                     break;
2323                 }
2324               if (done)
2325                 break;
2326               arg = gimple_assign_rhs1 (stmt_tmp);
2327             }
2328
2329           if (match && single_imm_use (var, &use_p, &use_stmt)
2330               && gimple_code (use_stmt) == GIMPLE_COND)
2331             return use_stmt;
2332         }
2333     }
2334   return NULL;
2335 }
2336
2337 /* Compute function body size parameters for NODE.
2338    When EARLY is true, we compute only simple summaries without
2339    non-trivial predicates to drive the early inliner.  */
2340
2341 static void
2342 estimate_function_body_sizes (struct cgraph_node *node, bool early)
2343 {
2344   gcov_type time = 0;
2345   /* Estimate static overhead for function prologue/epilogue and alignment. */
2346   int size = 2;
2347   /* Benefits are scaled by probability of elimination that is in range
2348      <0,2>.  */
2349   basic_block bb;
2350   gimple_stmt_iterator bsi;
2351   struct function *my_function = DECL_STRUCT_FUNCTION (node->symbol.decl);
2352   int freq;
2353   struct inline_summary *info = inline_summary (node);
2354   struct predicate bb_predicate;
2355   struct ipa_node_params *parms_info = NULL;
2356   vec<predicate_t> nonconstant_names = vNULL;
2357   int nblocks, n;
2358   int *order;
2359   predicate array_index = true_predicate ();
2360   gimple fix_builtin_expect_stmt;
2361
2362   info->conds = NULL;
2363   info->entry = NULL;
2364
2365   if (optimize && !early)
2366     {
2367       calculate_dominance_info (CDI_DOMINATORS);
2368       loop_optimizer_init (LOOPS_NORMAL | LOOPS_HAVE_RECORDED_EXITS);
2369
2370       if (ipa_node_params_vector.exists ())
2371         {
2372           parms_info = IPA_NODE_REF (node);
2373           nonconstant_names.safe_grow_cleared
2374             (SSANAMES (my_function)->length ());
2375         }
2376     }
2377
2378   if (dump_file)
2379     fprintf (dump_file, "\nAnalyzing function body size: %s\n",
2380              cgraph_node_name (node));
2381
2382   /* When we run into maximal number of entries, we assign everything to the
2383      constant truth case.  Be sure to have it in list. */
2384   bb_predicate = true_predicate ();
2385   account_size_time (info, 0, 0, &bb_predicate);
2386
2387   bb_predicate = not_inlined_predicate ();
2388   account_size_time (info, 2 * INLINE_SIZE_SCALE, 0, &bb_predicate);
2389
2390   gcc_assert (my_function && my_function->cfg);
2391   if (parms_info)
2392     compute_bb_predicates (node, parms_info, info);
2393   gcc_assert (cfun == my_function);
2394   order = XNEWVEC (int, n_basic_blocks);
2395   nblocks = pre_and_rev_post_order_compute (NULL, order, false);
2396   for (n = 0; n < nblocks; n++)
2397     {
2398       bb = BASIC_BLOCK (order[n]);
2399       freq = compute_call_stmt_bb_frequency (node->symbol.decl, bb);
2400
2401       /* TODO: Obviously predicates can be propagated down across CFG.  */
2402       if (parms_info)
2403         {
2404           if (bb->aux)
2405             bb_predicate = *(struct predicate *) bb->aux;
2406           else
2407             bb_predicate = false_predicate ();
2408         }
2409       else
2410         bb_predicate = true_predicate ();
2411
2412       if (dump_file && (dump_flags & TDF_DETAILS))
2413         {
2414           fprintf (dump_file, "\n BB %i predicate:", bb->index);
2415           dump_predicate (dump_file, info->conds, &bb_predicate);
2416         }
2417
2418       if (parms_info && nonconstant_names.exists ())
2419         {
2420           struct predicate phi_predicate;
2421           bool first_phi = true;
2422
2423           for (bsi = gsi_start_phis (bb); !gsi_end_p (bsi); gsi_next (&bsi))
2424             {
2425               if (first_phi
2426                   && !phi_result_unknown_predicate (parms_info, info, bb,
2427                                                     &phi_predicate,
2428                                                     nonconstant_names))
2429                 break;
2430               first_phi = false;
2431               if (dump_file && (dump_flags & TDF_DETAILS))
2432                 {
2433                   fprintf (dump_file, "  ");
2434                   print_gimple_stmt (dump_file, gsi_stmt (bsi), 0, 0);
2435                 }
2436               predicate_for_phi_result (info, gsi_stmt (bsi), &phi_predicate,
2437                                         nonconstant_names);
2438             }
2439         }
2440
2441       fix_builtin_expect_stmt = find_foldable_builtin_expect (bb);
2442
2443       for (bsi = gsi_start_bb (bb); !gsi_end_p (bsi); gsi_next (&bsi))
2444         {
2445           gimple stmt = gsi_stmt (bsi);
2446           int this_size = estimate_num_insns (stmt, &eni_size_weights);
2447           int this_time = estimate_num_insns (stmt, &eni_time_weights);
2448           int prob;
2449           struct predicate will_be_nonconstant;
2450
2451           /* This relation stmt should be folded after we remove
2452              buildin_expect call. Adjust the cost here.  */
2453           if (stmt == fix_builtin_expect_stmt)
2454             {
2455               this_size--;
2456               this_time--;
2457             }
2458
2459           if (dump_file && (dump_flags & TDF_DETAILS))
2460             {
2461               fprintf (dump_file, "  ");
2462               print_gimple_stmt (dump_file, stmt, 0, 0);
2463               fprintf (dump_file, "\t\tfreq:%3.2f size:%3i time:%3i\n",
2464                        ((double) freq) / CGRAPH_FREQ_BASE, this_size,
2465                        this_time);
2466             }
2467
2468           if (gimple_assign_load_p (stmt) && nonconstant_names.exists ())
2469             {
2470               struct predicate this_array_index;
2471               this_array_index =
2472                 array_index_predicate (info, nonconstant_names,
2473                                        gimple_assign_rhs1 (stmt));
2474               if (!false_predicate_p (&this_array_index))
2475                 array_index =
2476                   and_predicates (info->conds, &array_index,
2477                                   &this_array_index);
2478             }
2479           if (gimple_store_p (stmt) && nonconstant_names.exists ())
2480             {
2481               struct predicate this_array_index;
2482               this_array_index =
2483                 array_index_predicate (info, nonconstant_names,
2484                                        gimple_get_lhs (stmt));
2485               if (!false_predicate_p (&this_array_index))
2486                 array_index =
2487                   and_predicates (info->conds, &array_index,
2488                                   &this_array_index);
2489             }
2490
2491
2492           if (is_gimple_call (stmt))
2493             {
2494               struct cgraph_edge *edge = cgraph_edge (node, stmt);
2495               struct inline_edge_summary *es = inline_edge_summary (edge);
2496
2497               /* Special case: results of BUILT_IN_CONSTANT_P will be always
2498                  resolved as constant.  We however don't want to optimize
2499                  out the cgraph edges.  */
2500               if (nonconstant_names.exists ()
2501                   && gimple_call_builtin_p (stmt, BUILT_IN_CONSTANT_P)
2502                   && gimple_call_lhs (stmt)
2503                   && TREE_CODE (gimple_call_lhs (stmt)) == SSA_NAME)
2504                 {
2505                   struct predicate false_p = false_predicate ();
2506                   nonconstant_names[SSA_NAME_VERSION (gimple_call_lhs (stmt))]
2507                     = false_p;
2508                 }
2509               if (ipa_node_params_vector.exists ())
2510                 {
2511                   int count = gimple_call_num_args (stmt);
2512                   int i;
2513
2514                   if (count)
2515                     es->param.safe_grow_cleared (count);
2516                   for (i = 0; i < count; i++)
2517                     {
2518                       int prob = param_change_prob (stmt, i);
2519                       gcc_assert (prob >= 0 && prob <= REG_BR_PROB_BASE);
2520                       es->param[i].change_prob = prob;
2521                     }
2522                 }
2523
2524               es->call_stmt_size = this_size;
2525               es->call_stmt_time = this_time;
2526               es->loop_depth = bb_loop_depth (bb);
2527               edge_set_predicate (edge, &bb_predicate);
2528             }
2529
2530           /* TODO: When conditional jump or swithc is known to be constant, but
2531              we did not translate it into the predicates, we really can account
2532              just maximum of the possible paths.  */
2533           if (parms_info)
2534             will_be_nonconstant
2535               = will_be_nonconstant_predicate (parms_info, info,
2536                                                stmt, nonconstant_names);
2537           if (this_time || this_size)
2538             {
2539               struct predicate p;
2540
2541               this_time *= freq;
2542
2543               prob = eliminated_by_inlining_prob (stmt);
2544               if (prob == 1 && dump_file && (dump_flags & TDF_DETAILS))
2545                 fprintf (dump_file,
2546                          "\t\t50%% will be eliminated by inlining\n");
2547               if (prob == 2 && dump_file && (dump_flags & TDF_DETAILS))
2548                 fprintf (dump_file, "\t\tWill be eliminated by inlining\n");
2549
2550               if (parms_info)
2551                 p = and_predicates (info->conds, &bb_predicate,
2552                                     &will_be_nonconstant);
2553               else
2554                 p = true_predicate ();
2555
2556               if (!false_predicate_p (&p))
2557                 {
2558                   time += this_time;
2559                   size += this_size;
2560                   if (time > MAX_TIME * INLINE_TIME_SCALE)
2561                     time = MAX_TIME * INLINE_TIME_SCALE;
2562                 }
2563
2564               /* We account everything but the calls.  Calls have their own
2565                  size/time info attached to cgraph edges.  This is necessary
2566                  in order to make the cost disappear after inlining.  */
2567               if (!is_gimple_call (stmt))
2568                 {
2569                   if (prob)
2570                     {
2571                       struct predicate ip = not_inlined_predicate ();
2572                       ip = and_predicates (info->conds, &ip, &p);
2573                       account_size_time (info, this_size * prob,
2574                                          this_time * prob, &ip);
2575                     }
2576                   if (prob != 2)
2577                     account_size_time (info, this_size * (2 - prob),
2578                                        this_time * (2 - prob), &p);
2579                 }
2580
2581               gcc_assert (time >= 0);
2582               gcc_assert (size >= 0);
2583             }
2584         }
2585     }
2586   set_hint_predicate (&inline_summary (node)->array_index, array_index);
2587   time = (time + CGRAPH_FREQ_BASE / 2) / CGRAPH_FREQ_BASE;
2588   if (time > MAX_TIME)
2589     time = MAX_TIME;
2590   free (order);
2591
2592   if (!early && nonconstant_names.exists ())
2593     {
2594       struct loop *loop;
2595       loop_iterator li;
2596       predicate loop_iterations = true_predicate ();
2597       predicate loop_stride = true_predicate ();
2598
2599       if (dump_file && (dump_flags & TDF_DETAILS))
2600         flow_loops_dump (dump_file, NULL, 0);
2601       scev_initialize ();
2602       FOR_EACH_LOOP (li, loop, 0)
2603         {
2604           vec<edge> exits;
2605           edge ex;
2606           unsigned int j, i;
2607           struct tree_niter_desc niter_desc;
2608           basic_block *body = get_loop_body (loop);
2609           bb_predicate = *(struct predicate *) loop->header->aux;
2610
2611           exits = get_loop_exit_edges (loop);
2612           FOR_EACH_VEC_ELT (exits, j, ex)
2613             if (number_of_iterations_exit (loop, ex, &niter_desc, false)
2614                 && !is_gimple_min_invariant (niter_desc.niter))
2615             {
2616               predicate will_be_nonconstant
2617                 = will_be_nonconstant_expr_predicate (parms_info, info,
2618                                                       niter_desc.niter,
2619                                                       nonconstant_names);
2620               if (!true_predicate_p (&will_be_nonconstant))
2621                 will_be_nonconstant = and_predicates (info->conds,
2622                                                       &bb_predicate,
2623                                                       &will_be_nonconstant);
2624               if (!true_predicate_p (&will_be_nonconstant)
2625                   && !false_predicate_p (&will_be_nonconstant))
2626                 /* This is slightly inprecise.  We may want to represent each
2627                    loop with independent predicate.  */
2628                 loop_iterations =
2629                   and_predicates (info->conds, &loop_iterations,
2630                                   &will_be_nonconstant);
2631             }
2632           exits.release ();
2633
2634           for (i = 0; i < loop->num_nodes; i++)
2635             {
2636               gimple_stmt_iterator gsi;
2637               bb_predicate = *(struct predicate *) body[i]->aux;
2638               for (gsi = gsi_start_bb (body[i]); !gsi_end_p (gsi);
2639                    gsi_next (&gsi))
2640                 {
2641                   gimple stmt = gsi_stmt (gsi);
2642                   affine_iv iv;
2643                   ssa_op_iter iter;
2644                   tree use;
2645
2646                   FOR_EACH_SSA_TREE_OPERAND (use, stmt, iter, SSA_OP_USE)
2647                   {
2648                     predicate will_be_nonconstant;
2649
2650                     if (!simple_iv
2651                         (loop, loop_containing_stmt (stmt), use, &iv, true)
2652                         || is_gimple_min_invariant (iv.step))
2653                       continue;
2654                     will_be_nonconstant
2655                       = will_be_nonconstant_expr_predicate (parms_info, info,
2656                                                             iv.step,
2657                                                             nonconstant_names);
2658                     if (!true_predicate_p (&will_be_nonconstant))
2659                       will_be_nonconstant
2660                          = and_predicates (info->conds,
2661                                            &bb_predicate,
2662                                            &will_be_nonconstant);
2663                     if (!true_predicate_p (&will_be_nonconstant)
2664                         && !false_predicate_p (&will_be_nonconstant))
2665                       /* This is slightly inprecise.  We may want to represent
2666                          each loop with independent predicate.  */
2667                       loop_stride =
2668                         and_predicates (info->conds, &loop_stride,
2669                                         &will_be_nonconstant);
2670                   }
2671                 }
2672             }
2673           free (body);
2674         }
2675       set_hint_predicate (&inline_summary (node)->loop_iterations,
2676                           loop_iterations);
2677       set_hint_predicate (&inline_summary (node)->loop_stride, loop_stride);
2678       scev_finalize ();
2679     }
2680   FOR_ALL_BB_FN (bb, my_function)
2681     {
2682       edge e;
2683       edge_iterator ei;
2684
2685       if (bb->aux)
2686         pool_free (edge_predicate_pool, bb->aux);
2687       bb->aux = NULL;
2688       FOR_EACH_EDGE (e, ei, bb->succs)
2689         {
2690           if (e->aux)
2691             pool_free (edge_predicate_pool, e->aux);
2692           e->aux = NULL;
2693         }
2694     }
2695   inline_summary (node)->self_time = time;
2696   inline_summary (node)->self_size = size;
2697   nonconstant_names.release ();
2698   if (optimize && !early)
2699     {
2700       loop_optimizer_finalize ();
2701       free_dominance_info (CDI_DOMINATORS);
2702     }
2703   if (dump_file)
2704     {
2705       fprintf (dump_file, "\n");
2706       dump_inline_summary (dump_file, node);
2707     }
2708 }
2709
2710
2711 /* Compute parameters of functions used by inliner.
2712    EARLY is true when we compute parameters for the early inliner  */
2713
2714 void
2715 compute_inline_parameters (struct cgraph_node *node, bool early)
2716 {
2717   HOST_WIDE_INT self_stack_size;
2718   struct cgraph_edge *e;
2719   struct inline_summary *info;
2720
2721   gcc_assert (!node->global.inlined_to);
2722
2723   inline_summary_alloc ();
2724
2725   info = inline_summary (node);
2726   reset_inline_summary (node);
2727
2728   /* FIXME: Thunks are inlinable, but tree-inline don't know how to do that.
2729      Once this happen, we will need to more curefully predict call
2730      statement size.  */
2731   if (node->thunk.thunk_p)
2732     {
2733       struct inline_edge_summary *es = inline_edge_summary (node->callees);
2734       struct predicate t = true_predicate ();
2735
2736       info->inlinable = 0;
2737       node->callees->call_stmt_cannot_inline_p = true;
2738       node->local.can_change_signature = false;
2739       es->call_stmt_time = 1;
2740       es->call_stmt_size = 1;
2741       account_size_time (info, 0, 0, &t);
2742       return;
2743     }
2744
2745   /* Even is_gimple_min_invariant rely on current_function_decl.  */
2746   push_cfun (DECL_STRUCT_FUNCTION (node->symbol.decl));
2747
2748   /* Estimate the stack size for the function if we're optimizing.  */
2749   self_stack_size = optimize ? estimated_stack_frame_size (node) : 0;
2750   info->estimated_self_stack_size = self_stack_size;
2751   info->estimated_stack_size = self_stack_size;
2752   info->stack_frame_offset = 0;
2753
2754   /* Can this function be inlined at all?  */
2755   if (!optimize && !lookup_attribute ("always_inline",
2756                                       DECL_ATTRIBUTES (node->symbol.decl)))
2757     info->inlinable = false;
2758   else
2759     info->inlinable = tree_inlinable_function_p (node->symbol.decl);
2760
2761   /* Type attributes can use parameter indices to describe them.  */
2762   if (TYPE_ATTRIBUTES (TREE_TYPE (node->symbol.decl)))
2763     node->local.can_change_signature = false;
2764   else
2765     {
2766       /* Otherwise, inlinable functions always can change signature.  */
2767       if (info->inlinable)
2768         node->local.can_change_signature = true;
2769       else
2770         {
2771           /* Functions calling builtin_apply can not change signature.  */
2772           for (e = node->callees; e; e = e->next_callee)
2773             {
2774               tree cdecl = e->callee->symbol.decl;
2775               if (DECL_BUILT_IN (cdecl)
2776                   && DECL_BUILT_IN_CLASS (cdecl) == BUILT_IN_NORMAL
2777                   && (DECL_FUNCTION_CODE (cdecl) == BUILT_IN_APPLY_ARGS
2778                       || DECL_FUNCTION_CODE (cdecl) == BUILT_IN_VA_START))
2779                 break;
2780             }
2781           node->local.can_change_signature = !e;
2782         }
2783     }
2784   estimate_function_body_sizes (node, early);
2785
2786   /* Inlining characteristics are maintained by the cgraph_mark_inline.  */
2787   info->time = info->self_time;
2788   info->size = info->self_size;
2789   info->stack_frame_offset = 0;
2790   info->estimated_stack_size = info->estimated_self_stack_size;
2791 #ifdef ENABLE_CHECKING
2792   inline_update_overall_summary (node);
2793   gcc_assert (info->time == info->self_time && info->size == info->self_size);
2794 #endif
2795
2796   pop_cfun ();
2797 }
2798
2799
2800 /* Compute parameters of functions used by inliner using
2801    current_function_decl.  */
2802
2803 static unsigned int
2804 compute_inline_parameters_for_current (void)
2805 {
2806   compute_inline_parameters (cgraph_get_node (current_function_decl), true);
2807   return 0;
2808 }
2809
2810 namespace {
2811
2812 const pass_data pass_data_inline_parameters =
2813 {
2814   GIMPLE_PASS, /* type */
2815   "inline_param", /* name */
2816   OPTGROUP_INLINE, /* optinfo_flags */
2817   false, /* has_gate */
2818   true, /* has_execute */
2819   TV_INLINE_PARAMETERS, /* tv_id */
2820   0, /* properties_required */
2821   0, /* properties_provided */
2822   0, /* properties_destroyed */
2823   0, /* todo_flags_start */
2824   0, /* todo_flags_finish */
2825 };
2826
2827 class pass_inline_parameters : public gimple_opt_pass
2828 {
2829 public:
2830   pass_inline_parameters (gcc::context *ctxt)
2831     : gimple_opt_pass (pass_data_inline_parameters, ctxt)
2832   {}
2833
2834   /* opt_pass methods: */
2835   opt_pass * clone () { return new pass_inline_parameters (m_ctxt); }
2836   unsigned int execute () {
2837     return compute_inline_parameters_for_current ();
2838   }
2839
2840 }; // class pass_inline_parameters
2841
2842 } // anon namespace
2843
2844 gimple_opt_pass *
2845 make_pass_inline_parameters (gcc::context *ctxt)
2846 {
2847   return new pass_inline_parameters (ctxt);
2848 }
2849
2850
2851 /* Estimate benefit devirtualizing indirect edge IE, provided KNOWN_VALS and
2852    KNOWN_BINFOS.  */
2853
2854 static bool
2855 estimate_edge_devirt_benefit (struct cgraph_edge *ie,
2856                               int *size, int *time,
2857                               vec<tree> known_vals,
2858                               vec<tree> known_binfos,
2859                               vec<ipa_agg_jump_function_p> known_aggs)
2860 {
2861   tree target;
2862   struct cgraph_node *callee;
2863   struct inline_summary *isummary;
2864
2865   if (!known_vals.exists () && !known_binfos.exists ())
2866     return false;
2867   if (!flag_indirect_inlining)
2868     return false;
2869
2870   target = ipa_get_indirect_edge_target (ie, known_vals, known_binfos,
2871                                          known_aggs);
2872   if (!target)
2873     return false;
2874
2875   /* Account for difference in cost between indirect and direct calls.  */
2876   *size -= (eni_size_weights.indirect_call_cost - eni_size_weights.call_cost);
2877   *time -= (eni_time_weights.indirect_call_cost - eni_time_weights.call_cost);
2878   gcc_checking_assert (*time >= 0);
2879   gcc_checking_assert (*size >= 0);
2880
2881   callee = cgraph_get_node (target);
2882   if (!callee || !callee->symbol.definition)
2883     return false;
2884   isummary = inline_summary (callee);
2885   return isummary->inlinable;
2886 }
2887
2888 /* Increase SIZE and TIME for size and time needed to handle edge E.  */
2889
2890 static inline void
2891 estimate_edge_size_and_time (struct cgraph_edge *e, int *size, int *time,
2892                              int prob,
2893                              vec<tree> known_vals,
2894                              vec<tree> known_binfos,
2895                              vec<ipa_agg_jump_function_p> known_aggs,
2896                              inline_hints *hints)
2897 {
2898   struct inline_edge_summary *es = inline_edge_summary (e);
2899   int call_size = es->call_stmt_size;
2900   int call_time = es->call_stmt_time;
2901   if (!e->callee
2902       && estimate_edge_devirt_benefit (e, &call_size, &call_time,
2903                                        known_vals, known_binfos, known_aggs)
2904       && hints && cgraph_maybe_hot_edge_p (e))
2905     *hints |= INLINE_HINT_indirect_call;
2906   *size += call_size * INLINE_SIZE_SCALE;
2907   *time += apply_probability ((gcov_type) call_time, prob)
2908     * e->frequency * (INLINE_TIME_SCALE / CGRAPH_FREQ_BASE);
2909   if (*time > MAX_TIME * INLINE_TIME_SCALE)
2910     *time = MAX_TIME * INLINE_TIME_SCALE;
2911 }
2912
2913
2914
2915 /* Increase SIZE and TIME for size and time needed to handle all calls in NODE.
2916    POSSIBLE_TRUTHS, KNOWN_VALS and KNOWN_BINFOS describe context of the call
2917    site.  */
2918
2919 static void
2920 estimate_calls_size_and_time (struct cgraph_node *node, int *size, int *time,
2921                               inline_hints *hints,
2922                               clause_t possible_truths,
2923                               vec<tree> known_vals,
2924                               vec<tree> known_binfos,
2925                               vec<ipa_agg_jump_function_p> known_aggs)
2926 {
2927   struct cgraph_edge *e;
2928   for (e = node->callees; e; e = e->next_callee)
2929     {
2930       struct inline_edge_summary *es = inline_edge_summary (e);
2931       if (!es->predicate
2932           || evaluate_predicate (es->predicate, possible_truths))
2933         {
2934           if (e->inline_failed)
2935             {
2936               /* Predicates of calls shall not use NOT_CHANGED codes,
2937                  sowe do not need to compute probabilities.  */
2938               estimate_edge_size_and_time (e, size, time, REG_BR_PROB_BASE,
2939                                            known_vals, known_binfos,
2940                                            known_aggs, hints);
2941             }
2942           else
2943             estimate_calls_size_and_time (e->callee, size, time, hints,
2944                                           possible_truths,
2945                                           known_vals, known_binfos,
2946                                           known_aggs);
2947         }
2948     }
2949   for (e = node->indirect_calls; e; e = e->next_callee)
2950     {
2951       struct inline_edge_summary *es = inline_edge_summary (e);
2952       if (!es->predicate
2953           || evaluate_predicate (es->predicate, possible_truths))
2954         estimate_edge_size_and_time (e, size, time, REG_BR_PROB_BASE,
2955                                      known_vals, known_binfos, known_aggs,
2956                                      hints);
2957     }
2958 }
2959
2960
2961 /* Estimate size and time needed to execute NODE assuming
2962    POSSIBLE_TRUTHS clause, and KNOWN_VALS and KNOWN_BINFOS information
2963    about NODE's arguments. */
2964
2965 static void
2966 estimate_node_size_and_time (struct cgraph_node *node,
2967                              clause_t possible_truths,
2968                              vec<tree> known_vals,
2969                              vec<tree> known_binfos,
2970                              vec<ipa_agg_jump_function_p> known_aggs,
2971                              int *ret_size, int *ret_time,
2972                              inline_hints *ret_hints,
2973                              vec<inline_param_summary_t>
2974                              inline_param_summary)
2975 {
2976   struct inline_summary *info = inline_summary (node);
2977   size_time_entry *e;
2978   int size = 0;
2979   int time = 0;
2980   inline_hints hints = 0;
2981   int i;
2982
2983   if (dump_file && (dump_flags & TDF_DETAILS))
2984     {
2985       bool found = false;
2986       fprintf (dump_file, "   Estimating body: %s/%i\n"
2987                "   Known to be false: ", cgraph_node_name (node),
2988                node->symbol.order);
2989
2990       for (i = predicate_not_inlined_condition;
2991            i < (predicate_first_dynamic_condition
2992                 + (int) vec_safe_length (info->conds)); i++)
2993         if (!(possible_truths & (1 << i)))
2994           {
2995             if (found)
2996               fprintf (dump_file, ", ");
2997             found = true;
2998             dump_condition (dump_file, info->conds, i);
2999           }
3000     }
3001
3002   for (i = 0; vec_safe_iterate (info->entry, i, &e); i++)
3003     if (evaluate_predicate (&e->predicate, possible_truths))
3004       {
3005         size += e->size;
3006         gcc_checking_assert (e->time >= 0);
3007         gcc_checking_assert (time >= 0);
3008         if (!inline_param_summary.exists ())
3009           time += e->time;
3010         else
3011           {
3012             int prob = predicate_probability (info->conds,
3013                                               &e->predicate,
3014                                               possible_truths,
3015                                               inline_param_summary);
3016             gcc_checking_assert (prob >= 0);
3017             gcc_checking_assert (prob <= REG_BR_PROB_BASE);
3018             time += apply_probability ((gcov_type) e->time, prob);
3019           }
3020         if (time > MAX_TIME * INLINE_TIME_SCALE)
3021           time = MAX_TIME * INLINE_TIME_SCALE;
3022         gcc_checking_assert (time >= 0);
3023
3024       }
3025   gcc_checking_assert (size >= 0);
3026   gcc_checking_assert (time >= 0);
3027
3028   if (info->loop_iterations
3029       && !evaluate_predicate (info->loop_iterations, possible_truths))
3030     hints |= INLINE_HINT_loop_iterations;
3031   if (info->loop_stride
3032       && !evaluate_predicate (info->loop_stride, possible_truths))
3033     hints |= INLINE_HINT_loop_stride;
3034   if (info->array_index
3035       && !evaluate_predicate (info->array_index, possible_truths))
3036     hints |= INLINE_HINT_array_index;
3037   if (info->scc_no)
3038     hints |= INLINE_HINT_in_scc;
3039   if (DECL_DECLARED_INLINE_P (node->symbol.decl))
3040     hints |= INLINE_HINT_declared_inline;
3041
3042   estimate_calls_size_and_time (node, &size, &time, &hints, possible_truths,
3043                                 known_vals, known_binfos, known_aggs);
3044   gcc_checking_assert (size >= 0);
3045   gcc_checking_assert (time >= 0);
3046   time = RDIV (time, INLINE_TIME_SCALE);
3047   size = RDIV (size, INLINE_SIZE_SCALE);
3048
3049   if (dump_file && (dump_flags & TDF_DETAILS))
3050     fprintf (dump_file, "\n   size:%i time:%i\n", (int) size, (int) time);
3051   if (ret_time)
3052     *ret_time = time;
3053   if (ret_size)
3054     *ret_size = size;
3055   if (ret_hints)
3056     *ret_hints = hints;
3057   return;
3058 }
3059
3060
3061 /* Estimate size and time needed to execute callee of EDGE assuming that
3062    parameters known to be constant at caller of EDGE are propagated.
3063    KNOWN_VALS and KNOWN_BINFOS are vectors of assumed known constant values
3064    and types for parameters.  */
3065
3066 void
3067 estimate_ipcp_clone_size_and_time (struct cgraph_node *node,
3068                                    vec<tree> known_vals,
3069                                    vec<tree> known_binfos,
3070                                    vec<ipa_agg_jump_function_p> known_aggs,
3071                                    int *ret_size, int *ret_time,
3072                                    inline_hints *hints)
3073 {
3074   clause_t clause;
3075
3076   clause = evaluate_conditions_for_known_args (node, false, known_vals,
3077                                                known_aggs);
3078   estimate_node_size_and_time (node, clause, known_vals, known_binfos,
3079                                known_aggs, ret_size, ret_time, hints, vNULL);
3080 }
3081
3082 /* Translate all conditions from callee representation into caller
3083    representation and symbolically evaluate predicate P into new predicate.
3084
3085    INFO is inline_summary of function we are adding predicate into, CALLEE_INFO
3086    is summary of function predicate P is from. OPERAND_MAP is array giving
3087    callee formal IDs the caller formal IDs. POSSSIBLE_TRUTHS is clausule of all
3088    callee conditions that may be true in caller context.  TOPLEV_PREDICATE is
3089    predicate under which callee is executed.  OFFSET_MAP is an array of of
3090    offsets that need to be added to conditions, negative offset means that
3091    conditions relying on values passed by reference have to be discarded
3092    because they might not be preserved (and should be considered offset zero
3093    for other purposes).  */
3094
3095 static struct predicate
3096 remap_predicate (struct inline_summary *info,
3097                  struct inline_summary *callee_info,
3098                  struct predicate *p,
3099                  vec<int> operand_map,
3100                  vec<int> offset_map,
3101                  clause_t possible_truths, struct predicate *toplev_predicate)
3102 {
3103   int i;
3104   struct predicate out = true_predicate ();
3105
3106   /* True predicate is easy.  */
3107   if (true_predicate_p (p))
3108     return *toplev_predicate;
3109   for (i = 0; p->clause[i]; i++)
3110     {
3111       clause_t clause = p->clause[i];
3112       int cond;
3113       struct predicate clause_predicate = false_predicate ();
3114
3115       gcc_assert (i < MAX_CLAUSES);
3116
3117       for (cond = 0; cond < NUM_CONDITIONS; cond++)
3118         /* Do we have condition we can't disprove?   */
3119         if (clause & possible_truths & (1 << cond))
3120           {
3121             struct predicate cond_predicate;
3122             /* Work out if the condition can translate to predicate in the
3123                inlined function.  */
3124             if (cond >= predicate_first_dynamic_condition)
3125               {
3126                 struct condition *c;
3127
3128                 c = &(*callee_info->conds)[cond
3129                                            -
3130                                            predicate_first_dynamic_condition];
3131                 /* See if we can remap condition operand to caller's operand.
3132                    Otherwise give up.  */
3133                 if (!operand_map.exists ()
3134                     || (int) operand_map.length () <= c->operand_num
3135                     || operand_map[c->operand_num] == -1
3136                     /* TODO: For non-aggregate conditions, adding an offset is
3137                        basically an arithmetic jump function processing which
3138                        we should support in future.  */
3139                     || ((!c->agg_contents || !c->by_ref)
3140                         && offset_map[c->operand_num] > 0)
3141                     || (c->agg_contents && c->by_ref
3142                         && offset_map[c->operand_num] < 0))
3143                   cond_predicate = true_predicate ();
3144                 else
3145                   {
3146                     struct agg_position_info ap;
3147                     HOST_WIDE_INT offset_delta = offset_map[c->operand_num];
3148                     if (offset_delta < 0)
3149                       {
3150                         gcc_checking_assert (!c->agg_contents || !c->by_ref);
3151                         offset_delta = 0;
3152                       }
3153                     gcc_assert (!c->agg_contents
3154                                 || c->by_ref || offset_delta == 0);
3155                     ap.offset = c->offset + offset_delta;
3156                     ap.agg_contents = c->agg_contents;
3157                     ap.by_ref = c->by_ref;
3158                     cond_predicate = add_condition (info,
3159                                                     operand_map[c->operand_num],
3160                                                     &ap, c->code, c->val);
3161                   }
3162               }
3163             /* Fixed conditions remains same, construct single
3164                condition predicate.  */
3165             else
3166               {
3167                 cond_predicate.clause[0] = 1 << cond;
3168                 cond_predicate.clause[1] = 0;
3169               }
3170             clause_predicate = or_predicates (info->conds, &clause_predicate,
3171                                               &cond_predicate);
3172           }
3173       out = and_predicates (info->conds, &out, &clause_predicate);
3174     }
3175   return and_predicates (info->conds, &out, toplev_predicate);
3176 }
3177
3178
3179 /* Update summary information of inline clones after inlining.
3180    Compute peak stack usage.  */
3181
3182 static void
3183 inline_update_callee_summaries (struct cgraph_node *node, int depth)
3184 {
3185   struct cgraph_edge *e;
3186   struct inline_summary *callee_info = inline_summary (node);
3187   struct inline_summary *caller_info = inline_summary (node->callers->caller);
3188   HOST_WIDE_INT peak;
3189
3190   callee_info->stack_frame_offset
3191     = caller_info->stack_frame_offset
3192     + caller_info->estimated_self_stack_size;
3193   peak = callee_info->stack_frame_offset
3194     + callee_info->estimated_self_stack_size;
3195   if (inline_summary (node->global.inlined_to)->estimated_stack_size < peak)
3196       inline_summary (node->global.inlined_to)->estimated_stack_size = peak;
3197   ipa_propagate_frequency (node);
3198   for (e = node->callees; e; e = e->next_callee)
3199     {
3200       if (!e->inline_failed)
3201         inline_update_callee_summaries (e->callee, depth);
3202       inline_edge_summary (e)->loop_depth += depth;
3203     }
3204   for (e = node->indirect_calls; e; e = e->next_callee)
3205     inline_edge_summary (e)->loop_depth += depth;
3206 }
3207
3208 /* Update change_prob of EDGE after INLINED_EDGE has been inlined.
3209    When functoin A is inlined in B and A calls C with parameter that
3210    changes with probability PROB1 and C is known to be passthroug
3211    of argument if B that change with probability PROB2, the probability
3212    of change is now PROB1*PROB2.  */
3213
3214 static void
3215 remap_edge_change_prob (struct cgraph_edge *inlined_edge,
3216                         struct cgraph_edge *edge)
3217 {
3218   if (ipa_node_params_vector.exists ())
3219     {
3220       int i;
3221       struct ipa_edge_args *args = IPA_EDGE_REF (edge);
3222       struct inline_edge_summary *es = inline_edge_summary (edge);
3223       struct inline_edge_summary *inlined_es
3224         = inline_edge_summary (inlined_edge);
3225
3226       for (i = 0; i < ipa_get_cs_argument_count (args); i++)
3227         {
3228           struct ipa_jump_func *jfunc = ipa_get_ith_jump_func (args, i);
3229           if (jfunc->type == IPA_JF_PASS_THROUGH
3230               && (ipa_get_jf_pass_through_formal_id (jfunc)
3231                   < (int) inlined_es->param.length ()))
3232             {
3233               int jf_formal_id = ipa_get_jf_pass_through_formal_id (jfunc);
3234               int prob1 = es->param[i].change_prob;
3235               int prob2 = inlined_es->param[jf_formal_id].change_prob;
3236               int prob = combine_probabilities (prob1, prob2);
3237
3238               if (prob1 && prob2 && !prob)
3239                 prob = 1;
3240
3241               es->param[i].change_prob = prob;
3242             }
3243         }
3244     }
3245 }
3246
3247 /* Update edge summaries of NODE after INLINED_EDGE has been inlined.
3248
3249    Remap predicates of callees of NODE.  Rest of arguments match
3250    remap_predicate.
3251
3252    Also update change probabilities.  */
3253
3254 static void
3255 remap_edge_summaries (struct cgraph_edge *inlined_edge,
3256                       struct cgraph_node *node,
3257                       struct inline_summary *info,
3258                       struct inline_summary *callee_info,
3259                       vec<int> operand_map,
3260                       vec<int> offset_map,
3261                       clause_t possible_truths,
3262                       struct predicate *toplev_predicate)
3263 {
3264   struct cgraph_edge *e;
3265   for (e = node->callees; e; e = e->next_callee)
3266     {
3267       struct inline_edge_summary *es = inline_edge_summary (e);
3268       struct predicate p;
3269
3270       if (e->inline_failed)
3271         {
3272           remap_edge_change_prob (inlined_edge, e);
3273
3274           if (es->predicate)
3275             {
3276               p = remap_predicate (info, callee_info,
3277                                    es->predicate, operand_map, offset_map,
3278                                    possible_truths, toplev_predicate);
3279               edge_set_predicate (e, &p);
3280               /* TODO: We should remove the edge for code that will be
3281                  optimized out, but we need to keep verifiers and tree-inline
3282                  happy.  Make it cold for now.  */
3283               if (false_predicate_p (&p))
3284                 {
3285                   e->count = 0;
3286                   e->frequency = 0;
3287                 }
3288             }
3289           else
3290             edge_set_predicate (e, toplev_predicate);
3291         }
3292       else
3293         remap_edge_summaries (inlined_edge, e->callee, info, callee_info,
3294                               operand_map, offset_map, possible_truths,
3295                               toplev_predicate);
3296     }
3297   for (e = node->indirect_calls; e; e = e->next_callee)
3298     {
3299       struct inline_edge_summary *es = inline_edge_summary (e);
3300       struct predicate p;
3301
3302       remap_edge_change_prob (inlined_edge, e);
3303       if (es->predicate)
3304         {
3305           p = remap_predicate (info, callee_info,
3306                                es->predicate, operand_map, offset_map,
3307                                possible_truths, toplev_predicate);
3308           edge_set_predicate (e, &p);
3309           /* TODO: We should remove the edge for code that will be optimized
3310              out, but we need to keep verifiers and tree-inline happy.
3311              Make it cold for now.  */
3312           if (false_predicate_p (&p))
3313             {
3314               e->count = 0;
3315               e->frequency = 0;
3316             }
3317         }
3318       else
3319         edge_set_predicate (e, toplev_predicate);
3320     }
3321 }
3322
3323 /* Same as remap_predicate, but set result into hint *HINT.  */
3324
3325 static void
3326 remap_hint_predicate (struct inline_summary *info,
3327                       struct inline_summary *callee_info,
3328                       struct predicate **hint,
3329                       vec<int> operand_map,
3330                       vec<int> offset_map,
3331                       clause_t possible_truths,
3332                       struct predicate *toplev_predicate)
3333 {
3334   predicate p;
3335
3336   if (!*hint)
3337     return;
3338   p = remap_predicate (info, callee_info,
3339                        *hint,
3340                        operand_map, offset_map,
3341                        possible_truths, toplev_predicate);
3342   if (!false_predicate_p (&p) && !true_predicate_p (&p))
3343     {
3344       if (!*hint)
3345         set_hint_predicate (hint, p);
3346       else
3347         **hint = and_predicates (info->conds, *hint, &p);
3348     }
3349 }
3350
3351 /* We inlined EDGE.  Update summary of the function we inlined into.  */
3352
3353 void
3354 inline_merge_summary (struct cgraph_edge *edge)
3355 {
3356   struct inline_summary *callee_info = inline_summary (edge->callee);
3357   struct cgraph_node *to = (edge->caller->global.inlined_to
3358                             ? edge->caller->global.inlined_to : edge->caller);
3359   struct inline_summary *info = inline_summary (to);
3360   clause_t clause = 0;          /* not_inline is known to be false.  */
3361   size_time_entry *e;
3362   vec<int> operand_map = vNULL;
3363   vec<int> offset_map = vNULL;
3364   int i;
3365   struct predicate toplev_predicate;
3366   struct predicate true_p = true_predicate ();
3367   struct inline_edge_summary *es = inline_edge_summary (edge);
3368
3369   if (es->predicate)
3370     toplev_predicate = *es->predicate;
3371   else
3372     toplev_predicate = true_predicate ();
3373
3374   if (ipa_node_params_vector.exists () && callee_info->conds)
3375     {
3376       struct ipa_edge_args *args = IPA_EDGE_REF (edge);
3377       int count = ipa_get_cs_argument_count (args);
3378       int i;
3379
3380       evaluate_properties_for_edge (edge, true, &clause, NULL, NULL, NULL);
3381       if (count)
3382         {
3383           operand_map.safe_grow_cleared (count);
3384           offset_map.safe_grow_cleared (count);
3385         }
3386       for (i = 0; i < count; i++)
3387         {
3388           struct ipa_jump_func *jfunc = ipa_get_ith_jump_func (args, i);
3389           int map = -1;
3390
3391           /* TODO: handle non-NOPs when merging.  */
3392           if (jfunc->type == IPA_JF_PASS_THROUGH)
3393             {
3394               if (ipa_get_jf_pass_through_operation (jfunc) == NOP_EXPR)
3395                 map = ipa_get_jf_pass_through_formal_id (jfunc);
3396               if (!ipa_get_jf_pass_through_agg_preserved (jfunc))
3397                 offset_map[i] = -1;
3398             }
3399           else if (jfunc->type == IPA_JF_ANCESTOR)
3400             {
3401               HOST_WIDE_INT offset = ipa_get_jf_ancestor_offset (jfunc);
3402               if (offset >= 0 && offset < INT_MAX)
3403                 {
3404                   map = ipa_get_jf_ancestor_formal_id (jfunc);
3405                   if (!ipa_get_jf_ancestor_agg_preserved (jfunc))
3406                     offset = -1;
3407                   offset_map[i] = offset;
3408                 }
3409             }
3410           operand_map[i] = map;
3411           gcc_assert (map < ipa_get_param_count (IPA_NODE_REF (to)));
3412         }
3413     }
3414   for (i = 0; vec_safe_iterate (callee_info->entry, i, &e); i++)
3415     {
3416       struct predicate p = remap_predicate (info, callee_info,
3417                                             &e->predicate, operand_map,
3418                                             offset_map, clause,
3419                                             &toplev_predicate);
3420       if (!false_predicate_p (&p))
3421         {
3422           gcov_type add_time = ((gcov_type) e->time * edge->frequency
3423                                 + CGRAPH_FREQ_BASE / 2) / CGRAPH_FREQ_BASE;
3424           int prob = predicate_probability (callee_info->conds,
3425                                             &e->predicate,
3426                                             clause, es->param);
3427           add_time = apply_probability ((gcov_type) add_time, prob);
3428           if (add_time > MAX_TIME * INLINE_TIME_SCALE)
3429             add_time = MAX_TIME * INLINE_TIME_SCALE;
3430           if (prob != REG_BR_PROB_BASE
3431               && dump_file && (dump_flags & TDF_DETAILS))
3432             {
3433               fprintf (dump_file, "\t\tScaling time by probability:%f\n",
3434                        (double) prob / REG_BR_PROB_BASE);
3435             }
3436           account_size_time (info, e->size, add_time, &p);
3437         }
3438     }
3439   remap_edge_summaries (edge, edge->callee, info, callee_info, operand_map,
3440                         offset_map, clause, &toplev_predicate);
3441   remap_hint_predicate (info, callee_info,
3442                         &callee_info->loop_iterations,
3443                         operand_map, offset_map, clause, &toplev_predicate);
3444   remap_hint_predicate (info, callee_info,
3445                         &callee_info->loop_stride,
3446                         operand_map, offset_map, clause, &toplev_predicate);
3447   remap_hint_predicate (info, callee_info,
3448                         &callee_info->array_index,
3449                         operand_map, offset_map, clause, &toplev_predicate);
3450
3451   inline_update_callee_summaries (edge->callee,
3452                                   inline_edge_summary (edge)->loop_depth);
3453
3454   /* We do not maintain predicates of inlined edges, free it.  */
3455   edge_set_predicate (edge, &true_p);
3456   /* Similarly remove param summaries.  */
3457   es->param.release ();
3458   operand_map.release ();
3459   offset_map.release ();
3460 }
3461
3462 /* For performance reasons inline_merge_summary is not updating overall size
3463    and time.  Recompute it.  */
3464
3465 void
3466 inline_update_overall_summary (struct cgraph_node *node)
3467 {
3468   struct inline_summary *info = inline_summary (node);
3469   size_time_entry *e;
3470   int i;
3471
3472   info->size = 0;
3473   info->time = 0;
3474   for (i = 0; vec_safe_iterate (info->entry, i, &e); i++)
3475     {
3476       info->size += e->size, info->time += e->time;
3477       if (info->time > MAX_TIME * INLINE_TIME_SCALE)
3478         info->time = MAX_TIME * INLINE_TIME_SCALE;
3479     }
3480   estimate_calls_size_and_time (node, &info->size, &info->time, NULL,
3481                                 ~(clause_t) (1 << predicate_false_condition),
3482                                 vNULL, vNULL, vNULL);
3483   info->time = (info->time + INLINE_TIME_SCALE / 2) / INLINE_TIME_SCALE;
3484   info->size = (info->size + INLINE_SIZE_SCALE / 2) / INLINE_SIZE_SCALE;
3485 }
3486
3487 /* Return hints derrived from EDGE.   */
3488 int
3489 simple_edge_hints (struct cgraph_edge *edge)
3490 {
3491   int hints = 0;
3492   struct cgraph_node *to = (edge->caller->global.inlined_to
3493                             ? edge->caller->global.inlined_to : edge->caller);
3494   if (inline_summary (to)->scc_no
3495       && inline_summary (to)->scc_no == inline_summary (edge->callee)->scc_no
3496       && !cgraph_edge_recursive_p (edge))
3497     hints |= INLINE_HINT_same_scc;
3498
3499   if (to->symbol.lto_file_data && edge->callee->symbol.lto_file_data
3500       && to->symbol.lto_file_data != edge->callee->symbol.lto_file_data)
3501     hints |= INLINE_HINT_cross_module;
3502
3503   return hints;
3504 }
3505
3506 /* Estimate the time cost for the caller when inlining EDGE.
3507    Only to be called via estimate_edge_time, that handles the
3508    caching mechanism.
3509
3510    When caching, also update the cache entry.  Compute both time and
3511    size, since we always need both metrics eventually.  */
3512
3513 int
3514 do_estimate_edge_time (struct cgraph_edge *edge)
3515 {
3516   int time;
3517   int size;
3518   inline_hints hints;
3519   struct cgraph_node *callee;
3520   clause_t clause;
3521   vec<tree> known_vals;
3522   vec<tree> known_binfos;
3523   vec<ipa_agg_jump_function_p> known_aggs;
3524   struct inline_edge_summary *es = inline_edge_summary (edge);
3525
3526   callee = cgraph_function_or_thunk_node (edge->callee, NULL);
3527
3528   gcc_checking_assert (edge->inline_failed);
3529   evaluate_properties_for_edge (edge, true,
3530                                 &clause, &known_vals, &known_binfos,
3531                                 &known_aggs);
3532   estimate_node_size_and_time (callee, clause, known_vals, known_binfos,
3533                                known_aggs, &size, &time, &hints, es->param);
3534   known_vals.release ();
3535   known_binfos.release ();
3536   known_aggs.release ();
3537   gcc_checking_assert (size >= 0);
3538   gcc_checking_assert (time >= 0);
3539
3540   /* When caching, update the cache entry.  */
3541   if (edge_growth_cache.exists ())
3542     {
3543       if ((int) edge_growth_cache.length () <= edge->uid)
3544         edge_growth_cache.safe_grow_cleared (cgraph_edge_max_uid);
3545       edge_growth_cache[edge->uid].time = time + (time >= 0);
3546
3547       edge_growth_cache[edge->uid].size = size + (size >= 0);
3548       hints |= simple_edge_hints (edge);
3549       edge_growth_cache[edge->uid].hints = hints + 1;
3550     }
3551   return time;
3552 }
3553
3554
3555 /* Return estimated callee growth after inlining EDGE.
3556    Only to be called via estimate_edge_size.  */
3557
3558 int
3559 do_estimate_edge_size (struct cgraph_edge *edge)
3560 {
3561   int size;
3562   struct cgraph_node *callee;
3563   clause_t clause;
3564   vec<tree> known_vals;
3565   vec<tree> known_binfos;
3566   vec<ipa_agg_jump_function_p> known_aggs;
3567
3568   /* When we do caching, use do_estimate_edge_time to populate the entry.  */
3569
3570   if (edge_growth_cache.exists ())
3571     {
3572       do_estimate_edge_time (edge);
3573       size = edge_growth_cache[edge->uid].size;
3574       gcc_checking_assert (size);
3575       return size - (size > 0);
3576     }
3577
3578   callee = cgraph_function_or_thunk_node (edge->callee, NULL);
3579
3580   /* Early inliner runs without caching, go ahead and do the dirty work.  */
3581   gcc_checking_assert (edge->inline_failed);
3582   evaluate_properties_for_edge (edge, true,
3583                                 &clause, &known_vals, &known_binfos,
3584                                 &known_aggs);
3585   estimate_node_size_and_time (callee, clause, known_vals, known_binfos,
3586                                known_aggs, &size, NULL, NULL, vNULL);
3587   known_vals.release ();
3588   known_binfos.release ();
3589   known_aggs.release ();
3590   return size;
3591 }
3592
3593
3594 /* Estimate the growth of the caller when inlining EDGE.
3595    Only to be called via estimate_edge_size.  */
3596
3597 inline_hints
3598 do_estimate_edge_hints (struct cgraph_edge *edge)
3599 {
3600   inline_hints hints;
3601   struct cgraph_node *callee;
3602   clause_t clause;
3603   vec<tree> known_vals;
3604   vec<tree> known_binfos;
3605   vec<ipa_agg_jump_function_p> known_aggs;
3606
3607   /* When we do caching, use do_estimate_edge_time to populate the entry.  */
3608
3609   if (edge_growth_cache.exists ())
3610     {
3611       do_estimate_edge_time (edge);
3612       hints = edge_growth_cache[edge->uid].hints;
3613       gcc_checking_assert (hints);
3614       return hints - 1;
3615     }
3616
3617   callee = cgraph_function_or_thunk_node (edge->callee, NULL);
3618
3619   /* Early inliner runs without caching, go ahead and do the dirty work.  */
3620   gcc_checking_assert (edge->inline_failed);
3621   evaluate_properties_for_edge (edge, true,
3622                                 &clause, &known_vals, &known_binfos,
3623                                 &known_aggs);
3624   estimate_node_size_and_time (callee, clause, known_vals, known_binfos,
3625                                known_aggs, NULL, NULL, &hints, vNULL);
3626   known_vals.release ();
3627   known_binfos.release ();
3628   known_aggs.release ();
3629   hints |= simple_edge_hints (edge);
3630   return hints;
3631 }
3632
3633
3634 /* Estimate self time of the function NODE after inlining EDGE.  */
3635
3636 int
3637 estimate_time_after_inlining (struct cgraph_node *node,
3638                               struct cgraph_edge *edge)
3639 {
3640   struct inline_edge_summary *es = inline_edge_summary (edge);
3641   if (!es->predicate || !false_predicate_p (es->predicate))
3642     {
3643       gcov_type time =
3644         inline_summary (node)->time + estimate_edge_time (edge);
3645       if (time < 0)
3646         time = 0;
3647       if (time > MAX_TIME)
3648         time = MAX_TIME;
3649       return time;
3650     }
3651   return inline_summary (node)->time;
3652 }
3653
3654
3655 /* Estimate the size of NODE after inlining EDGE which should be an
3656    edge to either NODE or a call inlined into NODE.  */
3657
3658 int
3659 estimate_size_after_inlining (struct cgraph_node *node,
3660                               struct cgraph_edge *edge)
3661 {
3662   struct inline_edge_summary *es = inline_edge_summary (edge);
3663   if (!es->predicate || !false_predicate_p (es->predicate))
3664     {
3665       int size = inline_summary (node)->size + estimate_edge_growth (edge);
3666       gcc_assert (size >= 0);
3667       return size;
3668     }
3669   return inline_summary (node)->size;
3670 }
3671
3672
3673 struct growth_data
3674 {
3675   struct cgraph_node *node;
3676   bool self_recursive;
3677   int growth;
3678 };
3679
3680
3681 /* Worker for do_estimate_growth.  Collect growth for all callers.  */
3682
3683 static bool
3684 do_estimate_growth_1 (struct cgraph_node *node, void *data)
3685 {
3686   struct cgraph_edge *e;
3687   struct growth_data *d = (struct growth_data *) data;
3688
3689   for (e = node->callers; e; e = e->next_caller)
3690     {
3691       gcc_checking_assert (e->inline_failed);
3692
3693       if (e->caller == d->node
3694           || (e->caller->global.inlined_to
3695               && e->caller->global.inlined_to == d->node))
3696         d->self_recursive = true;
3697       d->growth += estimate_edge_growth (e);
3698     }
3699   return false;
3700 }
3701
3702
3703 /* Estimate the growth caused by inlining NODE into all callees.  */
3704
3705 int
3706 do_estimate_growth (struct cgraph_node *node)
3707 {
3708   struct growth_data d = { node, 0, false };
3709   struct inline_summary *info = inline_summary (node);
3710
3711   cgraph_for_node_and_aliases (node, do_estimate_growth_1, &d, true);
3712
3713   /* For self recursive functions the growth estimation really should be
3714      infinity.  We don't want to return very large values because the growth
3715      plays various roles in badness computation fractions.  Be sure to not
3716      return zero or negative growths. */
3717   if (d.self_recursive)
3718     d.growth = d.growth < info->size ? info->size : d.growth;
3719   else if (DECL_EXTERNAL (node->symbol.decl))
3720     ;
3721   else
3722     {
3723       if (cgraph_will_be_removed_from_program_if_no_direct_calls (node))
3724         d.growth -= info->size;
3725       /* COMDAT functions are very often not shared across multiple units
3726          since they come from various template instantiations.
3727          Take this into account.  */
3728       else if (DECL_COMDAT (node->symbol.decl)
3729                && cgraph_can_remove_if_no_direct_calls_p (node))
3730         d.growth -= (info->size
3731                      * (100 - PARAM_VALUE (PARAM_COMDAT_SHARING_PROBABILITY))
3732                      + 50) / 100;
3733     }
3734
3735   if (node_growth_cache.exists ())
3736     {
3737       if ((int) node_growth_cache.length () <= node->uid)
3738         node_growth_cache.safe_grow_cleared (cgraph_max_uid);
3739       node_growth_cache[node->uid] = d.growth + (d.growth >= 0);
3740     }
3741   return d.growth;
3742 }
3743
3744
3745 /* This function performs intraprocedural analysis in NODE that is required to
3746    inline indirect calls.  */
3747
3748 static void
3749 inline_indirect_intraprocedural_analysis (struct cgraph_node *node)
3750 {
3751   ipa_analyze_node (node);
3752   if (dump_file && (dump_flags & TDF_DETAILS))
3753     {
3754       ipa_print_node_params (dump_file, node);
3755       ipa_print_node_jump_functions (dump_file, node);
3756     }
3757 }
3758
3759
3760 /* Note function body size.  */
3761
3762 static void
3763 inline_analyze_function (struct cgraph_node *node)
3764 {
3765   push_cfun (DECL_STRUCT_FUNCTION (node->symbol.decl));
3766
3767   if (dump_file)
3768     fprintf (dump_file, "\nAnalyzing function: %s/%u\n",
3769              cgraph_node_name (node), node->symbol.order);
3770   if (optimize && !node->thunk.thunk_p)
3771     inline_indirect_intraprocedural_analysis (node);
3772   compute_inline_parameters (node, false);
3773   if (!optimize)
3774     {
3775       struct cgraph_edge *e;
3776       for (e = node->callees; e; e = e->next_callee)
3777         {
3778           if (e->inline_failed == CIF_FUNCTION_NOT_CONSIDERED)
3779             e->inline_failed = CIF_FUNCTION_NOT_OPTIMIZED;
3780           e->call_stmt_cannot_inline_p = true;
3781         }
3782       for (e = node->indirect_calls; e; e = e->next_callee)
3783         {
3784           if (e->inline_failed == CIF_FUNCTION_NOT_CONSIDERED)
3785             e->inline_failed = CIF_FUNCTION_NOT_OPTIMIZED;
3786           e->call_stmt_cannot_inline_p = true;
3787         }
3788     }
3789
3790   pop_cfun ();
3791 }
3792
3793
3794 /* Called when new function is inserted to callgraph late.  */
3795
3796 static void
3797 add_new_function (struct cgraph_node *node, void *data ATTRIBUTE_UNUSED)
3798 {
3799   inline_analyze_function (node);
3800 }
3801
3802
3803 /* Note function body size.  */
3804
3805 void
3806 inline_generate_summary (void)
3807 {
3808   struct cgraph_node *node;
3809
3810   /* When not optimizing, do not bother to analyze.  Inlining is still done
3811      because edge redirection needs to happen there.  */
3812   if (!optimize && !flag_lto && !flag_wpa)
3813     return;
3814
3815   function_insertion_hook_holder =
3816     cgraph_add_function_insertion_hook (&add_new_function, NULL);
3817
3818   ipa_register_cgraph_hooks ();
3819   inline_free_summary ();
3820
3821   FOR_EACH_DEFINED_FUNCTION (node)
3822     if (!node->symbol.alias)
3823       inline_analyze_function (node);
3824 }
3825
3826
3827 /* Read predicate from IB.  */
3828
3829 static struct predicate
3830 read_predicate (struct lto_input_block *ib)
3831 {
3832   struct predicate out;
3833   clause_t clause;
3834   int k = 0;
3835
3836   do
3837     {
3838       gcc_assert (k <= MAX_CLAUSES);
3839       clause = out.clause[k++] = streamer_read_uhwi (ib);
3840     }
3841   while (clause);
3842
3843   /* Zero-initialize the remaining clauses in OUT.  */
3844   while (k <= MAX_CLAUSES)
3845     out.clause[k++] = 0;
3846
3847   return out;
3848 }
3849
3850
3851 /* Write inline summary for edge E to OB.  */
3852
3853 static void
3854 read_inline_edge_summary (struct lto_input_block *ib, struct cgraph_edge *e)
3855 {
3856   struct inline_edge_summary *es = inline_edge_summary (e);
3857   struct predicate p;
3858   int length, i;
3859
3860   es->call_stmt_size = streamer_read_uhwi (ib);
3861   es->call_stmt_time = streamer_read_uhwi (ib);
3862   es->loop_depth = streamer_read_uhwi (ib);
3863   p = read_predicate (ib);
3864   edge_set_predicate (e, &p);
3865   length = streamer_read_uhwi (ib);
3866   if (length)
3867     {
3868       es->param.safe_grow_cleared (length);
3869       for (i = 0; i < length; i++)
3870         es->param[i].change_prob = streamer_read_uhwi (ib);
3871     }
3872 }
3873
3874
3875 /* Stream in inline summaries from the section.  */
3876
3877 static void
3878 inline_read_section (struct lto_file_decl_data *file_data, const char *data,
3879                      size_t len)
3880 {
3881   const struct lto_function_header *header =
3882     (const struct lto_function_header *) data;
3883   const int cfg_offset = sizeof (struct lto_function_header);
3884   const int main_offset = cfg_offset + header->cfg_size;
3885   const int string_offset = main_offset + header->main_size;
3886   struct data_in *data_in;
3887   struct lto_input_block ib;
3888   unsigned int i, count2, j;
3889   unsigned int f_count;
3890
3891   LTO_INIT_INPUT_BLOCK (ib, (const char *) data + main_offset, 0,
3892                         header->main_size);
3893
3894   data_in =
3895     lto_data_in_create (file_data, (const char *) data + string_offset,
3896                         header->string_size, vNULL);
3897   f_count = streamer_read_uhwi (&ib);
3898   for (i = 0; i < f_count; i++)
3899     {
3900       unsigned int index;
3901       struct cgraph_node *node;
3902       struct inline_summary *info;
3903       lto_symtab_encoder_t encoder;
3904       struct bitpack_d bp;
3905       struct cgraph_edge *e;
3906       predicate p;
3907
3908       index = streamer_read_uhwi (&ib);
3909       encoder = file_data->symtab_node_encoder;
3910       node = cgraph (lto_symtab_encoder_deref (encoder, index));
3911       info = inline_summary (node);
3912
3913       info->estimated_stack_size
3914         = info->estimated_self_stack_size = streamer_read_uhwi (&ib);
3915       info->size = info->self_size = streamer_read_uhwi (&ib);
3916       info->time = info->self_time = streamer_read_uhwi (&ib);
3917
3918       bp = streamer_read_bitpack (&ib);
3919       info->inlinable = bp_unpack_value (&bp, 1);
3920
3921       count2 = streamer_read_uhwi (&ib);
3922       gcc_assert (!info->conds);
3923       for (j = 0; j < count2; j++)
3924         {
3925           struct condition c;
3926           c.operand_num = streamer_read_uhwi (&ib);
3927           c.code = (enum tree_code) streamer_read_uhwi (&ib);
3928           c.val = stream_read_tree (&ib, data_in);
3929           bp = streamer_read_bitpack (&ib);
3930           c.agg_contents = bp_unpack_value (&bp, 1);
3931           c.by_ref = bp_unpack_value (&bp, 1);
3932           if (c.agg_contents)
3933             c.offset = streamer_read_uhwi (&ib);
3934           vec_safe_push (info->conds, c);
3935         }
3936       count2 = streamer_read_uhwi (&ib);
3937       gcc_assert (!info->entry);
3938       for (j = 0; j < count2; j++)
3939         {
3940           struct size_time_entry e;
3941
3942           e.size = streamer_read_uhwi (&ib);
3943           e.time = streamer_read_uhwi (&ib);
3944           e.predicate = read_predicate (&ib);
3945
3946           vec_safe_push (info->entry, e);
3947         }
3948
3949       p = read_predicate (&ib);
3950       set_hint_predicate (&info->loop_iterations, p);
3951       p = read_predicate (&ib);
3952       set_hint_predicate (&info->loop_stride, p);
3953       p = read_predicate (&ib);
3954       set_hint_predicate (&info->array_index, p);
3955       for (e = node->callees; e; e = e->next_callee)
3956         read_inline_edge_summary (&ib, e);
3957       for (e = node->indirect_calls; e; e = e->next_callee)
3958         read_inline_edge_summary (&ib, e);
3959     }
3960
3961   lto_free_section_data (file_data, LTO_section_inline_summary, NULL, data,
3962                          len);
3963   lto_data_in_delete (data_in);
3964 }
3965
3966
3967 /* Read inline summary.  Jump functions are shared among ipa-cp
3968    and inliner, so when ipa-cp is active, we don't need to write them
3969    twice.  */
3970
3971 void
3972 inline_read_summary (void)
3973 {
3974   struct lto_file_decl_data **file_data_vec = lto_get_file_decl_data ();
3975   struct lto_file_decl_data *file_data;
3976   unsigned int j = 0;
3977
3978   inline_summary_alloc ();
3979
3980   while ((file_data = file_data_vec[j++]))
3981     {
3982       size_t len;
3983       const char *data = lto_get_section_data (file_data,
3984                                                LTO_section_inline_summary,
3985                                                NULL, &len);
3986       if (data)
3987         inline_read_section (file_data, data, len);
3988       else
3989         /* Fatal error here.  We do not want to support compiling ltrans units
3990            with different version of compiler or different flags than the WPA
3991            unit, so this should never happen.  */
3992         fatal_error ("ipa inline summary is missing in input file");
3993     }
3994   if (optimize)
3995     {
3996       ipa_register_cgraph_hooks ();
3997       if (!flag_ipa_cp)
3998         ipa_prop_read_jump_functions ();
3999     }
4000   function_insertion_hook_holder =
4001     cgraph_add_function_insertion_hook (&add_new_function, NULL);
4002 }
4003
4004
4005 /* Write predicate P to OB.  */
4006
4007 static void
4008 write_predicate (struct output_block *ob, struct predicate *p)
4009 {
4010   int j;
4011   if (p)
4012     for (j = 0; p->clause[j]; j++)
4013       {
4014         gcc_assert (j < MAX_CLAUSES);
4015         streamer_write_uhwi (ob, p->clause[j]);
4016       }
4017   streamer_write_uhwi (ob, 0);
4018 }
4019
4020
4021 /* Write inline summary for edge E to OB.  */
4022
4023 static void
4024 write_inline_edge_summary (struct output_block *ob, struct cgraph_edge *e)
4025 {
4026   struct inline_edge_summary *es = inline_edge_summary (e);
4027   int i;
4028
4029   streamer_write_uhwi (ob, es->call_stmt_size);
4030   streamer_write_uhwi (ob, es->call_stmt_time);
4031   streamer_write_uhwi (ob, es->loop_depth);
4032   write_predicate (ob, es->predicate);
4033   streamer_write_uhwi (ob, es->param.length ());
4034   for (i = 0; i < (int) es->param.length (); i++)
4035     streamer_write_uhwi (ob, es->param[i].change_prob);
4036 }
4037
4038
4039 /* Write inline summary for node in SET.
4040    Jump functions are shared among ipa-cp and inliner, so when ipa-cp is
4041    active, we don't need to write them twice.  */
4042
4043 void
4044 inline_write_summary (void)
4045 {
4046   struct cgraph_node *node;
4047   struct output_block *ob = create_output_block (LTO_section_inline_summary);
4048   lto_symtab_encoder_t encoder = ob->decl_state->symtab_node_encoder;
4049   unsigned int count = 0;
4050   int i;
4051
4052   for (i = 0; i < lto_symtab_encoder_size (encoder); i++)
4053     {
4054       symtab_node snode = lto_symtab_encoder_deref (encoder, i);
4055       cgraph_node *cnode = dyn_cast <cgraph_node> (snode);
4056       if (cnode && cnode->symbol.definition && !cnode->symbol.alias)
4057         count++;
4058     }
4059   streamer_write_uhwi (ob, count);
4060
4061   for (i = 0; i < lto_symtab_encoder_size (encoder); i++)
4062     {
4063       symtab_node snode = lto_symtab_encoder_deref (encoder, i);
4064       cgraph_node *cnode = dyn_cast <cgraph_node> (snode);
4065       if (cnode && (node = cnode)->symbol.definition && !node->symbol.alias)
4066         {
4067           struct inline_summary *info = inline_summary (node);
4068           struct bitpack_d bp;
4069           struct cgraph_edge *edge;
4070           int i;
4071           size_time_entry *e;
4072           struct condition *c;
4073
4074           streamer_write_uhwi (ob,
4075                                lto_symtab_encoder_encode (encoder,
4076                                                           (symtab_node)
4077                                                           node));
4078           streamer_write_hwi (ob, info->estimated_self_stack_size);
4079           streamer_write_hwi (ob, info->self_size);
4080           streamer_write_hwi (ob, info->self_time);
4081           bp = bitpack_create (ob->main_stream);
4082           bp_pack_value (&bp, info->inlinable, 1);
4083           streamer_write_bitpack (&bp);
4084           streamer_write_uhwi (ob, vec_safe_length (info->conds));
4085           for (i = 0; vec_safe_iterate (info->conds, i, &c); i++)
4086             {
4087               streamer_write_uhwi (ob, c->operand_num);
4088               streamer_write_uhwi (ob, c->code);
4089               stream_write_tree (ob, c->val, true);
4090               bp = bitpack_create (ob->main_stream);
4091               bp_pack_value (&bp, c->agg_contents, 1);
4092               bp_pack_value (&bp, c->by_ref, 1);
4093               streamer_write_bitpack (&bp);
4094               if (c->agg_contents)
4095                 streamer_write_uhwi (ob, c->offset);
4096             }
4097           streamer_write_uhwi (ob, vec_safe_length (info->entry));
4098           for (i = 0; vec_safe_iterate (info->entry, i, &e); i++)
4099             {
4100               streamer_write_uhwi (ob, e->size);
4101               streamer_write_uhwi (ob, e->time);
4102               write_predicate (ob, &e->predicate);
4103             }
4104           write_predicate (ob, info->loop_iterations);
4105           write_predicate (ob, info->loop_stride);
4106           write_predicate (ob, info->array_index);
4107           for (edge = node->callees; edge; edge = edge->next_callee)
4108             write_inline_edge_summary (ob, edge);
4109           for (edge = node->indirect_calls; edge; edge = edge->next_callee)
4110             write_inline_edge_summary (ob, edge);
4111         }
4112     }
4113   streamer_write_char_stream (ob->main_stream, 0);
4114   produce_asm (ob, NULL);
4115   destroy_output_block (ob);
4116
4117   if (optimize && !flag_ipa_cp)
4118     ipa_prop_write_jump_functions ();
4119 }
4120
4121
4122 /* Release inline summary.  */
4123
4124 void
4125 inline_free_summary (void)
4126 {
4127   struct cgraph_node *node;
4128   if (!inline_edge_summary_vec.exists ())
4129     return;
4130   FOR_EACH_DEFINED_FUNCTION (node)
4131     reset_inline_summary (node);
4132   if (function_insertion_hook_holder)
4133     cgraph_remove_function_insertion_hook (function_insertion_hook_holder);
4134   function_insertion_hook_holder = NULL;
4135   if (node_removal_hook_holder)
4136     cgraph_remove_node_removal_hook (node_removal_hook_holder);
4137   node_removal_hook_holder = NULL;
4138   if (edge_removal_hook_holder)
4139     cgraph_remove_edge_removal_hook (edge_removal_hook_holder);
4140   edge_removal_hook_holder = NULL;
4141   if (node_duplication_hook_holder)
4142     cgraph_remove_node_duplication_hook (node_duplication_hook_holder);
4143   node_duplication_hook_holder = NULL;
4144   if (edge_duplication_hook_holder)
4145     cgraph_remove_edge_duplication_hook (edge_duplication_hook_holder);
4146   edge_duplication_hook_holder = NULL;
4147   vec_free (inline_summary_vec);
4148   inline_edge_summary_vec.release ();
4149   if (edge_predicate_pool)
4150     free_alloc_pool (edge_predicate_pool);
4151   edge_predicate_pool = 0;
4152 }