gcc/ipa-fnsummary.c

   1 /* Function summary pass.
   2    Copyright (C) 2003-2019 Free Software Foundation, Inc.
   3    Contributed by Jan Hubicka
   4
   5 This file is part of GCC.
   6
   7 GCC is free software; you can redistribute it and/or modify it under
   8 the terms of the GNU General Public License as published by the Free
   9 Software Foundation; either version 3, or (at your option) any later
  10 version.
  11
  12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  14 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  15 for more details.
  16
  17 You should have received a copy of the GNU General Public License
  18 along with GCC; see the file COPYING3.  If not see
  19 <http://www.gnu.org/licenses/>.  */
  20
  21 /* Analysis of function bodies used by inter-procedural passes
  22
  23    We estimate for each function
  24      - function body size and size after specializing into given context
  25      - average function execution time in a given context
  26      - function frame size
  27    For each call
  28      - call statement size, time and how often the parameters change
  29
  30    ipa_fn_summary data structures store above information locally (i.e.
  31    parameters of the function itself) and globally (i.e. parameters of
  32    the function created by applying all the inline decisions already
  33    present in the callgraph).
  34
  35    We provide access to the ipa_fn_summary data structure and
  36    basic logic updating the parameters when inlining is performed.
  37
  38    The summaries are context sensitive.  Context means
  39      1) partial assignment of known constant values of operands
  40      2) whether function is inlined into the call or not.
  41    It is easy to add more variants.  To represent function size and time
  42    that depends on context (i.e. it is known to be optimized away when
  43    context is known either by inlining or from IP-CP and cloning),
  44    we use predicates.
  45
  46    estimate_edge_size_and_time can be used to query
  47    function size/time in the given context.  ipa_merge_fn_summary_after_inlining merges
  48    properties of caller and callee after inlining.
  49
  50    Finally pass_inline_parameters is exported.  This is used to drive
  51    computation of function parameters used by the early inliner. IPA
  52    inlined performs analysis via its analyze_function method. */
  53
  54 #include "config.h"
  55 #include "system.h"
  56 #include "coretypes.h"
  57 #include "backend.h"
  58 #include "tree.h"
  59 #include "gimple.h"
  60 #include "alloc-pool.h"
  61 #include "tree-pass.h"
  62 #include "ssa.h"
  63 #include "tree-streamer.h"
  64 #include "cgraph.h"
  65 #include "diagnostic.h"
  66 #include "fold-const.h"
  67 #include "print-tree.h"
  68 #include "tree-inline.h"
  69 #include "gimple-pretty-print.h"
  70 #include "cfganal.h"
  71 #include "gimple-iterator.h"
  72 #include "tree-cfg.h"
  73 #include "tree-ssa-loop-niter.h"
  74 #include "tree-ssa-loop.h"
  75 #include "symbol-summary.h"
  76 #include "ipa-prop.h"
  77 #include "ipa-fnsummary.h"
  78 #include "cfgloop.h"
  79 #include "tree-scalar-evolution.h"
  80 #include "ipa-utils.h"
  81 #include "cfgexpand.h"
  82 #include "gimplify.h"
  83 #include "stringpool.h"
  84 #include "attribs.h"
  85
  86 /* Summaries.  */
  87 fast_function_summary <ipa_fn_summary *, va_gc> *ipa_fn_summaries;
  88 fast_function_summary <ipa_size_summary *, va_heap> *ipa_size_summaries;
  89 fast_call_summary <ipa_call_summary *, va_heap> *ipa_call_summaries;
  90
  91 /* Edge predicates goes here.  */
  92 static object_allocator<predicate> edge_predicate_pool ("edge predicates");
  93
  94
  95 /* Dump IPA hints.  */
  96 void
  97 ipa_dump_hints (FILE *f, ipa_hints hints)
  98 {
  99   if (!hints)
 100     return;
 101   fprintf (f, "IPA hints:");
 102   if (hints & INLINE_HINT_indirect_call)
 103     {
 104       hints &= ~INLINE_HINT_indirect_call;
 105       fprintf (f, " indirect_call");
 106     }
 107   if (hints & INLINE_HINT_loop_iterations)
 108     {
 109       hints &= ~INLINE_HINT_loop_iterations;
 110       fprintf (f, " loop_iterations");
 111     }
 112   if (hints & INLINE_HINT_loop_stride)
 113     {
 114       hints &= ~INLINE_HINT_loop_stride;
 115       fprintf (f, " loop_stride");
 116     }
 117   if (hints & INLINE_HINT_same_scc)
 118     {
 119       hints &= ~INLINE_HINT_same_scc;
 120       fprintf (f, " same_scc");
 121     }
 122   if (hints & INLINE_HINT_in_scc)
 123     {
 124       hints &= ~INLINE_HINT_in_scc;
 125       fprintf (f, " in_scc");
 126     }
 127   if (hints & INLINE_HINT_cross_module)
 128     {
 129       hints &= ~INLINE_HINT_cross_module;
 130       fprintf (f, " cross_module");
 131     }
 132   if (hints & INLINE_HINT_declared_inline)
 133     {
 134       hints &= ~INLINE_HINT_declared_inline;
 135       fprintf (f, " declared_inline");
 136     }
 137   if (hints & INLINE_HINT_known_hot)
 138     {
 139       hints &= ~INLINE_HINT_known_hot;
 140       fprintf (f, " known_hot");
 141     }
 142   gcc_assert (!hints);
 143 }
 144
 145
 146 /* Record SIZE and TIME to SUMMARY.
 147    The accounted code will be executed when EXEC_PRED is true.
 148    When NONCONST_PRED is false the code will evaulate to constant and
 149    will get optimized out in specialized clones of the function.   */
 150
 151 void
 152 ipa_fn_summary::account_size_time (int size, sreal time,
 153                                    const predicate &exec_pred,
 154                                    const predicate &nonconst_pred_in)
 155 {
 156   size_time_entry *e;
 157   bool found = false;
 158   int i;
 159   predicate nonconst_pred;
 160
 161   if (exec_pred == false)
 162     return;
 163
 164   nonconst_pred = nonconst_pred_in & exec_pred;
 165
 166   if (nonconst_pred == false)
 167     return;
 168
 169   /* We need to create initial empty unconitional clause, but otherwie
 170      we don't need to account empty times and sizes.  */
 171   if (!size && time == 0 && size_time_table)
 172     return;
 173
 174   gcc_assert (time >= 0);
 175
 176   for (i = 0; vec_safe_iterate (size_time_table, i, &e); i++)
 177     if (e->exec_predicate == exec_pred
 178         && e->nonconst_predicate == nonconst_pred)
 179       {
 180         found = true;
 181         break;
 182       }
 183   if (i == 256)
 184     {
 185       i = 0;
 186       found = true;
 187       e = &(*size_time_table)[0];
 188       if (dump_file && (dump_flags & TDF_DETAILS))
 189         fprintf (dump_file,
 190                  "\t\tReached limit on number of entries, "
 191                  "ignoring the predicate.");
 192     }
 193   if (dump_file && (dump_flags & TDF_DETAILS) && (time != 0 || size))
 194     {
 195       fprintf (dump_file,
 196                "\t\tAccounting size:%3.2f, time:%3.2f on %spredicate exec:",
 197                ((double) size) / ipa_fn_summary::size_scale,
 198                (time.to_double ()), found ? "" : "new ");
 199       exec_pred.dump (dump_file, conds, 0);
 200       if (exec_pred != nonconst_pred)
 201         {
 202           fprintf (dump_file, " nonconst:");
 203           nonconst_pred.dump (dump_file, conds);
 204         }
 205       else
 206         fprintf (dump_file, "\n");
 207     }
 208   if (!found)
 209     {
 210       class size_time_entry new_entry;
 211       new_entry.size = size;
 212       new_entry.time = time;
 213       new_entry.exec_predicate = exec_pred;
 214       new_entry.nonconst_predicate = nonconst_pred;
 215       vec_safe_push (size_time_table, new_entry);
 216     }
 217   else
 218     {
 219       e->size += size;
 220       e->time += time;
 221     }
 222 }
 223
 224 /* We proved E to be unreachable, redirect it to __bultin_unreachable.  */
 225
 226 static struct cgraph_edge *
 227 redirect_to_unreachable (struct cgraph_edge *e)
 228 {
 229   struct cgraph_node *callee = !e->inline_failed ? e->callee : NULL;
 230   struct cgraph_node *target = cgraph_node::get_create
 231                       (builtin_decl_implicit (BUILT_IN_UNREACHABLE));
 232
 233   if (e->speculative)
 234     e = e->resolve_speculation (target->decl);
 235   else if (!e->callee)
 236     e->make_direct (target);
 237   else
 238     e->redirect_callee (target);
 239   class ipa_call_summary *es = ipa_call_summaries->get (e);
 240   e->inline_failed = CIF_UNREACHABLE;
 241   e->count = profile_count::zero ();
 242   es->call_stmt_size = 0;
 243   es->call_stmt_time = 0;
 244   if (callee)
 245     callee->remove_symbol_and_inline_clones ();
 246   return e;
 247 }
 248
 249 /* Set predicate for edge E.  */
 250
 251 static void
 252 edge_set_predicate (struct cgraph_edge *e, predicate *predicate)
 253 {
 254   /* If the edge is determined to be never executed, redirect it
 255      to BUILTIN_UNREACHABLE to make it clear to IPA passes the call will
 256      be optimized out.  */
 257   if (predicate && *predicate == false
 258       /* When handling speculative edges, we need to do the redirection
 259          just once.  Do it always on the direct edge, so we do not
 260          attempt to resolve speculation while duplicating the edge.  */
 261       && (!e->speculative || e->callee))
 262     e = redirect_to_unreachable (e);
 263
 264   class ipa_call_summary *es = ipa_call_summaries->get (e);
 265   if (predicate && *predicate != true)
 266     {
 267       if (!es->predicate)
 268         es->predicate = edge_predicate_pool.allocate ();
 269       *es->predicate = *predicate;
 270     }
 271   else
 272     {
 273       if (es->predicate)
 274         edge_predicate_pool.remove (es->predicate);
 275       es->predicate = NULL;
 276     }
 277 }
 278
 279 /* Set predicate for hint *P.  */
 280
 281 static void
 282 set_hint_predicate (predicate **p, predicate new_predicate)
 283 {
 284   if (new_predicate == false || new_predicate == true)
 285     {
 286       if (*p)
 287         edge_predicate_pool.remove (*p);
 288       *p = NULL;
 289     }
 290   else
 291     {
 292       if (!*p)
 293         *p = edge_predicate_pool.allocate ();
 294       **p = new_predicate;
 295     }
 296 }
 297
 298
 299 /* Compute what conditions may or may not hold given invormation about
 300    parameters.  RET_CLAUSE returns truths that may hold in a specialized copy,
 301    whie RET_NONSPEC_CLAUSE returns truths that may hold in an nonspecialized
 302    copy when called in a given context.  It is a bitmask of conditions. Bit
 303    0 means that condition is known to be false, while bit 1 means that condition
 304    may or may not be true.  These differs - for example NOT_INLINED condition
 305    is always false in the second and also builtin_constant_p tests cannot use
 306    the fact that parameter is indeed a constant.
 307
 308    KNOWN_VALS is partial mapping of parameters of NODE to constant values.
 309    KNOWN_AGGS is a vector of aggreggate known offset/value set for each
 310    parameter.  Return clause of possible truths.  When INLINE_P is true, assume
 311    that we are inlining.
 312
 313    ERROR_MARK means compile time invariant.  */
 314
 315 static void
 316 evaluate_conditions_for_known_args (struct cgraph_node *node,
 317                                     bool inline_p,
 318                                     vec<tree> known_vals,
 319                                     vec<value_range> known_value_ranges,
 320                                     vec<ipa_agg_value_set> known_aggs,
 321                                     clause_t *ret_clause,
 322                                     clause_t *ret_nonspec_clause)
 323 {
 324   clause_t clause = inline_p ? 0 : 1 << predicate::not_inlined_condition;
 325   clause_t nonspec_clause = 1 << predicate::not_inlined_condition;
 326   class ipa_fn_summary *info = ipa_fn_summaries->get (node);
 327   int i;
 328   struct condition *c;
 329
 330   for (i = 0; vec_safe_iterate (info->conds, i, &c); i++)
 331     {
 332       tree val;
 333       tree res;
 334       int j;
 335       struct expr_eval_op *op;
 336
 337       /* We allow call stmt to have fewer arguments than the callee function
 338          (especially for K&R style programs).  So bound check here (we assume
 339          known_aggs vector, if non-NULL, has the same length as
 340          known_vals).  */
 341       gcc_checking_assert (!known_aggs.exists ()
 342                            || (known_vals.length () == known_aggs.length ()));
 343       if (c->operand_num >= (int) known_vals.length ())
 344         {
 345           clause |= 1 << (i + predicate::first_dynamic_condition);
 346           nonspec_clause |= 1 << (i + predicate::first_dynamic_condition);
 347           continue;
 348         }
 349
 350       if (c->agg_contents)
 351         {
 352           struct ipa_agg_value_set *agg;
 353
 354           if (c->code == predicate::changed
 355               && !c->by_ref
 356               && (known_vals[c->operand_num] == error_mark_node))
 357             continue;
 358
 359           if (known_aggs.exists ())
 360             {
 361               agg = &known_aggs[c->operand_num];
 362               val = ipa_find_agg_cst_for_param (agg, known_vals[c->operand_num],
 363                                                 c->offset, c->by_ref);
 364             }
 365           else
 366             val = NULL_TREE;
 367         }
 368       else
 369         {
 370           val = known_vals[c->operand_num];
 371           if (val == error_mark_node && c->code != predicate::changed)
 372             val = NULL_TREE;
 373         }
 374
 375       if (!val
 376           && (c->code == predicate::changed
 377               || c->code == predicate::is_not_constant))
 378         {
 379           clause |= 1 << (i + predicate::first_dynamic_condition);
 380           nonspec_clause |= 1 << (i + predicate::first_dynamic_condition);
 381           continue;
 382         }
 383       if (c->code == predicate::changed)
 384         {
 385           nonspec_clause |= 1 << (i + predicate::first_dynamic_condition);
 386           continue;
 387         }
 388
 389       if (c->code == predicate::is_not_constant)
 390         {
 391           nonspec_clause |= 1 << (i + predicate::first_dynamic_condition);
 392           continue;
 393         }
 394
 395       if (val && TYPE_SIZE (c->type) == TYPE_SIZE (TREE_TYPE (val)))
 396         {
 397           if (c->type != TREE_TYPE (val))
 398             val = fold_unary (VIEW_CONVERT_EXPR, c->type, val);
 399           for (j = 0; vec_safe_iterate (c->param_ops, j, &op); j++)
 400             {
 401               if (!val)
 402                 break;
 403               if (!op->val[0])
 404                 val = fold_unary (op->code, op->type, val);
 405               else if (!op->val[1])
 406                 val = fold_binary (op->code, op->type,
 407                                    op->index ? op->val[0] : val,
 408                                    op->index ? val : op->val[0]);
 409               else if (op->index == 0)
 410                 val = fold_ternary (op->code, op->type,
 411                                     val, op->val[0], op->val[1]);
 412               else if (op->index == 1)
 413                 val = fold_ternary (op->code, op->type,
 414                                     op->val[0], val, op->val[1]);
 415               else if (op->index == 2)
 416                 val = fold_ternary (op->code, op->type,
 417                                     op->val[0], op->val[1], val);
 418               else
 419                 val = NULL_TREE;
 420             }
 421
 422           res = val
 423             ? fold_binary_to_constant (c->code, boolean_type_node, val, c->val)
 424             : NULL;
 425
 426           if (res && integer_zerop (res))
 427             continue;
 428           if (res && integer_onep (res))
 429             {
 430               clause |= 1 << (i + predicate::first_dynamic_condition);
 431               nonspec_clause |= 1 << (i + predicate::first_dynamic_condition);
 432               continue;
 433             }
 434         }
 435       if (c->operand_num < (int) known_value_ranges.length ()
 436           && !c->agg_contents
 437           && !known_value_ranges[c->operand_num].undefined_p ()
 438           && !known_value_ranges[c->operand_num].varying_p ()
 439           && TYPE_SIZE (c->type)
 440                  == TYPE_SIZE (known_value_ranges[c->operand_num].type ())
 441           && (!val || TREE_CODE (val) != INTEGER_CST))
 442         {
 443           value_range vr = known_value_ranges[c->operand_num];
 444           if (!useless_type_conversion_p (c->type, vr.type ()))
 445             {
 446               value_range res;
 447               range_fold_unary_expr (&res, NOP_EXPR,
 448                                      c->type, &vr, vr.type ());
 449               vr = res;
 450             }
 451           tree type = c->type;
 452
 453           for (j = 0; vec_safe_iterate (c->param_ops, j, &op); j++)
 454             {
 455               if (vr.varying_p () || vr.undefined_p ())
 456                 break;
 457
 458               value_range res;
 459               if (!op->val[0])
 460                 range_fold_unary_expr (&res, op->code, op->type, &vr, type);
 461               else if (!op->val[1])
 462                 {
 463                   value_range op0 (op->val[0], op->val[0]);
 464                   range_fold_binary_expr (&res, op->code, op->type,
 465                                           op->index ? &op0 : &vr,
 466                                           op->index ? &vr : &op0);
 467                 }
 468               else
 469                 gcc_unreachable ();
 470               type = op->type;
 471               vr = res;
 472             }
 473           if (!vr.varying_p () && !vr.undefined_p ())
 474             {
 475               value_range res;
 476               value_range val_vr (c->val, c->val);
 477               range_fold_binary_expr (&res, c->code, boolean_type_node,
 478                                       &vr,
 479                                       &val_vr);
 480               if (res.zero_p ())
 481                 continue;
 482             }
 483         }
 484
 485       clause |= 1 << (i + predicate::first_dynamic_condition);
 486       nonspec_clause |= 1 << (i + predicate::first_dynamic_condition);
 487     }
 488   *ret_clause = clause;
 489   if (ret_nonspec_clause)
 490     *ret_nonspec_clause = nonspec_clause;
 491 }
 492
 493
 494 /* Work out what conditions might be true at invocation of E.  */
 495
 496 void
 497 evaluate_properties_for_edge (struct cgraph_edge *e, bool inline_p,
 498                               clause_t *clause_ptr,
 499                               clause_t *nonspec_clause_ptr,
 500                               vec<tree> *known_vals_ptr,
 501                               vec<ipa_polymorphic_call_context>
 502                               *known_contexts_ptr,
 503                               vec<ipa_agg_value_set> *known_aggs_ptr)
 504 {
 505   struct cgraph_node *callee = e->callee->ultimate_alias_target ();
 506   class ipa_fn_summary *info = ipa_fn_summaries->get (callee);
 507   vec<tree> known_vals = vNULL;
 508   auto_vec<value_range, 32> known_value_ranges;
 509   vec<ipa_agg_value_set> known_aggs = vNULL;
 510   class ipa_edge_args *args;
 511
 512   if (clause_ptr)
 513     *clause_ptr = inline_p ? 0 : 1 << predicate::not_inlined_condition;
 514   if (known_vals_ptr)
 515     known_vals_ptr->create (0);
 516   if (known_contexts_ptr)
 517     known_contexts_ptr->create (0);
 518
 519   if (ipa_node_params_sum
 520       && !e->call_stmt_cannot_inline_p
 521       && ((clause_ptr && info->conds) || known_vals_ptr || known_contexts_ptr)
 522       && (args = IPA_EDGE_REF (e)) != NULL)
 523     {
 524       struct cgraph_node *caller;
 525       class ipa_node_params *caller_parms_info, *callee_pi;
 526       class ipa_call_summary *es = ipa_call_summaries->get (e);
 527       int i, count = ipa_get_cs_argument_count (args);
 528
 529       if (e->caller->inlined_to)
 530         caller = e->caller->inlined_to;
 531       else
 532         caller = e->caller;
 533       caller_parms_info = IPA_NODE_REF (caller);
 534       callee_pi = IPA_NODE_REF (callee);
 535
 536       if (count && (info->conds || known_vals_ptr))
 537         known_vals.safe_grow_cleared (count);
 538       if (count && info->conds)
 539         known_value_ranges.safe_grow_cleared (count);
 540       if (count && (info->conds || known_aggs_ptr))
 541         known_aggs.safe_grow_cleared (count);
 542       if (count && known_contexts_ptr)
 543         known_contexts_ptr->safe_grow_cleared (count);
 544
 545       if (callee_pi)
 546         for (i = 0; i < count; i++)
 547           {
 548             struct ipa_jump_func *jf = ipa_get_ith_jump_func (args, i);
 549             tree cst = ipa_value_from_jfunc (caller_parms_info, jf,
 550                                              ipa_get_type (callee_pi, i));
 551
 552             if (!cst && e->call_stmt
 553                 && i < (int)gimple_call_num_args (e->call_stmt))
 554               {
 555                 cst = gimple_call_arg (e->call_stmt, i);
 556                 if (!is_gimple_min_invariant (cst))
 557                   cst = NULL;
 558               }
 559             if (cst)
 560               {
 561                 gcc_checking_assert (TREE_CODE (cst) != TREE_BINFO);
 562                 if (known_vals.exists ())
 563                   known_vals[i] = cst;
 564               }
 565             else if (inline_p && !es->param[i].change_prob)
 566               known_vals[i] = error_mark_node;
 567
 568             if (known_contexts_ptr)
 569               (*known_contexts_ptr)[i]
 570                 = ipa_context_from_jfunc (caller_parms_info, e, i, jf);
 571
 572             known_aggs[i] = ipa_agg_value_set_from_jfunc (caller_parms_info,
 573                                                           caller, &jf->agg);
 574             if (info->conds)
 575               known_value_ranges[i]
 576                 = ipa_value_range_from_jfunc (caller_parms_info, e, jf,
 577                                               ipa_get_type (callee_pi, i));
 578           }
 579         else
 580           gcc_assert (callee->thunk.thunk_p);
 581     }
 582   else if (e->call_stmt && !e->call_stmt_cannot_inline_p
 583            && ((clause_ptr && info->conds) || known_vals_ptr))
 584     {
 585       int i, count = (int)gimple_call_num_args (e->call_stmt);
 586
 587       if (count && (info->conds || known_vals_ptr))
 588         known_vals.safe_grow_cleared (count);
 589       for (i = 0; i < count; i++)
 590         {
 591           tree cst = gimple_call_arg (e->call_stmt, i);
 592           if (!is_gimple_min_invariant (cst))
 593             cst = NULL;
 594           if (cst)
 595             known_vals[i] = cst;
 596         }
 597     }
 598
 599   evaluate_conditions_for_known_args (callee, inline_p,
 600                                       known_vals,
 601                                       known_value_ranges,
 602                                       known_aggs, clause_ptr,
 603                                       nonspec_clause_ptr);
 604
 605   if (known_vals_ptr)
 606     *known_vals_ptr = known_vals;
 607   else
 608     known_vals.release ();
 609
 610   if (known_aggs_ptr)
 611     *known_aggs_ptr = known_aggs;
 612   else
 613     ipa_release_agg_values (known_aggs);
 614 }
 615
 616
 617 /* Allocate the function summary. */
 618
 619 static void
 620 ipa_fn_summary_alloc (void)
 621 {
 622   gcc_checking_assert (!ipa_fn_summaries);
 623   ipa_size_summaries = new fast_function_summary <ipa_size_summary *, va_heap>
 624                                                          (symtab);
 625   ipa_fn_summaries = ipa_fn_summary_t::create_ggc (symtab);
 626   ipa_call_summaries = new ipa_call_summary_t (symtab);
 627 }
 628
 629 ipa_call_summary::~ipa_call_summary ()
 630 {
 631   if (predicate)
 632     edge_predicate_pool.remove (predicate);
 633
 634   param.release ();
 635 }
 636
 637 ipa_fn_summary::~ipa_fn_summary ()
 638 {
 639   if (loop_iterations)
 640     edge_predicate_pool.remove (loop_iterations);
 641   if (loop_stride)
 642     edge_predicate_pool.remove (loop_stride);
 643   vec_free (conds);
 644   vec_free (size_time_table);
 645 }
 646
 647 void
 648 ipa_fn_summary_t::remove_callees (cgraph_node *node)
 649 {
 650   cgraph_edge *e;
 651   for (e = node->callees; e; e = e->next_callee)
 652     ipa_call_summaries->remove (e);
 653   for (e = node->indirect_calls; e; e = e->next_callee)
 654     ipa_call_summaries->remove (e);
 655 }
 656
 657 /* Same as remap_predicate_after_duplication but handle hint predicate *P.
 658    Additionally care about allocating new memory slot for updated predicate
 659    and set it to NULL when it becomes true or false (and thus uninteresting).
 660  */
 661
 662 static void
 663 remap_hint_predicate_after_duplication (predicate **p,
 664                                         clause_t possible_truths)
 665 {
 666   predicate new_predicate;
 667
 668   if (!*p)
 669     return;
 670
 671   new_predicate = (*p)->remap_after_duplication (possible_truths);
 672   /* We do not want to free previous predicate; it is used by node origin.  */
 673   *p = NULL;
 674   set_hint_predicate (p, new_predicate);
 675 }
 676
 677
 678 /* Hook that is called by cgraph.c when a node is duplicated.  */
 679 void
 680 ipa_fn_summary_t::duplicate (cgraph_node *src,
 681                              cgraph_node *dst,
 682                              ipa_fn_summary *,
 683                              ipa_fn_summary *info)
 684 {
 685   new (info) ipa_fn_summary (*ipa_fn_summaries->get (src));
 686   /* TODO: as an optimization, we may avoid copying conditions
 687      that are known to be false or true.  */
 688   info->conds = vec_safe_copy (info->conds);
 689
 690   /* When there are any replacements in the function body, see if we can figure
 691      out that something was optimized out.  */
 692   if (ipa_node_params_sum && dst->clone.tree_map)
 693     {
 694       vec<size_time_entry, va_gc> *entry = info->size_time_table;
 695       /* Use SRC parm info since it may not be copied yet.  */
 696       class ipa_node_params *parms_info = IPA_NODE_REF (src);
 697       vec<tree> known_vals = vNULL;
 698       int count = ipa_get_param_count (parms_info);
 699       int i, j;
 700       clause_t possible_truths;
 701       predicate true_pred = true;
 702       size_time_entry *e;
 703       int optimized_out_size = 0;
 704       bool inlined_to_p = false;
 705       struct cgraph_edge *edge, *next;
 706
 707       info->size_time_table = 0;
 708       known_vals.safe_grow_cleared (count);
 709       for (i = 0; i < count; i++)
 710         {
 711           struct ipa_replace_map *r;
 712
 713           for (j = 0; vec_safe_iterate (dst->clone.tree_map, j, &r); j++)
 714             {
 715               if (r->parm_num == i)
 716                 {
 717                   known_vals[i] = r->new_tree;
 718                   break;
 719                 }
 720             }
 721         }
 722       evaluate_conditions_for_known_args (dst, false,
 723                                           known_vals,
 724                                           vNULL,
 725                                           vNULL,
 726                                           &possible_truths,
 727                                           /* We are going to specialize,
 728                                              so ignore nonspec truths.  */
 729                                           NULL);
 730       known_vals.release ();
 731
 732       info->account_size_time (0, 0, true_pred, true_pred);
 733
 734       /* Remap size_time vectors.
 735          Simplify the predicate by prunning out alternatives that are known
 736          to be false.
 737          TODO: as on optimization, we can also eliminate conditions known
 738          to be true.  */
 739       for (i = 0; vec_safe_iterate (entry, i, &e); i++)
 740         {
 741           predicate new_exec_pred;
 742           predicate new_nonconst_pred;
 743           new_exec_pred = e->exec_predicate.remap_after_duplication
 744                                  (possible_truths);
 745           new_nonconst_pred = e->nonconst_predicate.remap_after_duplication
 746                                  (possible_truths);
 747           if (new_exec_pred == false || new_nonconst_pred == false)
 748             optimized_out_size += e->size;
 749           else
 750             info->account_size_time (e->size, e->time, new_exec_pred,
 751                                      new_nonconst_pred);
 752         }
 753
 754       /* Remap edge predicates with the same simplification as above.
 755          Also copy constantness arrays.   */
 756       for (edge = dst->callees; edge; edge = next)
 757         {
 758           predicate new_predicate;
 759           class ipa_call_summary *es = ipa_call_summaries->get (edge);
 760           next = edge->next_callee;
 761
 762           if (!edge->inline_failed)
 763             inlined_to_p = true;
 764           if (!es->predicate)
 765             continue;
 766           new_predicate = es->predicate->remap_after_duplication
 767             (possible_truths);
 768           if (new_predicate == false && *es->predicate != false)
 769             optimized_out_size += es->call_stmt_size * ipa_fn_summary::size_scale;
 770           edge_set_predicate (edge, &new_predicate);
 771         }
 772
 773       /* Remap indirect edge predicates with the same simplificaiton as above.
 774          Also copy constantness arrays.   */
 775       for (edge = dst->indirect_calls; edge; edge = next)
 776         {
 777           predicate new_predicate;
 778           class ipa_call_summary *es = ipa_call_summaries->get (edge);
 779           next = edge->next_callee;
 780
 781           gcc_checking_assert (edge->inline_failed);
 782           if (!es->predicate)
 783             continue;
 784           new_predicate = es->predicate->remap_after_duplication
 785                                  (possible_truths);
 786           if (new_predicate == false && *es->predicate != false)
 787             optimized_out_size += es->call_stmt_size * ipa_fn_summary::size_scale;
 788           edge_set_predicate (edge, &new_predicate);
 789         }
 790       remap_hint_predicate_after_duplication (&info->loop_iterations,
 791                                               possible_truths);
 792       remap_hint_predicate_after_duplication (&info->loop_stride,
 793                                               possible_truths);
 794
 795       /* If inliner or someone after inliner will ever start producing
 796          non-trivial clones, we will get trouble with lack of information
 797          about updating self sizes, because size vectors already contains
 798          sizes of the calees.  */
 799       gcc_assert (!inlined_to_p || !optimized_out_size);
 800     }
 801   else
 802     {
 803       info->size_time_table = vec_safe_copy (info->size_time_table);
 804       if (info->loop_iterations)
 805         {
 806           predicate p = *info->loop_iterations;
 807           info->loop_iterations = NULL;
 808           set_hint_predicate (&info->loop_iterations, p);
 809         }
 810       if (info->loop_stride)
 811         {
 812           predicate p = *info->loop_stride;
 813           info->loop_stride = NULL;
 814           set_hint_predicate (&info->loop_stride, p);
 815         }
 816     }
 817   if (!dst->inlined_to)
 818     ipa_update_overall_fn_summary (dst);
 819 }
 820
 821
 822 /* Hook that is called by cgraph.c when a node is duplicated.  */
 823
 824 void
 825 ipa_call_summary_t::duplicate (struct cgraph_edge *src,
 826                                struct cgraph_edge *dst,
 827                                class ipa_call_summary *srcinfo,
 828                                class ipa_call_summary *info)
 829 {
 830   new (info) ipa_call_summary (*srcinfo);
 831   info->predicate = NULL;
 832   edge_set_predicate (dst, srcinfo->predicate);
 833   info->param = srcinfo->param.copy ();
 834   if (!dst->indirect_unknown_callee && src->indirect_unknown_callee)
 835     {
 836       info->call_stmt_size -= (eni_size_weights.indirect_call_cost
 837                                - eni_size_weights.call_cost);
 838       info->call_stmt_time -= (eni_time_weights.indirect_call_cost
 839                                - eni_time_weights.call_cost);
 840     }
 841 }
 842
 843 /* Dump edge summaries associated to NODE and recursively to all clones.
 844    Indent by INDENT.  */
 845
 846 static void
 847 dump_ipa_call_summary (FILE *f, int indent, struct cgraph_node *node,
 848                        class ipa_fn_summary *info)
 849 {
 850   struct cgraph_edge *edge;
 851   for (edge = node->callees; edge; edge = edge->next_callee)
 852     {
 853       class ipa_call_summary *es = ipa_call_summaries->get (edge);
 854       struct cgraph_node *callee = edge->callee->ultimate_alias_target ();
 855       int i;
 856
 857       fprintf (f,
 858                "%*s%s/%i %s\n%*s  freq:%4.2f",
 859                indent, "", callee->name (), callee->order,
 860                !edge->inline_failed
 861                ? "inlined" : cgraph_inline_failed_string (edge-> inline_failed),
 862                indent, "", edge->sreal_frequency ().to_double ());
 863
 864       if (es)
 865         fprintf (f, " loop depth:%2i size:%2i time: %2i",
 866                  es->loop_depth, es->call_stmt_size, es->call_stmt_time);
 867
 868       ipa_fn_summary *s = ipa_fn_summaries->get (callee);
 869       ipa_size_summary *ss = ipa_size_summaries->get (callee);
 870       if (s != NULL)
 871         fprintf (f, " callee size:%2i stack:%2i",
 872                  (int) (ss->size / ipa_fn_summary::size_scale),
 873                  (int) s->estimated_stack_size);
 874
 875       if (es && es->predicate)
 876         {
 877           fprintf (f, " predicate: ");
 878           es->predicate->dump (f, info->conds);
 879         }
 880       else
 881         fprintf (f, "\n");
 882       if (es && es->param.exists ())
 883         for (i = 0; i < (int) es->param.length (); i++)
 884           {
 885             int prob = es->param[i].change_prob;
 886
 887             if (!prob)
 888               fprintf (f, "%*s op%i is compile time invariant\n",
 889                        indent + 2, "", i);
 890             else if (prob != REG_BR_PROB_BASE)
 891               fprintf (f, "%*s op%i change %f%% of time\n", indent + 2, "", i,
 892                        prob * 100.0 / REG_BR_PROB_BASE);
 893           }
 894       if (!edge->inline_failed)
 895         {
 896           ipa_size_summary *ss = ipa_size_summaries->get (callee);
 897           fprintf (f, "%*sStack frame offset %i, callee self size %i\n",
 898                    indent + 2, "",
 899                    (int) ipa_get_stack_frame_offset (callee),
 900                    (int) ss->estimated_self_stack_size);
 901           dump_ipa_call_summary (f, indent + 2, callee, info);
 902         }
 903     }
 904   for (edge = node->indirect_calls; edge; edge = edge->next_callee)
 905     {
 906       class ipa_call_summary *es = ipa_call_summaries->get (edge);
 907       fprintf (f, "%*sindirect call loop depth:%2i freq:%4.2f size:%2i"
 908                " time: %2i",
 909                indent, "",
 910                es->loop_depth,
 911                edge->sreal_frequency ().to_double (), es->call_stmt_size,
 912                es->call_stmt_time);
 913       if (es->predicate)
 914         {
 915           fprintf (f, "predicate: ");
 916           es->predicate->dump (f, info->conds);
 917         }
 918       else
 919         fprintf (f, "\n");
 920     }
 921 }
 922
 923
 924 void
 925 ipa_dump_fn_summary (FILE *f, struct cgraph_node *node)
 926 {
 927   if (node->definition)
 928     {
 929       class ipa_fn_summary *s = ipa_fn_summaries->get (node);
 930       class ipa_size_summary *ss = ipa_size_summaries->get (node);
 931       if (s != NULL)
 932         {
 933           size_time_entry *e;
 934           int i;
 935           fprintf (f, "IPA function summary for %s", node->dump_name ());
 936           if (DECL_DISREGARD_INLINE_LIMITS (node->decl))
 937             fprintf (f, " always_inline");
 938           if (s->inlinable)
 939             fprintf (f, " inlinable");
 940           if (s->fp_expressions)
 941             fprintf (f, " fp_expression");
 942           fprintf (f, "\n  global time:     %f\n", s->time.to_double ());
 943           fprintf (f, "  self size:       %i\n", ss->self_size);
 944           fprintf (f, "  global size:     %i\n", ss->size);
 945           fprintf (f, "  min size:       %i\n", s->min_size);
 946           fprintf (f, "  self stack:      %i\n",
 947                    (int) ss->estimated_self_stack_size);
 948           fprintf (f, "  global stack:    %i\n", (int) s->estimated_stack_size);
 949           if (s->growth)
 950             fprintf (f, "  estimated growth:%i\n", (int) s->growth);
 951           if (s->scc_no)
 952             fprintf (f, "  In SCC:          %i\n", (int) s->scc_no);
 953           for (i = 0; vec_safe_iterate (s->size_time_table, i, &e); i++)
 954             {
 955               fprintf (f, "    size:%f, time:%f",
 956                        (double) e->size / ipa_fn_summary::size_scale,
 957                        e->time.to_double ());
 958               if (e->exec_predicate != true)
 959                 {
 960                   fprintf (f, ",  executed if:");
 961                   e->exec_predicate.dump (f, s->conds, 0);
 962                 }
 963               if (e->exec_predicate != e->nonconst_predicate)
 964                 {
 965                   fprintf (f, ",  nonconst if:");
 966                   e->nonconst_predicate.dump (f, s->conds, 0);
 967                 }
 968               fprintf (f, "\n");
 969             }
 970           if (s->loop_iterations)
 971             {
 972               fprintf (f, "  loop iterations:");
 973               s->loop_iterations->dump (f, s->conds);
 974             }
 975           if (s->loop_stride)
 976             {
 977               fprintf (f, "  loop stride:");
 978               s->loop_stride->dump (f, s->conds);
 979             }
 980           fprintf (f, "  calls:\n");
 981           dump_ipa_call_summary (f, 4, node, s);
 982           fprintf (f, "\n");
 983         }
 984       else
 985         fprintf (f, "IPA summary for %s is missing.\n", node->dump_name ());
 986     }
 987 }
 988
 989 DEBUG_FUNCTION void
 990 ipa_debug_fn_summary (struct cgraph_node *node)
 991 {
 992   ipa_dump_fn_summary (stderr, node);
 993 }
 994
 995 void
 996 ipa_dump_fn_summaries (FILE *f)
 997 {
 998   struct cgraph_node *node;
 999
1000   FOR_EACH_DEFINED_FUNCTION (node)
1001     if (!node->inlined_to)
1002       ipa_dump_fn_summary (f, node);
1003 }
1004
1005 /* Callback of walk_aliased_vdefs.  Flags that it has been invoked to the
1006    boolean variable pointed to by DATA.  */
1007
1008 static bool
1009 mark_modified (ao_ref *ao ATTRIBUTE_UNUSED, tree vdef ATTRIBUTE_UNUSED,
1010                void *data)
1011 {
1012   bool *b = (bool *) data;
1013   *b = true;
1014   return true;
1015 }
1016
1017 /* If OP refers to value of function parameter, return the corresponding
1018    parameter.  If non-NULL, the size of the memory load (or the SSA_NAME of the
1019    PARM_DECL) will be stored to *SIZE_P in that case too.  */
1020
1021 static tree
1022 unmodified_parm_1 (ipa_func_body_info *fbi, gimple *stmt, tree op,
1023                    poly_int64 *size_p)
1024 {
1025   /* SSA_NAME referring to parm default def?  */
1026   if (TREE_CODE (op) == SSA_NAME
1027       && SSA_NAME_IS_DEFAULT_DEF (op)
1028       && TREE_CODE (SSA_NAME_VAR (op)) == PARM_DECL)
1029     {
1030       if (size_p)
1031         *size_p = tree_to_poly_int64 (TYPE_SIZE (TREE_TYPE (op)));
1032       return SSA_NAME_VAR (op);
1033     }
1034   /* Non-SSA parm reference?  */
1035   if (TREE_CODE (op) == PARM_DECL)
1036     {
1037       bool modified = false;
1038
1039       ao_ref refd;
1040       ao_ref_init (&refd, op);
1041       int walked = walk_aliased_vdefs (&refd, gimple_vuse (stmt),
1042                                        mark_modified, &modified, NULL, NULL,
1043                                        fbi->aa_walk_budget + 1);
1044       if (walked < 0)
1045         {
1046           fbi->aa_walk_budget = 0;
1047           return NULL_TREE;
1048         }
1049       if (!modified)
1050         {
1051           if (size_p)
1052             *size_p = tree_to_poly_int64 (TYPE_SIZE (TREE_TYPE (op)));
1053           return op;
1054         }
1055     }
1056   return NULL_TREE;
1057 }
1058
1059 /* If OP refers to value of function parameter, return the corresponding
1060    parameter.  Also traverse chains of SSA register assignments.  If non-NULL,
1061    the size of the memory load (or the SSA_NAME of the PARM_DECL) will be
1062    stored to *SIZE_P in that case too.  */
1063
1064 static tree
1065 unmodified_parm (ipa_func_body_info *fbi, gimple *stmt, tree op,
1066                  poly_int64 *size_p)
1067 {
1068   tree res = unmodified_parm_1 (fbi, stmt, op, size_p);
1069   if (res)
1070     return res;
1071
1072   if (TREE_CODE (op) == SSA_NAME
1073       && !SSA_NAME_IS_DEFAULT_DEF (op)
1074       && gimple_assign_single_p (SSA_NAME_DEF_STMT (op)))
1075     return unmodified_parm (fbi, SSA_NAME_DEF_STMT (op),
1076                             gimple_assign_rhs1 (SSA_NAME_DEF_STMT (op)),
1077                             size_p);
1078   return NULL_TREE;
1079 }
1080
1081 /* If OP refers to a value of a function parameter or value loaded from an
1082    aggregate passed to a parameter (either by value or reference), return TRUE
1083    and store the number of the parameter to *INDEX_P, the access size into
1084    *SIZE_P, and information whether and how it has been loaded from an
1085    aggregate into *AGGPOS.  INFO describes the function parameters, STMT is the
1086    statement in which OP is used or loaded.  */
1087
1088 static bool
1089 unmodified_parm_or_parm_agg_item (struct ipa_func_body_info *fbi,
1090                                   gimple *stmt, tree op, int *index_p,
1091                                   poly_int64 *size_p,
1092                                   struct agg_position_info *aggpos)
1093 {
1094   tree res = unmodified_parm_1 (fbi, stmt, op, size_p);
1095
1096   gcc_checking_assert (aggpos);
1097   if (res)
1098     {
1099       *index_p = ipa_get_param_decl_index (fbi->info, res);
1100       if (*index_p < 0)
1101         return false;
1102       aggpos->agg_contents = false;
1103       aggpos->by_ref = false;
1104       return true;
1105     }
1106
1107   if (TREE_CODE (op) == SSA_NAME)
1108     {
1109       if (SSA_NAME_IS_DEFAULT_DEF (op)
1110           || !gimple_assign_single_p (SSA_NAME_DEF_STMT (op)))
1111         return false;
1112       stmt = SSA_NAME_DEF_STMT (op);
1113       op = gimple_assign_rhs1 (stmt);
1114       if (!REFERENCE_CLASS_P (op))
1115         return unmodified_parm_or_parm_agg_item (fbi, stmt, op, index_p, size_p,
1116                                                  aggpos);
1117     }
1118
1119   aggpos->agg_contents = true;
1120   return ipa_load_from_parm_agg (fbi, fbi->info->descriptors,
1121                                  stmt, op, index_p, &aggpos->offset,
1122                                  size_p, &aggpos->by_ref);
1123 }
1124
1125 /* See if statement might disappear after inlining.
1126    0 - means not eliminated
1127    1 - half of statements goes away
1128    2 - for sure it is eliminated.
1129    We are not terribly sophisticated, basically looking for simple abstraction
1130    penalty wrappers.  */
1131
1132 static int
1133 eliminated_by_inlining_prob (ipa_func_body_info *fbi, gimple *stmt)
1134 {
1135   enum gimple_code code = gimple_code (stmt);
1136   enum tree_code rhs_code;
1137
1138   if (!optimize)
1139     return 0;
1140
1141   switch (code)
1142     {
1143     case GIMPLE_RETURN:
1144       return 2;
1145     case GIMPLE_ASSIGN:
1146       if (gimple_num_ops (stmt) != 2)
1147         return 0;
1148
1149       rhs_code = gimple_assign_rhs_code (stmt);
1150
1151       /* Casts of parameters, loads from parameters passed by reference
1152          and stores to return value or parameters are often free after
1153          inlining dua to SRA and further combining.
1154          Assume that half of statements goes away.  */
1155       if (CONVERT_EXPR_CODE_P (rhs_code)
1156           || rhs_code == VIEW_CONVERT_EXPR
1157           || rhs_code == ADDR_EXPR
1158           || gimple_assign_rhs_class (stmt) == GIMPLE_SINGLE_RHS)
1159         {
1160           tree rhs = gimple_assign_rhs1 (stmt);
1161           tree lhs = gimple_assign_lhs (stmt);
1162           tree inner_rhs = get_base_address (rhs);
1163           tree inner_lhs = get_base_address (lhs);
1164           bool rhs_free = false;
1165           bool lhs_free = false;
1166
1167           if (!inner_rhs)
1168             inner_rhs = rhs;
1169           if (!inner_lhs)
1170             inner_lhs = lhs;
1171
1172           /* Reads of parameter are expected to be free.  */
1173           if (unmodified_parm (fbi, stmt, inner_rhs, NULL))
1174             rhs_free = true;
1175           /* Match expressions of form &this->field. Those will most likely
1176              combine with something upstream after inlining.  */
1177           else if (TREE_CODE (inner_rhs) == ADDR_EXPR)
1178             {
1179               tree op = get_base_address (TREE_OPERAND (inner_rhs, 0));
1180               if (TREE_CODE (op) == PARM_DECL)
1181                 rhs_free = true;
1182               else if (TREE_CODE (op) == MEM_REF
1183                        && unmodified_parm (fbi, stmt, TREE_OPERAND (op, 0),
1184                                            NULL))
1185                 rhs_free = true;
1186             }
1187
1188           /* When parameter is not SSA register because its address is taken
1189              and it is just copied into one, the statement will be completely
1190              free after inlining (we will copy propagate backward).   */
1191           if (rhs_free && is_gimple_reg (lhs))
1192             return 2;
1193
1194           /* Reads of parameters passed by reference
1195              expected to be free (i.e. optimized out after inlining).  */
1196           if (TREE_CODE (inner_rhs) == MEM_REF
1197               && unmodified_parm (fbi, stmt, TREE_OPERAND (inner_rhs, 0), NULL))
1198             rhs_free = true;
1199
1200           /* Copying parameter passed by reference into gimple register is
1201              probably also going to copy propagate, but we can't be quite
1202              sure.  */
1203           if (rhs_free && is_gimple_reg (lhs))
1204             lhs_free = true;
1205
1206           /* Writes to parameters, parameters passed by value and return value
1207              (either dirrectly or passed via invisible reference) are free.
1208
1209              TODO: We ought to handle testcase like
1210              struct a {int a,b;};
1211              struct a
1212              retrurnsturct (void)
1213              {
1214              struct a a ={1,2};
1215              return a;
1216              }
1217
1218              This translate into:
1219
1220              retrurnsturct ()
1221              {
1222              int a$b;
1223              int a$a;
1224              struct a a;
1225              struct a D.2739;
1226
1227              <bb 2>:
1228              D.2739.a = 1;
1229              D.2739.b = 2;
1230              return D.2739;
1231
1232              }
1233              For that we either need to copy ipa-split logic detecting writes
1234              to return value.  */
1235           if (TREE_CODE (inner_lhs) == PARM_DECL
1236               || TREE_CODE (inner_lhs) == RESULT_DECL
1237               || (TREE_CODE (inner_lhs) == MEM_REF
1238                   && (unmodified_parm (fbi, stmt, TREE_OPERAND (inner_lhs, 0),
1239                                        NULL)
1240                       || (TREE_CODE (TREE_OPERAND (inner_lhs, 0)) == SSA_NAME
1241                           && SSA_NAME_VAR (TREE_OPERAND (inner_lhs, 0))
1242                           && TREE_CODE (SSA_NAME_VAR (TREE_OPERAND
1243                                                       (inner_lhs,
1244                                                        0))) == RESULT_DECL))))
1245             lhs_free = true;
1246           if (lhs_free
1247               && (is_gimple_reg (rhs) || is_gimple_min_invariant (rhs)))
1248             rhs_free = true;
1249           if (lhs_free && rhs_free)
1250             return 1;
1251         }
1252       return 0;
1253     default:
1254       return 0;
1255     }
1256 }
1257
1258 /* Analyze EXPR if it represents a series of simple operations performed on
1259    a function parameter and return true if so.  FBI, STMT, EXPR, INDEX_P and
1260    AGGPOS have the same meaning like in unmodified_parm_or_parm_agg_item.
1261    Type of the parameter or load from an aggregate via the parameter is
1262    stored in *TYPE_P.  Operations on the parameter are recorded to
1263    PARAM_OPS_P if it is not NULL.  */
1264
1265 static bool
1266 decompose_param_expr (struct ipa_func_body_info *fbi,
1267                       gimple *stmt, tree expr,
1268                       int *index_p, tree *type_p,
1269                       struct agg_position_info *aggpos,
1270                       expr_eval_ops *param_ops_p = NULL)
1271 {
1272   int op_limit = param_ipa_max_param_expr_ops;
1273   int op_count = 0;
1274
1275   if (param_ops_p)
1276     *param_ops_p = NULL;
1277
1278   while (true)
1279     {
1280       expr_eval_op eval_op;
1281       unsigned rhs_count;
1282       unsigned cst_count = 0;
1283
1284       if (unmodified_parm_or_parm_agg_item (fbi, stmt, expr, index_p, NULL,
1285                                             aggpos))
1286         {
1287           tree type = TREE_TYPE (expr);
1288
1289           if (aggpos->agg_contents)
1290             {
1291               /* Stop if containing bit-field.  */
1292               if (TREE_CODE (expr) == BIT_FIELD_REF
1293                   || contains_bitfld_component_ref_p (expr))
1294                 break;
1295             }
1296
1297           *type_p = type;
1298           return true;
1299         }
1300
1301       if (TREE_CODE (expr) != SSA_NAME || SSA_NAME_IS_DEFAULT_DEF (expr))
1302         break;
1303
1304       if (!is_gimple_assign (stmt = SSA_NAME_DEF_STMT (expr)))
1305         break;
1306
1307       switch (gimple_assign_rhs_class (stmt))
1308         {
1309         case GIMPLE_SINGLE_RHS:
1310           expr = gimple_assign_rhs1 (stmt);
1311           continue;
1312
1313         case GIMPLE_UNARY_RHS:
1314           rhs_count = 1;
1315           break;
1316
1317         case GIMPLE_BINARY_RHS:
1318           rhs_count = 2;
1319           break;
1320
1321         case GIMPLE_TERNARY_RHS:
1322           rhs_count = 3;
1323           break;
1324
1325         default:
1326           goto fail;
1327         }
1328
1329       /* Stop if expression is too complex.  */
1330       if (op_count++ == op_limit)
1331         break;
1332
1333       if (param_ops_p)
1334         {
1335           eval_op.code = gimple_assign_rhs_code (stmt);
1336           eval_op.type = TREE_TYPE (gimple_assign_lhs (stmt));
1337           eval_op.val[0] = NULL_TREE;
1338           eval_op.val[1] = NULL_TREE;
1339         }
1340
1341       expr = NULL_TREE;
1342       for (unsigned i = 0; i < rhs_count; i++)
1343         {
1344           tree op = gimple_op (stmt, i + 1);
1345
1346           gcc_assert (op && !TYPE_P (op));
1347           if (is_gimple_ip_invariant (op))
1348             {
1349               if (++cst_count == rhs_count)
1350                 goto fail;
1351
1352               eval_op.val[cst_count - 1] = op;
1353             }
1354           else if (!expr)
1355             {
1356               /* Found a non-constant operand, and record its index in rhs
1357                  operands.  */
1358               eval_op.index = i;
1359               expr = op;
1360             }
1361           else
1362             {
1363               /* Found more than one non-constant operands.  */
1364               goto fail;
1365             }
1366         }
1367
1368       if (param_ops_p)
1369         vec_safe_insert (*param_ops_p, 0, eval_op);
1370     }
1371
1372   /* Failed to decompose, free resource and return.  */
1373 fail:
1374   if (param_ops_p)
1375     vec_free (*param_ops_p);
1376
1377   return false;
1378 }
1379
1380 /* If BB ends by a conditional we can turn into predicates, attach corresponding
1381    predicates to the CFG edges.   */
1382
1383 static void
1384 set_cond_stmt_execution_predicate (struct ipa_func_body_info *fbi,
1385                                    class ipa_fn_summary *summary,
1386                                    class ipa_node_params *params_summary,
1387                                    basic_block bb)
1388 {
1389   gimple *last;
1390   tree op, op2;
1391   int index;
1392   struct agg_position_info aggpos;
1393   enum tree_code code, inverted_code;
1394   edge e;
1395   edge_iterator ei;
1396   gimple *set_stmt;
1397   tree param_type;
1398   expr_eval_ops param_ops;
1399
1400   last = last_stmt (bb);
1401   if (!last || gimple_code (last) != GIMPLE_COND)
1402     return;
1403   if (!is_gimple_ip_invariant (gimple_cond_rhs (last)))
1404     return;
1405   op = gimple_cond_lhs (last);
1406
1407   if (decompose_param_expr (fbi, last, op, &index, &param_type, &aggpos,
1408                             &param_ops))
1409     {
1410       code = gimple_cond_code (last);
1411       inverted_code = invert_tree_comparison (code, HONOR_NANS (op));
1412
1413       FOR_EACH_EDGE (e, ei, bb->succs)
1414         {
1415           enum tree_code this_code = (e->flags & EDGE_TRUE_VALUE
1416                                       ? code : inverted_code);
1417           /* invert_tree_comparison will return ERROR_MARK on FP
1418              comparsions that are not EQ/NE instead of returning proper
1419              unordered one.  Be sure it is not confused with NON_CONSTANT.
1420
1421              And if the edge's target is the final block of diamond CFG graph
1422              of this conditional statement, we do not need to compute
1423              predicate for the edge because the final block's predicate must
1424              be at least as that of the first block of the statement.  */
1425           if (this_code != ERROR_MARK
1426               && !dominated_by_p (CDI_POST_DOMINATORS, bb, e->dest))
1427             {
1428               predicate p
1429                 = add_condition (summary, params_summary, index,
1430                                  param_type, &aggpos,
1431                                  this_code, gimple_cond_rhs (last), param_ops);
1432               e->aux = edge_predicate_pool.allocate ();
1433               *(predicate *) e->aux = p;
1434             }
1435         }
1436       vec_free (param_ops);
1437     }
1438
1439   if (TREE_CODE (op) != SSA_NAME)
1440     return;
1441   /* Special case
1442      if (builtin_constant_p (op))
1443      constant_code
1444      else
1445      nonconstant_code.
1446      Here we can predicate nonconstant_code.  We can't
1447      really handle constant_code since we have no predicate
1448      for this and also the constant code is not known to be
1449      optimized away when inliner doen't see operand is constant.
1450      Other optimizers might think otherwise.  */
1451   if (gimple_cond_code (last) != NE_EXPR
1452       || !integer_zerop (gimple_cond_rhs (last)))
1453     return;
1454   set_stmt = SSA_NAME_DEF_STMT (op);
1455   if (!gimple_call_builtin_p (set_stmt, BUILT_IN_CONSTANT_P)
1456       || gimple_call_num_args (set_stmt) != 1)
1457     return;
1458   op2 = gimple_call_arg (set_stmt, 0);
1459   if (!decompose_param_expr (fbi, set_stmt, op2, &index, &param_type, &aggpos))
1460     return;
1461   FOR_EACH_EDGE (e, ei, bb->succs) if (e->flags & EDGE_FALSE_VALUE)
1462     {
1463       predicate p = add_condition (summary, params_summary, index,
1464                                    param_type, &aggpos,
1465                                    predicate::is_not_constant, NULL_TREE);
1466       e->aux = edge_predicate_pool.allocate ();
1467       *(predicate *) e->aux = p;
1468     }
1469 }
1470
1471
1472 /* If BB ends by a switch we can turn into predicates, attach corresponding
1473    predicates to the CFG edges.   */
1474
1475 static void
1476 set_switch_stmt_execution_predicate (struct ipa_func_body_info *fbi,
1477                                      class ipa_fn_summary *summary,
1478                                      class ipa_node_params *params_summary,
1479                                      basic_block bb)
1480 {
1481   gimple *lastg;
1482   tree op;
1483   int index;
1484   struct agg_position_info aggpos;
1485   edge e;
1486   edge_iterator ei;
1487   size_t n;
1488   size_t case_idx;
1489   tree param_type;
1490   expr_eval_ops param_ops;
1491
1492   lastg = last_stmt (bb);
1493   if (!lastg || gimple_code (lastg) != GIMPLE_SWITCH)
1494     return;
1495   gswitch *last = as_a <gswitch *> (lastg);
1496   op = gimple_switch_index (last);
1497   if (!decompose_param_expr (fbi, last, op, &index, &param_type, &aggpos,
1498                              &param_ops))
1499     return;
1500
1501   auto_vec<std::pair<tree, tree> > ranges;
1502   tree type = TREE_TYPE (op);
1503   int bound_limit = param_ipa_max_switch_predicate_bounds;
1504   int bound_count = 0;
1505   wide_int vr_wmin, vr_wmax;
1506   value_range_kind vr_type = get_range_info (op, &vr_wmin, &vr_wmax);
1507
1508   FOR_EACH_EDGE (e, ei, bb->succs)
1509     {
1510       e->aux = edge_predicate_pool.allocate ();
1511       *(predicate *) e->aux = false;
1512     }
1513
1514   e = gimple_switch_edge (cfun, last, 0);
1515   /* Set BOUND_COUNT to maximum count to bypass computing predicate for
1516      default case if its target basic block is in convergence point of all
1517      switch cases, which can be determined by checking whether it
1518      post-dominates the switch statement.  */
1519   if (dominated_by_p (CDI_POST_DOMINATORS, bb, e->dest))
1520     bound_count = INT_MAX;
1521
1522   n = gimple_switch_num_labels (last);
1523   for (case_idx = 1; case_idx < n; ++case_idx)
1524     {
1525       tree cl = gimple_switch_label (last, case_idx);
1526       tree min = CASE_LOW (cl);
1527       tree max = CASE_HIGH (cl);
1528       predicate p;
1529
1530       e = gimple_switch_edge (cfun, last, case_idx);
1531
1532       /* The case value might not have same type as switch expression,
1533          extend the value based on the expression type.  */
1534       if (TREE_TYPE (min) != type)
1535         min = wide_int_to_tree (type, wi::to_wide (min));
1536
1537       if (!max)
1538         max = min;
1539       else if (TREE_TYPE (max) != type)
1540         max = wide_int_to_tree (type, wi::to_wide (max));
1541
1542       /* The case's target basic block is in convergence point of all switch
1543          cases, its predicate should be at least as that of the switch
1544          statement.  */
1545       if (dominated_by_p (CDI_POST_DOMINATORS, bb, e->dest))
1546         p = true;
1547       else if (min == max)
1548         p = add_condition (summary, params_summary, index, param_type,
1549                            &aggpos, EQ_EXPR, min, param_ops);
1550       else
1551         {
1552           predicate p1, p2;
1553           p1 = add_condition (summary, params_summary, index, param_type,
1554                               &aggpos, GE_EXPR, min, param_ops);
1555           p2 = add_condition (summary,  params_summary,index, param_type,
1556                               &aggpos, LE_EXPR, max, param_ops);
1557           p = p1 & p2;
1558         }
1559       *(class predicate *) e->aux
1560         = p.or_with (summary->conds, *(class predicate *) e->aux);
1561
1562       /* If there are too many disjoint case ranges, predicate for default
1563          case might become too complicated.  So add a limit here.  */
1564       if (bound_count > bound_limit)
1565         continue;
1566
1567       bool new_range = true;
1568
1569       if (!ranges.is_empty ())
1570         {
1571           wide_int curr_wmin = wi::to_wide (min);
1572           wide_int last_wmax = wi::to_wide (ranges.last ().second);
1573
1574           /* Merge case ranges if they are continuous.  */
1575           if (curr_wmin == last_wmax + 1)
1576             new_range = false;
1577           else if (vr_type == VR_ANTI_RANGE)
1578             {
1579               /* If two disjoint case ranges can be connected by anti-range
1580                  of switch index, combine them to one range.  */
1581               if (wi::lt_p (vr_wmax, curr_wmin - 1, TYPE_SIGN (type)))
1582                 vr_type = VR_UNDEFINED;
1583               else if (wi::le_p (vr_wmin, last_wmax + 1, TYPE_SIGN (type)))
1584                 new_range = false;
1585             }
1586         }
1587
1588       /* Create/extend a case range.  And we count endpoints of range set,
1589          this number nearly equals to number of conditions that we will create
1590          for predicate of default case.  */
1591       if (new_range)
1592         {
1593           bound_count += (min == max) ? 1 : 2;
1594           ranges.safe_push (std::make_pair (min, max));
1595         }
1596       else
1597         {
1598           bound_count += (ranges.last ().first == ranges.last ().second);
1599           ranges.last ().second = max;
1600         }
1601     }
1602
1603   e = gimple_switch_edge (cfun, last, 0);
1604   if (bound_count > bound_limit)
1605     {
1606       *(class predicate *) e->aux = true;
1607       vec_free (param_ops);
1608       return;
1609     }
1610
1611   predicate p_seg = true;
1612   predicate p_all = false;
1613
1614   if (vr_type != VR_RANGE)
1615     {
1616       vr_wmin = wi::to_wide (TYPE_MIN_VALUE (type));
1617       vr_wmax = wi::to_wide (TYPE_MAX_VALUE (type));
1618     }
1619
1620   /* Construct predicate to represent default range set that is negation of
1621      all case ranges.  Case range is classified as containing single/non-single
1622      values.  Suppose a piece of case ranges in the following.
1623
1624                 [D1...D2]  [S1] ... [Sn]  [D3...D4]
1625
1626      To represent default case's range sets between two non-single value
1627      case ranges (From D2 to D3), we construct predicate as:
1628
1629               D2 < x < D3 && x != S1 && ... && x != Sn
1630    */
1631   for (size_t i = 0; i < ranges.length (); i++)
1632     {
1633       tree min = ranges[i].first;
1634       tree max = ranges[i].second;
1635
1636       if (min == max)
1637         p_seg &= add_condition (summary, params_summary, index,
1638                                 param_type, &aggpos, NE_EXPR,
1639                                 min, param_ops);
1640       else
1641         {
1642           /* Do not create sub-predicate for range that is beyond low bound
1643              of switch index.  */
1644           if (wi::lt_p (vr_wmin, wi::to_wide (min), TYPE_SIGN (type)))
1645             {
1646               p_seg &= add_condition (summary, params_summary, index,
1647                                       param_type, &aggpos,
1648                                       LT_EXPR, min, param_ops);
1649               p_all = p_all.or_with (summary->conds, p_seg);
1650             }
1651
1652           /* Do not create sub-predicate for range that is beyond up bound
1653              of switch index.  */
1654           if (wi::le_p (vr_wmax, wi::to_wide (max), TYPE_SIGN (type)))
1655             {
1656               p_seg = false;
1657               break;
1658             }
1659
1660           p_seg = add_condition (summary, params_summary, index,
1661                                  param_type, &aggpos, GT_EXPR,
1662                                  max, param_ops);
1663         }
1664     }
1665
1666   p_all = p_all.or_with (summary->conds, p_seg);
1667   *(class predicate *) e->aux
1668     = p_all.or_with (summary->conds, *(class predicate *) e->aux);
1669
1670   vec_free (param_ops);
1671 }
1672
1673
1674 /* For each BB in NODE attach to its AUX pointer predicate under
1675    which it is executable.  */
1676
1677 static void
1678 compute_bb_predicates (struct ipa_func_body_info *fbi,
1679                        struct cgraph_node *node,
1680                        class ipa_fn_summary *summary,
1681                        class ipa_node_params *params_summary)
1682 {
1683   struct function *my_function = DECL_STRUCT_FUNCTION (node->decl);
1684   bool done = false;
1685   basic_block bb;
1686
1687   FOR_EACH_BB_FN (bb, my_function)
1688     {
1689       set_cond_stmt_execution_predicate (fbi, summary, params_summary, bb);
1690       set_switch_stmt_execution_predicate (fbi, summary, params_summary, bb);
1691     }
1692
1693   /* Entry block is always executable.  */
1694   ENTRY_BLOCK_PTR_FOR_FN (my_function)->aux
1695     = edge_predicate_pool.allocate ();
1696   *(predicate *) ENTRY_BLOCK_PTR_FOR_FN (my_function)->aux = true;
1697
1698   /* A simple dataflow propagation of predicates forward in the CFG.
1699      TODO: work in reverse postorder.  */
1700   while (!done)
1701     {
1702       done = true;
1703       FOR_EACH_BB_FN (bb, my_function)
1704         {
1705           predicate p = false;
1706           edge e;
1707           edge_iterator ei;
1708           FOR_EACH_EDGE (e, ei, bb->preds)
1709             {
1710               if (e->src->aux)
1711                 {
1712                   predicate this_bb_predicate
1713                     = *(predicate *) e->src->aux;
1714                   if (e->aux)
1715                     this_bb_predicate &= (*(class predicate *) e->aux);
1716                   p = p.or_with (summary->conds, this_bb_predicate);
1717                   if (p == true)
1718                     break;
1719                 }
1720             }
1721           if (p != false)
1722             {
1723               basic_block pdom_bb;
1724
1725               if (!bb->aux)
1726                 {
1727                   done = false;
1728                   bb->aux = edge_predicate_pool.allocate ();
1729                   *((predicate *) bb->aux) = p;
1730                 }
1731               else if (p != *(predicate *) bb->aux)
1732                 {
1733                   /* This OR operation is needed to ensure monotonous data flow
1734                      in the case we hit the limit on number of clauses and the
1735                      and/or operations above give approximate answers.  */
1736                   p = p.or_with (summary->conds, *(predicate *)bb->aux);
1737                   if (p != *(predicate *) bb->aux)
1738                     {
1739                       done = false;
1740                       *((predicate *) bb->aux) = p;
1741                     }
1742                 }
1743
1744               /* For switch/if statement, we can OR-combine predicates of all
1745                  its cases/branches to get predicate for basic block in their
1746                  convergence point, but sometimes this will generate very
1747                  complicated predicate.  Actually, we can get simplified
1748                  predicate in another way by using the fact that predicate
1749                  for a basic block must also hold true for its post dominators.
1750                  To be specific, basic block in convergence point of
1751                  conditional statement should include predicate of the
1752                  statement.  */
1753               pdom_bb = get_immediate_dominator (CDI_POST_DOMINATORS, bb);
1754               if (pdom_bb == EXIT_BLOCK_PTR_FOR_FN (my_function) || !pdom_bb)
1755                 ;
1756               else if (!pdom_bb->aux)
1757                 {
1758                   done = false;
1759                   pdom_bb->aux = edge_predicate_pool.allocate ();
1760                   *((predicate *) pdom_bb->aux) = p;
1761                 }
1762               else if (p != *(predicate *) pdom_bb->aux)
1763                 {
1764                   p = p.or_with (summary->conds, *(predicate *)pdom_bb->aux);
1765                   if (p != *(predicate *) pdom_bb->aux)
1766                     {
1767                       done = false;
1768                       *((predicate *) pdom_bb->aux) = p;
1769                     }
1770                 }
1771             }
1772         }
1773     }
1774 }
1775
1776
1777 /* Return predicate specifying when the STMT might have result that is not
1778    a compile time constant.  */
1779
1780 static predicate
1781 will_be_nonconstant_expr_predicate (ipa_func_body_info *fbi,
1782                                     class ipa_fn_summary *summary,
1783                                     class ipa_node_params *params_summary,
1784                                     tree expr,
1785                                     vec<predicate> nonconstant_names)
1786 {
1787   tree parm;
1788   int index;
1789
1790   while (UNARY_CLASS_P (expr))
1791     expr = TREE_OPERAND (expr, 0);
1792
1793   parm = unmodified_parm (fbi, NULL, expr, NULL);
1794   if (parm && (index = ipa_get_param_decl_index (fbi->info, parm)) >= 0)
1795     return add_condition (summary, params_summary, index, TREE_TYPE (parm), NULL,
1796                           predicate::changed, NULL_TREE);
1797   if (is_gimple_min_invariant (expr))
1798     return false;
1799   if (TREE_CODE (expr) == SSA_NAME)
1800     return nonconstant_names[SSA_NAME_VERSION (expr)];
1801   if (BINARY_CLASS_P (expr) || COMPARISON_CLASS_P (expr))
1802     {
1803       predicate p1
1804         = will_be_nonconstant_expr_predicate (fbi, summary,
1805                                               params_summary,
1806                                               TREE_OPERAND (expr, 0),
1807                                               nonconstant_names);
1808       if (p1 == true)
1809         return p1;
1810
1811       predicate p2
1812         = will_be_nonconstant_expr_predicate (fbi, summary,
1813                                               params_summary,
1814                                               TREE_OPERAND (expr, 1),
1815                                               nonconstant_names);
1816       return p1.or_with (summary->conds, p2);
1817     }
1818   else if (TREE_CODE (expr) == COND_EXPR)
1819     {
1820       predicate p1
1821         = will_be_nonconstant_expr_predicate (fbi, summary,
1822                                               params_summary,
1823                                               TREE_OPERAND (expr, 0),
1824                                               nonconstant_names);
1825       if (p1 == true)
1826         return p1;
1827
1828       predicate p2
1829         = will_be_nonconstant_expr_predicate (fbi, summary,
1830                                               params_summary,
1831                                               TREE_OPERAND (expr, 1),
1832                                               nonconstant_names);
1833       if (p2 == true)
1834         return p2;
1835       p1 = p1.or_with (summary->conds, p2);
1836       p2 = will_be_nonconstant_expr_predicate (fbi, summary,
1837                                                params_summary,
1838                                                TREE_OPERAND (expr, 2),
1839                                                nonconstant_names);
1840       return p2.or_with (summary->conds, p1);
1841     }
1842   else if (TREE_CODE (expr) == CALL_EXPR)
1843     return true;
1844   else
1845     {
1846       debug_tree (expr);
1847       gcc_unreachable ();
1848     }
1849   return false;
1850 }
1851
1852
1853 /* Return predicate specifying when the STMT might have result that is not
1854    a compile time constant.  */
1855
1856 static predicate
1857 will_be_nonconstant_predicate (struct ipa_func_body_info *fbi,
1858                                class ipa_fn_summary *summary,
1859                                class ipa_node_params *params_summary,
1860                                gimple *stmt,
1861                                vec<predicate> nonconstant_names)
1862 {
1863   predicate p = true;
1864   ssa_op_iter iter;
1865   tree use;
1866   tree param_type = NULL_TREE;
1867   predicate op_non_const;
1868   bool is_load;
1869   int base_index;
1870   struct agg_position_info aggpos;
1871
1872   /* What statments might be optimized away
1873      when their arguments are constant.  */
1874   if (gimple_code (stmt) != GIMPLE_ASSIGN
1875       && gimple_code (stmt) != GIMPLE_COND
1876       && gimple_code (stmt) != GIMPLE_SWITCH
1877       && (gimple_code (stmt) != GIMPLE_CALL
1878           || !(gimple_call_flags (stmt) & ECF_CONST)))
1879     return p;
1880
1881   /* Stores will stay anyway.  */
1882   if (gimple_store_p (stmt))
1883     return p;
1884
1885   is_load = gimple_assign_load_p (stmt);
1886
1887   /* Loads can be optimized when the value is known.  */
1888   if (is_load)
1889     {
1890       tree op = gimple_assign_rhs1 (stmt);
1891       if (!decompose_param_expr (fbi, stmt, op, &base_index, &param_type,
1892                                  &aggpos))
1893         return p;
1894     }
1895   else
1896     base_index = -1;
1897
1898   /* See if we understand all operands before we start
1899      adding conditionals.  */
1900   FOR_EACH_SSA_TREE_OPERAND (use, stmt, iter, SSA_OP_USE)
1901     {
1902       tree parm = unmodified_parm (fbi, stmt, use, NULL);
1903       /* For arguments we can build a condition.  */
1904       if (parm && ipa_get_param_decl_index (fbi->info, parm) >= 0)
1905         continue;
1906       if (TREE_CODE (use) != SSA_NAME)
1907         return p;
1908       /* If we know when operand is constant,
1909          we still can say something useful.  */
1910       if (nonconstant_names[SSA_NAME_VERSION (use)] != true)
1911         continue;
1912       return p;
1913     }
1914
1915   if (is_load)
1916     op_non_const =
1917       add_condition (summary, params_summary,
1918                      base_index, param_type, &aggpos,
1919                      predicate::changed, NULL_TREE);
1920   else
1921     op_non_const = false;
1922   FOR_EACH_SSA_TREE_OPERAND (use, stmt, iter, SSA_OP_USE)
1923     {
1924       tree parm = unmodified_parm (fbi, stmt, use, NULL);
1925       int index;
1926
1927       if (parm && (index = ipa_get_param_decl_index (fbi->info, parm)) >= 0)
1928         {
1929           if (index != base_index)
1930             p = add_condition (summary, params_summary, index,
1931                                TREE_TYPE (parm), NULL,
1932                                predicate::changed, NULL_TREE);
1933           else
1934             continue;
1935         }
1936       else
1937         p = nonconstant_names[SSA_NAME_VERSION (use)];
1938       op_non_const = p.or_with (summary->conds, op_non_const);
1939     }
1940   if ((gimple_code (stmt) == GIMPLE_ASSIGN || gimple_code (stmt) == GIMPLE_CALL)
1941       && gimple_op (stmt, 0)
1942       && TREE_CODE (gimple_op (stmt, 0)) == SSA_NAME)
1943     nonconstant_names[SSA_NAME_VERSION (gimple_op (stmt, 0))]
1944       = op_non_const;
1945   return op_non_const;
1946 }
1947
1948 struct record_modified_bb_info
1949 {
1950   tree op;
1951   bitmap bb_set;
1952   gimple *stmt;
1953 };
1954
1955 /* Value is initialized in INIT_BB and used in USE_BB.  We want to copute
1956    probability how often it changes between USE_BB.
1957    INIT_BB->count/USE_BB->count is an estimate, but if INIT_BB
1958    is in different loop nest, we can do better.
1959    This is all just estimate.  In theory we look for minimal cut separating
1960    INIT_BB and USE_BB, but we only want to anticipate loop invariant motion
1961    anyway.  */
1962
1963 static basic_block
1964 get_minimal_bb (basic_block init_bb, basic_block use_bb)
1965 {
1966   class loop *l = find_common_loop (init_bb->loop_father, use_bb->loop_father);
1967   if (l && l->header->count < init_bb->count)
1968     return l->header;
1969   return init_bb;
1970 }
1971
1972 /* Callback of walk_aliased_vdefs.  Records basic blocks where the value may be
1973    set except for info->stmt.  */
1974
1975 static bool
1976 record_modified (ao_ref *ao ATTRIBUTE_UNUSED, tree vdef, void *data)
1977 {
1978   struct record_modified_bb_info *info =
1979     (struct record_modified_bb_info *) data;
1980   if (SSA_NAME_DEF_STMT (vdef) == info->stmt)
1981     return false;
1982   if (gimple_clobber_p (SSA_NAME_DEF_STMT (vdef)))
1983     return false;
1984   bitmap_set_bit (info->bb_set,
1985                   SSA_NAME_IS_DEFAULT_DEF (vdef)
1986                   ? ENTRY_BLOCK_PTR_FOR_FN (cfun)->index
1987                   : get_minimal_bb
1988                          (gimple_bb (SSA_NAME_DEF_STMT (vdef)),
1989                           gimple_bb (info->stmt))->index);
1990   if (dump_file)
1991     {
1992       fprintf (dump_file, "     Param ");
1993       print_generic_expr (dump_file, info->op, TDF_SLIM);
1994       fprintf (dump_file, " changed at bb %i, minimal: %i stmt: ",
1995                gimple_bb (SSA_NAME_DEF_STMT (vdef))->index,
1996                get_minimal_bb
1997                          (gimple_bb (SSA_NAME_DEF_STMT (vdef)),
1998                           gimple_bb (info->stmt))->index);
1999       print_gimple_stmt (dump_file, SSA_NAME_DEF_STMT (vdef), 0);
2000     }
2001   return false;
2002 }
2003
2004 /* Return probability (based on REG_BR_PROB_BASE) that I-th parameter of STMT
2005    will change since last invocation of STMT.
2006
2007    Value 0 is reserved for compile time invariants.
2008    For common parameters it is REG_BR_PROB_BASE.  For loop invariants it
2009    ought to be REG_BR_PROB_BASE / estimated_iters.  */
2010
2011 static int
2012 param_change_prob (ipa_func_body_info *fbi, gimple *stmt, int i)
2013 {
2014   tree op = gimple_call_arg (stmt, i);
2015   basic_block bb = gimple_bb (stmt);
2016
2017   if (TREE_CODE (op) == WITH_SIZE_EXPR)
2018     op = TREE_OPERAND (op, 0);
2019
2020   tree base = get_base_address (op);
2021
2022   /* Global invariants never change.  */
2023   if (is_gimple_min_invariant (base))
2024     return 0;
2025
2026   /* We would have to do non-trivial analysis to really work out what
2027      is the probability of value to change (i.e. when init statement
2028      is in a sibling loop of the call).
2029
2030      We do an conservative estimate: when call is executed N times more often
2031      than the statement defining value, we take the frequency 1/N.  */
2032   if (TREE_CODE (base) == SSA_NAME)
2033     {
2034       profile_count init_count;
2035
2036       if (!bb->count.nonzero_p ())
2037         return REG_BR_PROB_BASE;
2038
2039       if (SSA_NAME_IS_DEFAULT_DEF (base))
2040         init_count = ENTRY_BLOCK_PTR_FOR_FN (cfun)->count;
2041       else
2042         init_count = get_minimal_bb
2043                       (gimple_bb (SSA_NAME_DEF_STMT (base)),
2044                        gimple_bb (stmt))->count;
2045
2046       if (init_count < bb->count)
2047         return MAX ((init_count.to_sreal_scale (bb->count)
2048                      * REG_BR_PROB_BASE).to_int (), 1);
2049       return REG_BR_PROB_BASE;
2050     }
2051   else
2052     {
2053       ao_ref refd;
2054       profile_count max = ENTRY_BLOCK_PTR_FOR_FN (cfun)->count;
2055       struct record_modified_bb_info info;
2056       tree init = ctor_for_folding (base);
2057
2058       if (init != error_mark_node)
2059         return 0;
2060       if (!bb->count.nonzero_p ())
2061         return REG_BR_PROB_BASE;
2062       if (dump_file)
2063         {
2064           fprintf (dump_file, "     Analyzing param change probability of ");
2065           print_generic_expr (dump_file, op, TDF_SLIM);
2066           fprintf (dump_file, "\n");
2067         }
2068       ao_ref_init (&refd, op);
2069       info.op = op;
2070       info.stmt = stmt;
2071       info.bb_set = BITMAP_ALLOC (NULL);
2072       int walked
2073         = walk_aliased_vdefs (&refd, gimple_vuse (stmt), record_modified, &info,
2074                               NULL, NULL, fbi->aa_walk_budget);
2075       if (walked < 0 || bitmap_bit_p (info.bb_set, bb->index))
2076         {
2077           if (dump_file)
2078             {
2079               if (walked < 0)
2080                 fprintf (dump_file, "     Ran out of AA walking budget.\n");
2081               else
2082                 fprintf (dump_file, "     Set in same BB as used.\n");
2083             }
2084           BITMAP_FREE (info.bb_set);
2085           return REG_BR_PROB_BASE;
2086         }
2087
2088       bitmap_iterator bi;
2089       unsigned index;
2090       /* Lookup the most frequent update of the value and believe that
2091          it dominates all the other; precise analysis here is difficult.  */
2092       EXECUTE_IF_SET_IN_BITMAP (info.bb_set, 0, index, bi)
2093         max = max.max (BASIC_BLOCK_FOR_FN (cfun, index)->count);
2094       if (dump_file)
2095         {
2096           fprintf (dump_file, "     Set with count ");
2097           max.dump (dump_file);
2098           fprintf (dump_file, " and used with count ");
2099           bb->count.dump (dump_file);
2100           fprintf (dump_file, " freq %f\n",
2101                    max.to_sreal_scale (bb->count).to_double ());
2102         }
2103
2104       BITMAP_FREE (info.bb_set);
2105       if (max < bb->count)
2106         return MAX ((max.to_sreal_scale (bb->count)
2107                      * REG_BR_PROB_BASE).to_int (), 1);
2108       return REG_BR_PROB_BASE;
2109     }
2110 }
2111
2112 /* Find whether a basic block BB is the final block of a (half) diamond CFG
2113    sub-graph and if the predicate the condition depends on is known.  If so,
2114    return true and store the pointer the predicate in *P.  */
2115
2116 static bool
2117 phi_result_unknown_predicate (ipa_func_body_info *fbi,
2118                               ipa_fn_summary *summary,
2119                               class ipa_node_params *params_summary,
2120                               basic_block bb,
2121                               predicate *p,
2122                               vec<predicate> nonconstant_names)
2123 {
2124   edge e;
2125   edge_iterator ei;
2126   basic_block first_bb = NULL;
2127   gimple *stmt;
2128
2129   if (single_pred_p (bb))
2130     {
2131       *p = false;
2132       return true;
2133     }
2134
2135   FOR_EACH_EDGE (e, ei, bb->preds)
2136     {
2137       if (single_succ_p (e->src))
2138         {
2139           if (!single_pred_p (e->src))
2140             return false;
2141           if (!first_bb)
2142             first_bb = single_pred (e->src);
2143           else if (single_pred (e->src) != first_bb)
2144             return false;
2145         }
2146       else
2147         {
2148           if (!first_bb)
2149             first_bb = e->src;
2150           else if (e->src != first_bb)
2151             return false;
2152         }
2153     }
2154
2155   if (!first_bb)
2156     return false;
2157
2158   stmt = last_stmt (first_bb);
2159   if (!stmt
2160       || gimple_code (stmt) != GIMPLE_COND
2161       || !is_gimple_ip_invariant (gimple_cond_rhs (stmt)))
2162     return false;
2163
2164   *p = will_be_nonconstant_expr_predicate (fbi, summary, params_summary,
2165                                            gimple_cond_lhs (stmt),
2166                                            nonconstant_names);
2167   if (*p == true)
2168     return false;
2169   else
2170     return true;
2171 }
2172
2173 /* Given a PHI statement in a function described by inline properties SUMMARY
2174    and *P being the predicate describing whether the selected PHI argument is
2175    known, store a predicate for the result of the PHI statement into
2176    NONCONSTANT_NAMES, if possible.  */
2177
2178 static void
2179 predicate_for_phi_result (class ipa_fn_summary *summary, gphi *phi,
2180                           predicate *p,
2181                           vec<predicate> nonconstant_names)
2182 {
2183   unsigned i;
2184
2185   for (i = 0; i < gimple_phi_num_args (phi); i++)
2186     {
2187       tree arg = gimple_phi_arg (phi, i)->def;
2188       if (!is_gimple_min_invariant (arg))
2189         {
2190           gcc_assert (TREE_CODE (arg) == SSA_NAME);
2191           *p = p->or_with (summary->conds,
2192                            nonconstant_names[SSA_NAME_VERSION (arg)]);
2193           if (*p == true)
2194             return;
2195         }
2196     }
2197
2198   if (dump_file && (dump_flags & TDF_DETAILS))
2199     {
2200       fprintf (dump_file, "\t\tphi predicate: ");
2201       p->dump (dump_file, summary->conds);
2202     }
2203   nonconstant_names[SSA_NAME_VERSION (gimple_phi_result (phi))] = *p;
2204 }
2205
2206 /* For a typical usage of __builtin_expect (a<b, 1), we
2207    may introduce an extra relation stmt:
2208    With the builtin, we have
2209      t1 = a <= b;
2210      t2 = (long int) t1;
2211      t3 = __builtin_expect (t2, 1);
2212      if (t3 != 0)
2213        goto ...
2214    Without the builtin, we have
2215      if (a<=b)
2216        goto...
2217    This affects the size/time estimation and may have
2218    an impact on the earlier inlining.
2219    Here find this pattern and fix it up later.  */
2220
2221 static gimple *
2222 find_foldable_builtin_expect (basic_block bb)
2223 {
2224   gimple_stmt_iterator bsi;
2225
2226   for (bsi = gsi_start_bb (bb); !gsi_end_p (bsi); gsi_next (&bsi))
2227     {
2228       gimple *stmt = gsi_stmt (bsi);
2229       if (gimple_call_builtin_p (stmt, BUILT_IN_EXPECT)
2230           || gimple_call_builtin_p (stmt, BUILT_IN_EXPECT_WITH_PROBABILITY)
2231           || gimple_call_internal_p (stmt, IFN_BUILTIN_EXPECT))
2232         {
2233           tree var = gimple_call_lhs (stmt);
2234           tree arg = gimple_call_arg (stmt, 0);
2235           use_operand_p use_p;
2236           gimple *use_stmt;
2237           bool match = false;
2238           bool done = false;
2239
2240           if (!var || !arg)
2241             continue;
2242           gcc_assert (TREE_CODE (var) == SSA_NAME);
2243
2244           while (TREE_CODE (arg) == SSA_NAME)
2245             {
2246               gimple *stmt_tmp = SSA_NAME_DEF_STMT (arg);
2247               if (!is_gimple_assign (stmt_tmp))
2248                 break;
2249               switch (gimple_assign_rhs_code (stmt_tmp))
2250                 {
2251                   case LT_EXPR:
2252                   case LE_EXPR:
2253                   case GT_EXPR:
2254                   case GE_EXPR:
2255                   case EQ_EXPR:
2256                   case NE_EXPR:
2257                     match = true;
2258                     done = true;
2259                     break;
2260                   CASE_CONVERT:
2261                     break;
2262                   default:
2263                     done = true;
2264                     break;
2265                 }
2266               if (done)
2267                 break;
2268               arg = gimple_assign_rhs1 (stmt_tmp);
2269             }
2270
2271           if (match && single_imm_use (var, &use_p, &use_stmt)
2272               && gimple_code (use_stmt) == GIMPLE_COND)
2273             return use_stmt;
2274         }
2275     }
2276   return NULL;
2277 }
2278
2279 /* Return true when the basic blocks contains only clobbers followed by RESX.
2280    Such BBs are kept around to make removal of dead stores possible with
2281    presence of EH and will be optimized out by optimize_clobbers later in the
2282    game.
2283
2284    NEED_EH is used to recurse in case the clobber has non-EH predecestors
2285    that can be clobber only, too.. When it is false, the RESX is not necessary
2286    on the end of basic block.  */
2287
2288 static bool
2289 clobber_only_eh_bb_p (basic_block bb, bool need_eh = true)
2290 {
2291   gimple_stmt_iterator gsi = gsi_last_bb (bb);
2292   edge_iterator ei;
2293   edge e;
2294
2295   if (need_eh)
2296     {
2297       if (gsi_end_p (gsi))
2298         return false;
2299       if (gimple_code (gsi_stmt (gsi)) != GIMPLE_RESX)
2300         return false;
2301       gsi_prev (&gsi);
2302     }
2303   else if (!single_succ_p (bb))
2304     return false;
2305
2306   for (; !gsi_end_p (gsi); gsi_prev (&gsi))
2307     {
2308       gimple *stmt = gsi_stmt (gsi);
2309       if (is_gimple_debug (stmt))
2310         continue;
2311       if (gimple_clobber_p (stmt))
2312         continue;
2313       if (gimple_code (stmt) == GIMPLE_LABEL)
2314         break;
2315       return false;
2316     }
2317
2318   /* See if all predecestors are either throws or clobber only BBs.  */
2319   FOR_EACH_EDGE (e, ei, bb->preds)
2320     if (!(e->flags & EDGE_EH)
2321         && !clobber_only_eh_bb_p (e->src, false))
2322       return false;
2323
2324   return true;
2325 }
2326
2327 /* Return true if STMT compute a floating point expression that may be affected
2328    by -ffast-math and similar flags.  */
2329
2330 static bool
2331 fp_expression_p (gimple *stmt)
2332 {
2333   ssa_op_iter i;
2334   tree op;
2335
2336   FOR_EACH_SSA_TREE_OPERAND (op, stmt, i, SSA_OP_DEF|SSA_OP_USE)
2337     if (FLOAT_TYPE_P (TREE_TYPE (op)))
2338       return true;
2339   return false;
2340 }
2341
2342 /* Analyze function body for NODE.
2343    EARLY indicates run from early optimization pipeline.  */
2344
2345 static void
2346 analyze_function_body (struct cgraph_node *node, bool early)
2347 {
2348   sreal time = param_uninlined_function_time;
2349   /* Estimate static overhead for function prologue/epilogue and alignment. */
2350   int size = param_uninlined_function_insns;
2351   /* Benefits are scaled by probability of elimination that is in range
2352      <0,2>.  */
2353   basic_block bb;
2354   struct function *my_function = DECL_STRUCT_FUNCTION (node->decl);
2355   sreal freq;
2356   class ipa_fn_summary *info = ipa_fn_summaries->get_create (node);
2357   class ipa_node_params *params_summary = early ? NULL : IPA_NODE_REF (node);
2358   predicate bb_predicate;
2359   struct ipa_func_body_info fbi;
2360   vec<predicate> nonconstant_names = vNULL;
2361   int nblocks, n;
2362   int *order;
2363   gimple *fix_builtin_expect_stmt;
2364
2365   gcc_assert (my_function && my_function->cfg);
2366   gcc_assert (cfun == my_function);
2367
2368   memset(&fbi, 0, sizeof(fbi));
2369   vec_free (info->conds);
2370   info->conds = NULL;
2371   vec_free (info->size_time_table);
2372   info->size_time_table = NULL;
2373
2374   /* When optimizing and analyzing for IPA inliner, initialize loop optimizer
2375      so we can produce proper inline hints.
2376
2377      When optimizing and analyzing for early inliner, initialize node params
2378      so we can produce correct BB predicates.  */
2379
2380   if (opt_for_fn (node->decl, optimize))
2381     {
2382       calculate_dominance_info (CDI_DOMINATORS);
2383       calculate_dominance_info (CDI_POST_DOMINATORS);
2384       if (!early)
2385         loop_optimizer_init (LOOPS_NORMAL | LOOPS_HAVE_RECORDED_EXITS);
2386       else
2387         {
2388           ipa_check_create_node_params ();
2389           ipa_initialize_node_params (node);
2390         }
2391
2392       if (ipa_node_params_sum)
2393         {
2394           fbi.node = node;
2395           fbi.info = IPA_NODE_REF (node);
2396           fbi.bb_infos = vNULL;
2397           fbi.bb_infos.safe_grow_cleared (last_basic_block_for_fn (cfun));
2398           fbi.param_count = count_formal_params (node->decl);
2399           fbi.aa_walk_budget = param_ipa_max_aa_steps;
2400
2401           nonconstant_names.safe_grow_cleared
2402             (SSANAMES (my_function)->length ());
2403         }
2404     }
2405
2406   if (dump_file)
2407     fprintf (dump_file, "\nAnalyzing function body size: %s\n",
2408              node->name ());
2409
2410   /* When we run into maximal number of entries, we assign everything to the
2411      constant truth case.  Be sure to have it in list. */
2412   bb_predicate = true;
2413   info->account_size_time (0, 0, bb_predicate, bb_predicate);
2414
2415   bb_predicate = predicate::not_inlined ();
2416   info->account_size_time (param_uninlined_function_insns
2417                            * ipa_fn_summary::size_scale,
2418                            param_uninlined_function_time,
2419                            bb_predicate,
2420                            bb_predicate);
2421
2422   if (fbi.info)
2423     compute_bb_predicates (&fbi, node, info, params_summary);
2424   order = XNEWVEC (int, n_basic_blocks_for_fn (cfun));
2425   nblocks = pre_and_rev_post_order_compute (NULL, order, false);
2426   for (n = 0; n < nblocks; n++)
2427     {
2428       bb = BASIC_BLOCK_FOR_FN (cfun, order[n]);
2429       freq = bb->count.to_sreal_scale (ENTRY_BLOCK_PTR_FOR_FN (cfun)->count);
2430       if (clobber_only_eh_bb_p (bb))
2431         {
2432           if (dump_file && (dump_flags & TDF_DETAILS))
2433             fprintf (dump_file, "\n Ignoring BB %i;"
2434                      " it will be optimized away by cleanup_clobbers\n",
2435                      bb->index);
2436           continue;
2437         }
2438
2439       /* TODO: Obviously predicates can be propagated down across CFG.  */
2440       if (fbi.info)
2441         {
2442           if (bb->aux)
2443             bb_predicate = *(predicate *) bb->aux;
2444           else
2445             bb_predicate = false;
2446         }
2447       else
2448         bb_predicate = true;
2449
2450       if (dump_file && (dump_flags & TDF_DETAILS))
2451         {
2452           fprintf (dump_file, "\n BB %i predicate:", bb->index);
2453           bb_predicate.dump (dump_file, info->conds);
2454         }
2455
2456       if (fbi.info && nonconstant_names.exists ())
2457         {
2458           predicate phi_predicate;
2459           bool first_phi = true;
2460
2461           for (gphi_iterator bsi = gsi_start_phis (bb); !gsi_end_p (bsi);
2462                gsi_next (&bsi))
2463             {
2464               if (first_phi
2465                   && !phi_result_unknown_predicate (&fbi, info,
2466                                                     params_summary,
2467                                                     bb,
2468                                                     &phi_predicate,
2469                                                     nonconstant_names))
2470                 break;
2471               first_phi = false;
2472               if (dump_file && (dump_flags & TDF_DETAILS))
2473                 {
2474                   fprintf (dump_file, "  ");
2475                   print_gimple_stmt (dump_file, gsi_stmt (bsi), 0);
2476                 }
2477               predicate_for_phi_result (info, bsi.phi (), &phi_predicate,
2478                                         nonconstant_names);
2479             }
2480         }
2481
2482       fix_builtin_expect_stmt = find_foldable_builtin_expect (bb);
2483
2484       for (gimple_stmt_iterator bsi = gsi_start_nondebug_bb (bb);
2485            !gsi_end_p (bsi); gsi_next_nondebug (&bsi))
2486         {
2487           gimple *stmt = gsi_stmt (bsi);
2488           int this_size = estimate_num_insns (stmt, &eni_size_weights);
2489           int this_time = estimate_num_insns (stmt, &eni_time_weights);
2490           int prob;
2491           predicate will_be_nonconstant;
2492
2493           /* This relation stmt should be folded after we remove
2494              buildin_expect call. Adjust the cost here.  */
2495           if (stmt == fix_builtin_expect_stmt)
2496             {
2497               this_size--;
2498               this_time--;
2499             }
2500
2501           if (dump_file && (dump_flags & TDF_DETAILS))
2502             {
2503               fprintf (dump_file, "  ");
2504               print_gimple_stmt (dump_file, stmt, 0);
2505               fprintf (dump_file, "\t\tfreq:%3.2f size:%3i time:%3i\n",
2506                        freq.to_double (), this_size,
2507                        this_time);
2508             }
2509
2510           if (is_gimple_call (stmt)
2511               && !gimple_call_internal_p (stmt))
2512             {
2513               struct cgraph_edge *edge = node->get_edge (stmt);
2514               ipa_call_summary *es = ipa_call_summaries->get_create (edge);
2515
2516               /* Special case: results of BUILT_IN_CONSTANT_P will be always
2517                  resolved as constant.  We however don't want to optimize
2518                  out the cgraph edges.  */
2519               if (nonconstant_names.exists ()
2520                   && gimple_call_builtin_p (stmt, BUILT_IN_CONSTANT_P)
2521                   && gimple_call_lhs (stmt)
2522                   && TREE_CODE (gimple_call_lhs (stmt)) == SSA_NAME)
2523                 {
2524                   predicate false_p = false;
2525                   nonconstant_names[SSA_NAME_VERSION (gimple_call_lhs (stmt))]
2526                     = false_p;
2527                 }
2528               if (ipa_node_params_sum)
2529                 {
2530                   int count = gimple_call_num_args (stmt);
2531                   int i;
2532
2533                   if (count)
2534                     es->param.safe_grow_cleared (count);
2535                   for (i = 0; i < count; i++)
2536                     {
2537                       int prob = param_change_prob (&fbi, stmt, i);
2538                       gcc_assert (prob >= 0 && prob <= REG_BR_PROB_BASE);
2539                       es->param[i].change_prob = prob;
2540                     }
2541                 }
2542
2543               es->call_stmt_size = this_size;
2544               es->call_stmt_time = this_time;
2545               es->loop_depth = bb_loop_depth (bb);
2546               edge_set_predicate (edge, &bb_predicate);
2547               if (edge->speculative)
2548                 {
2549                   cgraph_edge *direct, *indirect;
2550                   ipa_ref *ref;
2551                   edge->speculative_call_info (direct, indirect, ref);
2552                   gcc_assert (direct == edge);
2553                   ipa_call_summary *es2
2554                          = ipa_call_summaries->get_create (indirect);
2555                   ipa_call_summaries->duplicate (edge, indirect,
2556                                                  es, es2);
2557                 }
2558             }
2559
2560           /* TODO: When conditional jump or swithc is known to be constant, but
2561              we did not translate it into the predicates, we really can account
2562              just maximum of the possible paths.  */
2563           if (fbi.info)
2564             will_be_nonconstant
2565               = will_be_nonconstant_predicate (&fbi, info, params_summary,
2566                                                stmt, nonconstant_names);
2567           else
2568             will_be_nonconstant = true;
2569           if (this_time || this_size)
2570             {
2571               sreal final_time = (sreal)this_time * freq;
2572
2573               prob = eliminated_by_inlining_prob (&fbi, stmt);
2574               if (prob == 1 && dump_file && (dump_flags & TDF_DETAILS))
2575                 fprintf (dump_file,
2576                          "\t\t50%% will be eliminated by inlining\n");
2577               if (prob == 2 && dump_file && (dump_flags & TDF_DETAILS))
2578                 fprintf (dump_file, "\t\tWill be eliminated by inlining\n");
2579
2580               class predicate p = bb_predicate & will_be_nonconstant;
2581
2582               /* We can ignore statement when we proved it is never going
2583                  to happen, but we cannot do that for call statements
2584                  because edges are accounted specially.  */
2585
2586               if (*(is_gimple_call (stmt) ? &bb_predicate : &p) != false)
2587                 {
2588                   time += final_time;
2589                   size += this_size;
2590                 }
2591
2592               /* We account everything but the calls.  Calls have their own
2593                  size/time info attached to cgraph edges.  This is necessary
2594                  in order to make the cost disappear after inlining.  */
2595               if (!is_gimple_call (stmt))
2596                 {
2597                   if (prob)
2598                     {
2599                       predicate ip = bb_predicate & predicate::not_inlined ();
2600                       info->account_size_time (this_size * prob,
2601                                                (final_time * prob) / 2, ip,
2602                                                p);
2603                     }
2604                   if (prob != 2)
2605                     info->account_size_time (this_size * (2 - prob),
2606                                              (final_time * (2 - prob) / 2),
2607                                              bb_predicate,
2608                                              p);
2609                 }
2610
2611               if (!info->fp_expressions && fp_expression_p (stmt))
2612                 {
2613                   info->fp_expressions = true;
2614                   if (dump_file)
2615                     fprintf (dump_file, "   fp_expression set\n");
2616                 }
2617             }
2618
2619           /* Account cost of address calculations in the statements.  */
2620           for (unsigned int i = 0; i < gimple_num_ops (stmt); i++)
2621             {
2622               for (tree op = gimple_op (stmt, i);
2623                    op && handled_component_p (op);
2624                    op = TREE_OPERAND (op, 0))
2625                 if ((TREE_CODE (op) == ARRAY_REF
2626                      || TREE_CODE (op) == ARRAY_RANGE_REF)
2627                     && TREE_CODE (TREE_OPERAND (op, 1)) == SSA_NAME)
2628                   {
2629                     predicate p = bb_predicate;
2630                     if (fbi.info)
2631                       p = p & will_be_nonconstant_expr_predicate
2632                                  (&fbi, info, params_summary,
2633                                   TREE_OPERAND (op, 1),
2634                                   nonconstant_names);
2635                     if (p != false)
2636                       {
2637                         time += freq;
2638                         size += 1;
2639                         if (dump_file)
2640                           fprintf (dump_file,
2641                                    "\t\tAccounting address calculation.\n");
2642                         info->account_size_time (ipa_fn_summary::size_scale,
2643                                                  freq,
2644                                                  bb_predicate,
2645                                                  p);
2646                       }
2647                   }
2648             }
2649
2650         }
2651     }
2652   free (order);
2653
2654   if (nonconstant_names.exists () && !early)
2655     {
2656       class loop *loop;
2657       predicate loop_iterations = true;
2658       predicate loop_stride = true;
2659
2660       if (dump_file && (dump_flags & TDF_DETAILS))
2661         flow_loops_dump (dump_file, NULL, 0);
2662       scev_initialize ();
2663       FOR_EACH_LOOP (loop, 0)
2664         {
2665           vec<edge> exits;
2666           edge ex;
2667           unsigned int j;
2668           class tree_niter_desc niter_desc;
2669           bb_predicate = *(predicate *) loop->header->aux;
2670
2671           exits = get_loop_exit_edges (loop);
2672           FOR_EACH_VEC_ELT (exits, j, ex)
2673             if (number_of_iterations_exit (loop, ex, &niter_desc, false)
2674                 && !is_gimple_min_invariant (niter_desc.niter))
2675             {
2676               predicate will_be_nonconstant
2677                 = will_be_nonconstant_expr_predicate (&fbi, info,
2678                                                       params_summary,
2679                                                       niter_desc.niter,
2680                                                       nonconstant_names);
2681               if (will_be_nonconstant != true)
2682                 will_be_nonconstant = bb_predicate & will_be_nonconstant;
2683               if (will_be_nonconstant != true
2684                   && will_be_nonconstant != false)
2685                 /* This is slightly inprecise.  We may want to represent each
2686                    loop with independent predicate.  */
2687                 loop_iterations &= will_be_nonconstant;
2688             }
2689           exits.release ();
2690         }
2691
2692       /* To avoid quadratic behavior we analyze stride predicates only
2693          with respect to the containing loop.  Thus we simply iterate
2694          over all defs in the outermost loop body.  */
2695       for (loop = loops_for_fn (cfun)->tree_root->inner;
2696            loop != NULL; loop = loop->next)
2697         {
2698           basic_block *body = get_loop_body (loop);
2699           for (unsigned i = 0; i < loop->num_nodes; i++)
2700             {
2701               gimple_stmt_iterator gsi;
2702               bb_predicate = *(predicate *) body[i]->aux;
2703               for (gsi = gsi_start_bb (body[i]); !gsi_end_p (gsi);
2704                    gsi_next (&gsi))
2705                 {
2706                   gimple *stmt = gsi_stmt (gsi);
2707
2708                   if (!is_gimple_assign (stmt))
2709                     continue;
2710
2711                   tree def = gimple_assign_lhs (stmt);
2712                   if (TREE_CODE (def) != SSA_NAME)
2713                     continue;
2714
2715                   affine_iv iv;
2716                   if (!simple_iv (loop_containing_stmt (stmt),
2717                                   loop_containing_stmt (stmt),
2718                                   def, &iv, true)
2719                       || is_gimple_min_invariant (iv.step))
2720                     continue;
2721
2722                   predicate will_be_nonconstant
2723                     = will_be_nonconstant_expr_predicate (&fbi, info,
2724                                                           params_summary,
2725                                                           iv.step,
2726                                                           nonconstant_names);
2727                   if (will_be_nonconstant != true)
2728                     will_be_nonconstant = bb_predicate & will_be_nonconstant;
2729                   if (will_be_nonconstant != true
2730                       && will_be_nonconstant != false)
2731                     /* This is slightly inprecise.  We may want to represent
2732                        each loop with independent predicate.  */
2733                     loop_stride = loop_stride & will_be_nonconstant;
2734                 }
2735             }
2736           free (body);
2737         }
2738       ipa_fn_summary *s = ipa_fn_summaries->get (node);
2739       set_hint_predicate (&s->loop_iterations, loop_iterations);
2740       set_hint_predicate (&s->loop_stride, loop_stride);
2741       scev_finalize ();
2742     }
2743   FOR_ALL_BB_FN (bb, my_function)
2744     {
2745       edge e;
2746       edge_iterator ei;
2747
2748       if (bb->aux)
2749         edge_predicate_pool.remove ((predicate *)bb->aux);
2750       bb->aux = NULL;
2751       FOR_EACH_EDGE (e, ei, bb->succs)
2752         {
2753           if (e->aux)
2754             edge_predicate_pool.remove ((predicate *) e->aux);
2755           e->aux = NULL;
2756         }
2757     }
2758   ipa_fn_summary *s = ipa_fn_summaries->get (node);
2759   ipa_size_summary *ss = ipa_size_summaries->get (node);
2760   s->time = time;
2761   ss->self_size = size;
2762   nonconstant_names.release ();
2763   ipa_release_body_info (&fbi);
2764   if (opt_for_fn (node->decl, optimize))
2765     {
2766       if (!early)
2767         loop_optimizer_finalize ();
2768       else if (!ipa_edge_args_sum)
2769         ipa_free_all_node_params ();
2770       free_dominance_info (CDI_DOMINATORS);
2771       free_dominance_info (CDI_POST_DOMINATORS);
2772     }
2773   if (dump_file)
2774     {
2775       fprintf (dump_file, "\n");
2776       ipa_dump_fn_summary (dump_file, node);
2777     }
2778 }
2779
2780
2781 /* Compute function summary.
2782    EARLY is true when we compute parameters during early opts.  */
2783
2784 void
2785 compute_fn_summary (struct cgraph_node *node, bool early)
2786 {
2787   HOST_WIDE_INT self_stack_size;
2788   struct cgraph_edge *e;
2789
2790   gcc_assert (!node->inlined_to);
2791
2792   if (!ipa_fn_summaries)
2793     ipa_fn_summary_alloc ();
2794
2795   /* Create a new ipa_fn_summary.  */
2796   ((ipa_fn_summary_t *)ipa_fn_summaries)->remove_callees (node);
2797   ipa_fn_summaries->remove (node);
2798   class ipa_fn_summary *info = ipa_fn_summaries->get_create (node);
2799   class ipa_size_summary *size_info = ipa_size_summaries->get_create (node);
2800
2801   /* Estimate the stack size for the function if we're optimizing.  */
2802   self_stack_size = optimize && !node->thunk.thunk_p
2803                     ? estimated_stack_frame_size (node) : 0;
2804   size_info->estimated_self_stack_size = self_stack_size;
2805   info->estimated_stack_size = self_stack_size;
2806
2807   if (node->thunk.thunk_p)
2808     {
2809       ipa_call_summary *es = ipa_call_summaries->get_create (node->callees);
2810       predicate t = true;
2811
2812       node->can_change_signature = false;
2813       es->call_stmt_size = eni_size_weights.call_cost;
2814       es->call_stmt_time = eni_time_weights.call_cost;
2815       info->account_size_time (ipa_fn_summary::size_scale
2816                                * param_uninlined_function_thunk_insns,
2817                                param_uninlined_function_thunk_time, t, t);
2818       t = predicate::not_inlined ();
2819       info->account_size_time (2 * ipa_fn_summary::size_scale, 0, t, t);
2820       ipa_update_overall_fn_summary (node);
2821       size_info->self_size = size_info->size;
2822       if (stdarg_p (TREE_TYPE (node->decl)))
2823         {
2824           info->inlinable = false;
2825           node->callees->inline_failed = CIF_VARIADIC_THUNK;
2826         }
2827       else
2828         info->inlinable = true;
2829     }
2830   else
2831     {
2832        /* Even is_gimple_min_invariant rely on current_function_decl.  */
2833        push_cfun (DECL_STRUCT_FUNCTION (node->decl));
2834
2835        /* Can this function be inlined at all?  */
2836        if (!opt_for_fn (node->decl, optimize)
2837            && !lookup_attribute ("always_inline",
2838                                  DECL_ATTRIBUTES (node->decl)))
2839          info->inlinable = false;
2840        else
2841          info->inlinable = tree_inlinable_function_p (node->decl);
2842
2843        /* Type attributes can use parameter indices to describe them.  */
2844        if (TYPE_ATTRIBUTES (TREE_TYPE (node->decl))
2845            /* Likewise for #pragma omp declare simd functions or functions
2846               with simd attribute.  */
2847            || lookup_attribute ("omp declare simd",
2848                                 DECL_ATTRIBUTES (node->decl)))
2849          node->can_change_signature = false;
2850        else
2851          {
2852            /* Otherwise, inlinable functions always can change signature.  */
2853            if (info->inlinable)
2854              node->can_change_signature = true;
2855            else
2856              {
2857                /* Functions calling builtin_apply cannot change signature.  */
2858                for (e = node->callees; e; e = e->next_callee)
2859                  {
2860                    tree cdecl = e->callee->decl;
2861                    if (fndecl_built_in_p (cdecl, BUILT_IN_APPLY_ARGS)
2862                        || fndecl_built_in_p (cdecl, BUILT_IN_VA_START))
2863                      break;
2864                  }
2865                node->can_change_signature = !e;
2866              }
2867          }
2868        analyze_function_body (node, early);
2869        pop_cfun ();
2870      }
2871   for (e = node->callees; e; e = e->next_callee)
2872     if (e->callee->comdat_local_p ())
2873       break;
2874   node->calls_comdat_local = (e != NULL);
2875
2876   /* Inlining characteristics are maintained by the cgraph_mark_inline.  */
2877   size_info->size = size_info->self_size;
2878   info->estimated_stack_size = size_info->estimated_self_stack_size;
2879
2880   /* Code above should compute exactly the same result as
2881      ipa_update_overall_fn_summary but because computation happens in
2882      different order the roundoff errors result in slight changes.  */
2883   ipa_update_overall_fn_summary (node);
2884   /* In LTO mode we may have speculative edges set.  */
2885   gcc_assert (in_lto_p || size_info->size == size_info->self_size);
2886 }
2887
2888
2889 /* Compute parameters of functions used by inliner using
2890    current_function_decl.  */
2891
2892 static unsigned int
2893 compute_fn_summary_for_current (void)
2894 {
2895   compute_fn_summary (cgraph_node::get (current_function_decl), true);
2896   return 0;
2897 }
2898
2899 /* Estimate benefit devirtualizing indirect edge IE, provided KNOWN_VALS,
2900    KNOWN_CONTEXTS and KNOWN_AGGS.  */
2901
2902 static bool
2903 estimate_edge_devirt_benefit (struct cgraph_edge *ie,
2904                               int *size, int *time,
2905                               vec<tree> known_vals,
2906                               vec<ipa_polymorphic_call_context> known_contexts,
2907                               vec<ipa_agg_value_set> known_aggs)
2908 {
2909   tree target;
2910   struct cgraph_node *callee;
2911   class ipa_fn_summary *isummary;
2912   enum availability avail;
2913   bool speculative;
2914
2915   if (!known_vals.exists () && !known_contexts.exists ())
2916     return false;
2917   if (!opt_for_fn (ie->caller->decl, flag_indirect_inlining))
2918     return false;
2919
2920   target = ipa_get_indirect_edge_target (ie, known_vals, known_contexts,
2921                                          known_aggs, &speculative);
2922   if (!target || speculative)
2923     return false;
2924
2925   /* Account for difference in cost between indirect and direct calls.  */
2926   *size -= (eni_size_weights.indirect_call_cost - eni_size_weights.call_cost);
2927   *time -= (eni_time_weights.indirect_call_cost - eni_time_weights.call_cost);
2928   gcc_checking_assert (*time >= 0);
2929   gcc_checking_assert (*size >= 0);
2930
2931   callee = cgraph_node::get (target);
2932   if (!callee || !callee->definition)
2933     return false;
2934   callee = callee->function_symbol (&avail);
2935   if (avail < AVAIL_AVAILABLE)
2936     return false;
2937   isummary = ipa_fn_summaries->get (callee);
2938   if (isummary == NULL)
2939     return false;
2940
2941   return isummary->inlinable;
2942 }
2943
2944 /* Increase SIZE, MIN_SIZE (if non-NULL) and TIME for size and time needed to
2945    handle edge E with probability PROB.
2946    Set HINTS if edge may be devirtualized.
2947    KNOWN_VALS, KNOWN_AGGS and KNOWN_CONTEXTS describe context of the call
2948    site.  */
2949
2950 static inline void
2951 estimate_edge_size_and_time (struct cgraph_edge *e, int *size, int *min_size,
2952                              sreal *time,
2953                              int prob,
2954                              vec<tree> known_vals,
2955                              vec<ipa_polymorphic_call_context> known_contexts,
2956                              vec<ipa_agg_value_set> known_aggs,
2957                              ipa_hints *hints)
2958 {
2959   class ipa_call_summary *es = ipa_call_summaries->get (e);
2960   int call_size = es->call_stmt_size;
2961   int call_time = es->call_stmt_time;
2962   int cur_size;
2963   if (!e->callee && hints && e->maybe_hot_p ()
2964       && estimate_edge_devirt_benefit (e, &call_size, &call_time,
2965                                        known_vals, known_contexts, known_aggs))
2966     *hints |= INLINE_HINT_indirect_call;
2967   cur_size = call_size * ipa_fn_summary::size_scale;
2968   *size += cur_size;
2969   if (min_size)
2970     *min_size += cur_size;
2971   if (!time)
2972     ;
2973   else if (prob == REG_BR_PROB_BASE)
2974     *time += ((sreal)call_time) * e->sreal_frequency ();
2975   else
2976     *time += ((sreal)call_time * prob) * e->sreal_frequency ();
2977 }
2978
2979
2980
2981 /* Increase SIZE, MIN_SIZE and TIME for size and time needed to handle all
2982    calls in NODE.  POSSIBLE_TRUTHS, KNOWN_VALS, KNOWN_AGGS and KNOWN_CONTEXTS
2983    describe context of the call site.  */
2984
2985 static void
2986 estimate_calls_size_and_time (struct cgraph_node *node, int *size,
2987                               int *min_size, sreal *time,
2988                               ipa_hints *hints,
2989                               clause_t possible_truths,
2990                               vec<tree> known_vals,
2991                               vec<ipa_polymorphic_call_context> known_contexts,
2992                               vec<ipa_agg_value_set> known_aggs)
2993 {
2994   struct cgraph_edge *e;
2995   for (e = node->callees; e; e = e->next_callee)
2996     {
2997       if (!e->inline_failed)
2998         {
2999           gcc_checking_assert (!ipa_call_summaries->get (e));
3000           estimate_calls_size_and_time (e->callee, size, min_size, time,
3001                                         hints,
3002                                         possible_truths,
3003                                         known_vals, known_contexts,
3004                                         known_aggs);
3005           continue;
3006         }
3007       class ipa_call_summary *es = ipa_call_summaries->get (e);
3008
3009       /* Do not care about zero sized builtins.  */
3010       if (!es->call_stmt_size)
3011         {
3012           gcc_checking_assert (!es->call_stmt_time);
3013           continue;
3014         }
3015       if (!es->predicate
3016           || es->predicate->evaluate (possible_truths))
3017         {
3018           /* Predicates of calls shall not use NOT_CHANGED codes,
3019              sowe do not need to compute probabilities.  */
3020           estimate_edge_size_and_time (e, size,
3021                                        es->predicate ? NULL : min_size,
3022                                        time, REG_BR_PROB_BASE,
3023                                        known_vals, known_contexts,
3024                                        known_aggs, hints);
3025         }
3026     }
3027   for (e = node->indirect_calls; e; e = e->next_callee)
3028     {
3029       class ipa_call_summary *es = ipa_call_summaries->get (e);
3030       if (!es->predicate
3031           || es->predicate->evaluate (possible_truths))
3032         estimate_edge_size_and_time (e, size,
3033                                      es->predicate ? NULL : min_size,
3034                                      time, REG_BR_PROB_BASE,
3035                                      known_vals, known_contexts, known_aggs,
3036                                      hints);
3037     }
3038 }
3039
3040 /* Default constructor for ipa call context.
3041    Memory alloction of known_vals, known_contexts
3042    and known_aggs vectors is owned by the caller, but can
3043    be release by ipa_call_context::release.
3044
3045    inline_param_summary is owned by the caller.  */
3046 ipa_call_context::ipa_call_context (cgraph_node *node,
3047                                     clause_t possible_truths,
3048                                     clause_t nonspec_possible_truths,
3049                                     vec<tree> known_vals,
3050                                     vec<ipa_polymorphic_call_context>
3051                                          known_contexts,
3052                                     vec<ipa_agg_value_set> known_aggs,
3053                                     vec<inline_param_summary>
3054                                          inline_param_summary)
3055 : m_node (node), m_possible_truths (possible_truths),
3056   m_nonspec_possible_truths (nonspec_possible_truths),
3057   m_inline_param_summary (inline_param_summary),
3058   m_known_vals (known_vals),
3059   m_known_contexts (known_contexts),
3060   m_known_aggs (known_aggs)
3061 {
3062 }
3063
3064 /* Set THIS to be a duplicate of CTX.  Copy all relevant info.  */
3065
3066 void
3067 ipa_call_context::duplicate_from (const ipa_call_context &ctx)
3068 {
3069   m_node = ctx.m_node;
3070   m_possible_truths = ctx.m_possible_truths;
3071   m_nonspec_possible_truths = ctx.m_nonspec_possible_truths;
3072   class ipa_node_params *params_summary = IPA_NODE_REF (m_node);
3073   unsigned int nargs = params_summary
3074                        ? ipa_get_param_count (params_summary) : 0;
3075
3076   m_inline_param_summary = vNULL;
3077   /* Copy the info only if there is at least one useful entry.  */
3078   if (ctx.m_inline_param_summary.exists ())
3079     {
3080       unsigned int n = MIN (ctx.m_inline_param_summary.length (), nargs);
3081
3082       for (unsigned int i = 0; i < n; i++)
3083         if (ipa_is_param_used_by_ipa_predicates (params_summary, i)
3084             && !ctx.m_inline_param_summary[i].useless_p ())
3085           {
3086             m_inline_param_summary
3087                     = ctx.m_inline_param_summary.copy ();
3088             break;
3089           }
3090     }
3091   m_known_vals = vNULL;
3092   if (ctx.m_known_vals.exists ())
3093     {
3094       unsigned int n = MIN (ctx.m_known_vals.length (), nargs);
3095
3096       for (unsigned int i = 0; i < n; i++)
3097         if (ipa_is_param_used_by_indirect_call (params_summary, i)
3098             && ctx.m_known_vals[i])
3099           {
3100             m_known_vals = ctx.m_known_vals.copy ();
3101             break;
3102           }
3103     }
3104
3105   m_known_contexts = vNULL;
3106   if (ctx.m_known_contexts.exists ())
3107     {
3108       unsigned int n = MIN (ctx.m_known_contexts.length (), nargs);
3109
3110       for (unsigned int i = 0; i < n; i++)
3111         if (ipa_is_param_used_by_polymorphic_call (params_summary, i)
3112             && !ctx.m_known_contexts[i].useless_p ())
3113           {
3114             m_known_contexts = ctx.m_known_contexts.copy ();
3115             break;
3116           }
3117     }
3118
3119   m_known_aggs = vNULL;
3120   if (ctx.m_known_aggs.exists ())
3121     {
3122       unsigned int n = MIN (ctx.m_known_aggs.length (), nargs);
3123
3124       for (unsigned int i = 0; i < n; i++)
3125         if (ipa_is_param_used_by_indirect_call (params_summary, i)
3126             && !ctx.m_known_aggs[i].is_empty ())
3127           {
3128             m_known_aggs = ipa_copy_agg_values (ctx.m_known_aggs);
3129             break;
3130           }
3131     }
3132 }
3133
3134 /* Release memory used by known_vals/contexts/aggs vectors.
3135    If ALL is true release also inline_param_summary.
3136    This happens when context was previously duplciated to be stored
3137    into cache.  */
3138
3139 void
3140 ipa_call_context::release (bool all)
3141 {
3142   /* See if context is initialized at first place.  */
3143   if (!m_node)
3144     return;
3145   m_known_vals.release ();
3146   m_known_contexts.release ();
3147   ipa_release_agg_values (m_known_aggs);
3148   if (all)
3149     m_inline_param_summary.release ();
3150 }
3151
3152 /* Return true if CTX describes the same call context as THIS.  */
3153
3154 bool
3155 ipa_call_context::equal_to (const ipa_call_context &ctx)
3156 {
3157   if (m_node != ctx.m_node
3158       || m_possible_truths != ctx.m_possible_truths
3159       || m_nonspec_possible_truths != ctx.m_nonspec_possible_truths)
3160     return false;
3161
3162   class ipa_node_params *params_summary = IPA_NODE_REF (m_node);
3163   unsigned int nargs = params_summary
3164                        ? ipa_get_param_count (params_summary) : 0;
3165
3166   if (m_inline_param_summary.exists () || ctx.m_inline_param_summary.exists ())
3167     {
3168       for (unsigned int i = 0; i < nargs; i++)
3169         {
3170           if (!ipa_is_param_used_by_ipa_predicates (params_summary, i))
3171             continue;
3172           if (i >= m_inline_param_summary.length ()
3173               || m_inline_param_summary[i].useless_p ())
3174             {
3175               if (i < ctx.m_inline_param_summary.length ()
3176                   && !ctx.m_inline_param_summary[i].useless_p ())
3177                 return false;
3178               continue;
3179             }
3180           if (i >= ctx.m_inline_param_summary.length ()
3181               || ctx.m_inline_param_summary[i].useless_p ())
3182             {
3183               if (i < m_inline_param_summary.length ()
3184                   && !m_inline_param_summary[i].useless_p ())
3185                 return false;
3186               continue;
3187             }
3188           if (!m_inline_param_summary[i].equal_to
3189                  (ctx.m_inline_param_summary[i]))
3190             return false;
3191         }
3192     }
3193   if (m_known_vals.exists () || ctx.m_known_vals.exists ())
3194     {
3195       for (unsigned int i = 0; i < nargs; i++)
3196         {
3197           if (!ipa_is_param_used_by_indirect_call (params_summary, i))
3198             continue;
3199           if (i >= m_known_vals.length () || !m_known_vals[i])
3200             {
3201               if (i < ctx.m_known_vals.length () && ctx.m_known_vals[i])
3202                 return false;
3203               continue;
3204             }
3205           if (i >= ctx.m_known_vals.length () || !ctx.m_known_vals[i])
3206             {
3207               if (i < m_known_vals.length () && m_known_vals[i])
3208                 return false;
3209               continue;
3210             }
3211           if (m_known_vals[i] != ctx.m_known_vals[i])
3212             return false;
3213         }
3214     }
3215   if (m_known_contexts.exists () || ctx.m_known_contexts.exists ())
3216     {
3217       for (unsigned int i = 0; i < nargs; i++)
3218         {
3219           if (!ipa_is_param_used_by_polymorphic_call (params_summary, i))
3220             continue;
3221           if (i >= m_known_contexts.length ()
3222               || m_known_contexts[i].useless_p ())
3223             {
3224               if (i < ctx.m_known_contexts.length ()
3225                   && !ctx.m_known_contexts[i].useless_p ())
3226                 return false;
3227               continue;
3228             }
3229           if (i >= ctx.m_known_contexts.length ()
3230               || ctx.m_known_contexts[i].useless_p ())
3231             {
3232               if (i < m_known_contexts.length ()
3233                   && !m_known_contexts[i].useless_p ())
3234                 return false;
3235               continue;
3236             }
3237           if (!m_known_contexts[i].equal_to
3238                  (ctx.m_known_contexts[i]))
3239             return false;
3240         }
3241     }
3242   if (m_known_aggs.exists () || ctx.m_known_aggs.exists ())
3243     {
3244       for (unsigned int i = 0; i < nargs; i++)
3245         {
3246           if (!ipa_is_param_used_by_indirect_call (params_summary, i))
3247             continue;
3248           if (i >= m_known_aggs.length () || m_known_aggs[i].is_empty ())
3249             {
3250               if (i < ctx.m_known_aggs.length ()
3251                   && !ctx.m_known_aggs[i].is_empty ())
3252                 return false;
3253               continue;
3254             }
3255           if (i >= ctx.m_known_aggs.length ()
3256               || ctx.m_known_aggs[i].is_empty ())
3257             {
3258               if (i < m_known_aggs.length ()
3259                   && !m_known_aggs[i].is_empty ())
3260                 return false;
3261               continue;
3262             }
3263           if (!m_known_aggs[i].equal_to (ctx.m_known_aggs[i]))
3264             return false;
3265         }
3266     }
3267   return true;
3268 }
3269
3270 /* Estimate size and time needed to execute call in the given context.
3271    Additionally detemine hints determined by the context.  Finally compute
3272    minimal size needed for the call that is independent on the call context and
3273    can be used for fast estimates.  Return the values in RET_SIZE,
3274    RET_MIN_SIZE, RET_TIME and RET_HINTS.  */
3275
3276 void
3277 ipa_call_context::estimate_size_and_time (int *ret_size,
3278                                           int *ret_min_size,
3279                                           sreal *ret_time,
3280                                           sreal *ret_nonspecialized_time,
3281                                           ipa_hints *ret_hints)
3282 {
3283   class ipa_fn_summary *info = ipa_fn_summaries->get (m_node);
3284   size_time_entry *e;
3285   int size = 0;
3286   sreal time = 0;
3287   int min_size = 0;
3288   ipa_hints hints = 0;
3289   int i;
3290
3291   if (dump_file && (dump_flags & TDF_DETAILS))
3292     {
3293       bool found = false;
3294       fprintf (dump_file, "   Estimating body: %s/%i\n"
3295                "   Known to be false: ", m_node->name (),
3296                m_node->order);
3297
3298       for (i = predicate::not_inlined_condition;
3299            i < (predicate::first_dynamic_condition
3300                 + (int) vec_safe_length (info->conds)); i++)
3301         if (!(m_possible_truths & (1 << i)))
3302           {
3303             if (found)
3304               fprintf (dump_file, ", ");
3305             found = true;
3306             dump_condition (dump_file, info->conds, i);
3307           }
3308     }
3309
3310   estimate_calls_size_and_time (m_node, &size, &min_size,
3311                                 ret_time ? &time : NULL,
3312                                 ret_hints ? &hints : NULL, m_possible_truths,
3313                                 m_known_vals, m_known_contexts, m_known_aggs);
3314
3315   sreal nonspecialized_time = time;
3316
3317   min_size += (*info->size_time_table)[0].size;
3318   for (i = 0; vec_safe_iterate (info->size_time_table, i, &e); i++)
3319     {
3320       bool exec = e->exec_predicate.evaluate (m_nonspec_possible_truths);
3321
3322       /* Because predicates are conservative, it can happen that nonconst is 1
3323          but exec is 0.  */
3324       if (exec)
3325         {
3326           bool nonconst = e->nonconst_predicate.evaluate (m_possible_truths);
3327
3328           gcc_checking_assert (e->time >= 0);
3329           gcc_checking_assert (time >= 0);
3330
3331           /* We compute specialized size only because size of nonspecialized
3332              copy is context independent.
3333
3334              The difference between nonspecialized execution and specialized is
3335              that nonspecialized is not going to have optimized out computations
3336              known to be constant in a specialized setting.  */
3337           if (nonconst)
3338             size += e->size;
3339           if (!ret_time)
3340             continue;
3341           nonspecialized_time += e->time;
3342           if (!nonconst)
3343             ;
3344           else if (!m_inline_param_summary.exists ())
3345             {
3346               if (nonconst)
3347                 time += e->time;
3348             }
3349           else
3350             {
3351               int prob = e->nonconst_predicate.probability
3352                                                (info->conds, m_possible_truths,
3353                                                 m_inline_param_summary);
3354               gcc_checking_assert (prob >= 0);
3355               gcc_checking_assert (prob <= REG_BR_PROB_BASE);
3356               if (prob == REG_BR_PROB_BASE)
3357                 time += e->time;
3358               else
3359                 time += e->time * prob / REG_BR_PROB_BASE;
3360             }
3361           gcc_checking_assert (time >= 0);
3362         }
3363      }
3364   gcc_checking_assert ((*info->size_time_table)[0].exec_predicate == true);
3365   gcc_checking_assert ((*info->size_time_table)[0].nonconst_predicate == true);
3366   gcc_checking_assert (min_size >= 0);
3367   gcc_checking_assert (size >= 0);
3368   gcc_checking_assert (time >= 0);
3369   /* nonspecialized_time should be always bigger than specialized time.
3370      Roundoff issues however may get into the way.  */
3371   gcc_checking_assert ((nonspecialized_time - time * 99 / 100) >= -1);
3372
3373   /* Roundoff issues may make specialized time bigger than nonspecialized
3374      time.  We do not really want that to happen because some heurstics
3375      may get confused by seeing negative speedups.  */
3376   if (time > nonspecialized_time)
3377     time = nonspecialized_time;
3378
3379   if (ret_hints)
3380     {
3381       if (info->loop_iterations
3382           && !info->loop_iterations->evaluate (m_possible_truths))
3383         hints |= INLINE_HINT_loop_iterations;
3384       if (info->loop_stride
3385           && !info->loop_stride->evaluate (m_possible_truths))
3386         hints |= INLINE_HINT_loop_stride;
3387       if (info->scc_no)
3388         hints |= INLINE_HINT_in_scc;
3389       if (DECL_DECLARED_INLINE_P (m_node->decl))
3390         hints |= INLINE_HINT_declared_inline;
3391     }
3392
3393   size = RDIV (size, ipa_fn_summary::size_scale);
3394   min_size = RDIV (min_size, ipa_fn_summary::size_scale);
3395
3396   if (dump_file && (dump_flags & TDF_DETAILS))
3397     fprintf (dump_file, "\n   size:%i time:%f nonspec time:%f\n", (int) size,
3398              time.to_double (), nonspecialized_time.to_double ());
3399   if (ret_time)
3400     *ret_time = time;
3401   if (ret_nonspecialized_time)
3402     *ret_nonspecialized_time = nonspecialized_time;
3403   if (ret_size)
3404     *ret_size = size;
3405   if (ret_min_size)
3406     *ret_min_size = min_size;
3407   if (ret_hints)
3408     *ret_hints = hints;
3409   return;
3410 }
3411
3412
3413 /* Estimate size and time needed to execute callee of EDGE assuming that
3414    parameters known to be constant at caller of EDGE are propagated.
3415    KNOWN_VALS and KNOWN_CONTEXTS are vectors of assumed known constant values
3416    and types for parameters.  */
3417
3418 void
3419 estimate_ipcp_clone_size_and_time (struct cgraph_node *node,
3420                                    vec<tree> known_vals,
3421                                    vec<ipa_polymorphic_call_context>
3422                                    known_contexts,
3423                                    vec<ipa_agg_value_set> known_aggs,
3424                                    int *ret_size, sreal *ret_time,
3425                                    sreal *ret_nonspec_time,
3426                                    ipa_hints *hints)
3427 {
3428   clause_t clause, nonspec_clause;
3429
3430   /* TODO: Also pass known value ranges.  */
3431   evaluate_conditions_for_known_args (node, false, known_vals, vNULL,
3432                                       known_aggs, &clause, &nonspec_clause);
3433   ipa_call_context ctx (node, clause, nonspec_clause,
3434                         known_vals, known_contexts,
3435                         known_aggs, vNULL);
3436   ctx.estimate_size_and_time (ret_size, NULL, ret_time,
3437                               ret_nonspec_time, hints);
3438 }
3439
3440 /* Return stack frame offset where frame of NODE is supposed to start inside
3441    of the function it is inlined to.
3442    Return 0 for functions that are not inlined.  */
3443
3444 HOST_WIDE_INT
3445 ipa_get_stack_frame_offset (struct cgraph_node *node)
3446 {
3447   HOST_WIDE_INT offset = 0;
3448   if (!node->inlined_to)
3449     return 0;
3450   node = node->callers->caller;
3451   while (true)
3452     {
3453       offset += ipa_size_summaries->get (node)->estimated_self_stack_size;
3454       if (!node->inlined_to)
3455         return offset;
3456       node = node->callers->caller;
3457     }
3458 }
3459
3460
3461 /* Update summary information of inline clones after inlining.
3462    Compute peak stack usage.  */
3463
3464 static void
3465 inline_update_callee_summaries (struct cgraph_node *node, int depth)
3466 {
3467   struct cgraph_edge *e;
3468
3469   ipa_propagate_frequency (node);
3470   for (e = node->callees; e; e = e->next_callee)
3471     {
3472       if (!e->inline_failed)
3473         inline_update_callee_summaries (e->callee, depth);
3474       else
3475         ipa_call_summaries->get (e)->loop_depth += depth;
3476     }
3477   for (e = node->indirect_calls; e; e = e->next_callee)
3478     ipa_call_summaries->get (e)->loop_depth += depth;
3479 }
3480
3481 /* Update change_prob of EDGE after INLINED_EDGE has been inlined.
3482    When function A is inlined in B and A calls C with parameter that
3483    changes with probability PROB1 and C is known to be passthroug
3484    of argument if B that change with probability PROB2, the probability
3485    of change is now PROB1*PROB2.  */
3486
3487 static void
3488 remap_edge_change_prob (struct cgraph_edge *inlined_edge,
3489                         struct cgraph_edge *edge)
3490 {
3491   if (ipa_node_params_sum)
3492     {
3493       int i;
3494       class ipa_edge_args *args = IPA_EDGE_REF (edge);
3495       if (!args)
3496         return;
3497       class ipa_call_summary *es = ipa_call_summaries->get (edge);
3498       class ipa_call_summary *inlined_es
3499         = ipa_call_summaries->get (inlined_edge);
3500
3501       if (es->param.length () == 0)
3502         return;
3503
3504       for (i = 0; i < ipa_get_cs_argument_count (args); i++)
3505         {
3506           struct ipa_jump_func *jfunc = ipa_get_ith_jump_func (args, i);
3507           if (jfunc->type == IPA_JF_PASS_THROUGH
3508               || jfunc->type == IPA_JF_ANCESTOR)
3509             {
3510               int id = jfunc->type == IPA_JF_PASS_THROUGH
3511                        ? ipa_get_jf_pass_through_formal_id (jfunc)
3512                        : ipa_get_jf_ancestor_formal_id (jfunc);
3513               if (id < (int) inlined_es->param.length ())
3514                 {
3515                   int prob1 = es->param[i].change_prob;
3516                   int prob2 = inlined_es->param[id].change_prob;
3517                   int prob = combine_probabilities (prob1, prob2);
3518
3519                   if (prob1 && prob2 && !prob)
3520                     prob = 1;
3521
3522                   es->param[i].change_prob = prob;
3523                 }
3524             }
3525         }
3526     }
3527 }
3528
3529 /* Update edge summaries of NODE after INLINED_EDGE has been inlined.
3530
3531    Remap predicates of callees of NODE.  Rest of arguments match
3532    remap_predicate.
3533
3534    Also update change probabilities.  */
3535
3536 static void
3537 remap_edge_summaries (struct cgraph_edge *inlined_edge,
3538                       struct cgraph_node *node,
3539                       class ipa_fn_summary *info,
3540                       class ipa_node_params *params_summary,
3541                       class ipa_fn_summary *callee_info,
3542                       vec<int> operand_map,
3543                       vec<int> offset_map,
3544                       clause_t possible_truths,
3545                       predicate *toplev_predicate)
3546 {
3547   struct cgraph_edge *e, *next;
3548   for (e = node->callees; e; e = next)
3549     {
3550       predicate p;
3551       next = e->next_callee;
3552
3553       if (e->inline_failed)
3554         {
3555           class ipa_call_summary *es = ipa_call_summaries->get (e);
3556           remap_edge_change_prob (inlined_edge, e);
3557
3558           if (es->predicate)
3559             {
3560               p = es->predicate->remap_after_inlining
3561                                      (info, params_summary,
3562                                       callee_info, operand_map,
3563                                       offset_map, possible_truths,
3564                                       *toplev_predicate);
3565               edge_set_predicate (e, &p);
3566             }
3567           else
3568             edge_set_predicate (e, toplev_predicate);
3569         }
3570       else
3571         remap_edge_summaries (inlined_edge, e->callee, info,
3572                               params_summary, callee_info,
3573                               operand_map, offset_map, possible_truths,
3574                               toplev_predicate);
3575     }
3576   for (e = node->indirect_calls; e; e = next)
3577     {
3578       class ipa_call_summary *es = ipa_call_summaries->get (e);
3579       predicate p;
3580       next = e->next_callee;
3581
3582       remap_edge_change_prob (inlined_edge, e);
3583       if (es->predicate)
3584         {
3585           p = es->predicate->remap_after_inlining
3586                                  (info, params_summary,
3587                                   callee_info, operand_map, offset_map,
3588                                   possible_truths, *toplev_predicate);
3589           edge_set_predicate (e, &p);
3590         }
3591       else
3592         edge_set_predicate (e, toplev_predicate);
3593     }
3594 }
3595
3596 /* Same as remap_predicate, but set result into hint *HINT.  */
3597
3598 static void
3599 remap_hint_predicate (class ipa_fn_summary *info,
3600                       class ipa_node_params *params_summary,
3601                       class ipa_fn_summary *callee_info,
3602                       predicate **hint,
3603                       vec<int> operand_map,
3604                       vec<int> offset_map,
3605                       clause_t possible_truths,
3606                       predicate *toplev_predicate)
3607 {
3608   predicate p;
3609
3610   if (!*hint)
3611     return;
3612   p = (*hint)->remap_after_inlining
3613                          (info, params_summary, callee_info,
3614                           operand_map, offset_map,
3615                           possible_truths, *toplev_predicate);
3616   if (p != false && p != true)
3617     {
3618       if (!*hint)
3619         set_hint_predicate (hint, p);
3620       else
3621         **hint &= p;
3622     }
3623 }
3624
3625 /* We inlined EDGE.  Update summary of the function we inlined into.  */
3626
3627 void
3628 ipa_merge_fn_summary_after_inlining (struct cgraph_edge *edge)
3629 {
3630   ipa_fn_summary *callee_info = ipa_fn_summaries->get (edge->callee);
3631   struct cgraph_node *to = (edge->caller->inlined_to
3632                             ? edge->caller->inlined_to : edge->caller);
3633   class ipa_fn_summary *info = ipa_fn_summaries->get (to);
3634   clause_t clause = 0;  /* not_inline is known to be false.  */
3635   size_time_entry *e;
3636   auto_vec<int, 8> operand_map;
3637   auto_vec<int, 8> offset_map;
3638   int i;
3639   predicate toplev_predicate;
3640   class ipa_call_summary *es = ipa_call_summaries->get (edge);
3641   class ipa_node_params *params_summary = (ipa_node_params_sum
3642                                            ? IPA_NODE_REF (to) : NULL);
3643
3644   if (es->predicate)
3645     toplev_predicate = *es->predicate;
3646   else
3647     toplev_predicate = true;
3648
3649   info->fp_expressions |= callee_info->fp_expressions;
3650
3651   if (callee_info->conds)
3652     evaluate_properties_for_edge (edge, true, &clause,
3653                                   NULL, NULL, NULL, NULL);
3654   if (ipa_node_params_sum && callee_info->conds)
3655     {
3656       class ipa_edge_args *args = IPA_EDGE_REF (edge);
3657       int count = args ? ipa_get_cs_argument_count (args) : 0;
3658       int i;
3659
3660       if (count)
3661         {
3662           operand_map.safe_grow_cleared (count);
3663           offset_map.safe_grow_cleared (count);
3664         }
3665       for (i = 0; i < count; i++)
3666         {
3667           struct ipa_jump_func *jfunc = ipa_get_ith_jump_func (args, i);
3668           int map = -1;
3669
3670           /* TODO: handle non-NOPs when merging.  */
3671           if (jfunc->type == IPA_JF_PASS_THROUGH)
3672             {
3673               if (ipa_get_jf_pass_through_operation (jfunc) == NOP_EXPR)
3674                 map = ipa_get_jf_pass_through_formal_id (jfunc);
3675               if (!ipa_get_jf_pass_through_agg_preserved (jfunc))
3676                 offset_map[i] = -1;
3677             }
3678           else if (jfunc->type == IPA_JF_ANCESTOR)
3679             {
3680               HOST_WIDE_INT offset = ipa_get_jf_ancestor_offset (jfunc);
3681               if (offset >= 0 && offset < INT_MAX)
3682                 {
3683                   map = ipa_get_jf_ancestor_formal_id (jfunc);
3684                   if (!ipa_get_jf_ancestor_agg_preserved (jfunc))
3685                     offset = -1;
3686                   offset_map[i] = offset;
3687                 }
3688             }
3689           operand_map[i] = map;
3690           gcc_assert (map < ipa_get_param_count (params_summary));
3691         }
3692     }
3693   sreal freq =  edge->sreal_frequency ();
3694   for (i = 0; vec_safe_iterate (callee_info->size_time_table, i, &e); i++)
3695     {
3696       predicate p;
3697       p = e->exec_predicate.remap_after_inlining
3698                              (info, params_summary,
3699                               callee_info, operand_map,
3700                               offset_map, clause,
3701                               toplev_predicate);
3702       predicate nonconstp;
3703       nonconstp = e->nonconst_predicate.remap_after_inlining
3704                                      (info, params_summary,
3705                                       callee_info, operand_map,
3706                                       offset_map, clause,
3707                                       toplev_predicate);
3708       if (p != false && nonconstp != false)
3709         {
3710           sreal add_time = ((sreal)e->time * freq);
3711           int prob = e->nonconst_predicate.probability (callee_info->conds,
3712                                                         clause, es->param);
3713           if (prob != REG_BR_PROB_BASE)
3714             add_time = add_time * prob / REG_BR_PROB_BASE;
3715           if (prob != REG_BR_PROB_BASE
3716               && dump_file && (dump_flags & TDF_DETAILS))
3717             {
3718               fprintf (dump_file, "\t\tScaling time by probability:%f\n",
3719                        (double) prob / REG_BR_PROB_BASE);
3720             }
3721           info->account_size_time (e->size, add_time, p, nonconstp);
3722         }
3723     }
3724   remap_edge_summaries (edge, edge->callee, info, params_summary,
3725                         callee_info, operand_map,
3726                         offset_map, clause, &toplev_predicate);
3727   remap_hint_predicate (info, params_summary, callee_info,
3728                         &callee_info->loop_iterations,
3729                         operand_map, offset_map, clause, &toplev_predicate);
3730   remap_hint_predicate (info, params_summary, callee_info,
3731                         &callee_info->loop_stride,
3732                         operand_map, offset_map, clause, &toplev_predicate);
3733
3734   HOST_WIDE_INT stack_frame_offset = ipa_get_stack_frame_offset (edge->callee);
3735   HOST_WIDE_INT peak = stack_frame_offset + callee_info->estimated_stack_size;
3736
3737   if (info->estimated_stack_size < peak)
3738     info->estimated_stack_size = peak;
3739
3740   inline_update_callee_summaries (edge->callee, es->loop_depth);
3741
3742   /* Free summaries that are not maintained for inline clones/edges.  */
3743   ipa_call_summaries->remove (edge);
3744   ipa_fn_summaries->remove (edge->callee);
3745   ipa_remove_from_growth_caches (edge);
3746 }
3747
3748 /* For performance reasons ipa_merge_fn_summary_after_inlining is not updating
3749    overall size and time.  Recompute it.  */
3750
3751 void
3752 ipa_update_overall_fn_summary (struct cgraph_node *node)
3753 {
3754   class ipa_fn_summary *info = ipa_fn_summaries->get (node);
3755   class ipa_size_summary *size_info = ipa_size_summaries->get (node);
3756   size_time_entry *e;
3757   int i;
3758
3759   size_info->size = 0;
3760   info->time = 0;
3761   for (i = 0; vec_safe_iterate (info->size_time_table, i, &e); i++)
3762     {
3763       size_info->size += e->size;
3764       info->time += e->time;
3765     }
3766   info->min_size = (*info->size_time_table)[0].size;
3767   estimate_calls_size_and_time (node, &size_info->size, &info->min_size,
3768                                 &info->time, NULL,
3769                                 ~(clause_t) (1 << predicate::false_condition),
3770                                 vNULL, vNULL, vNULL);
3771   size_info->size = RDIV (size_info->size, ipa_fn_summary::size_scale);
3772   info->min_size = RDIV (info->min_size, ipa_fn_summary::size_scale);
3773 }
3774
3775
3776 /* This function performs intraprocedural analysis in NODE that is required to
3777    inline indirect calls.  */
3778
3779 static void
3780 inline_indirect_intraprocedural_analysis (struct cgraph_node *node)
3781 {
3782   ipa_analyze_node (node);
3783   if (dump_file && (dump_flags & TDF_DETAILS))
3784     {
3785       ipa_print_node_params (dump_file, node);
3786       ipa_print_node_jump_functions (dump_file, node);
3787     }
3788 }
3789
3790
3791 /* Note function body size.  */
3792
3793 void
3794 inline_analyze_function (struct cgraph_node *node)
3795 {
3796   push_cfun (DECL_STRUCT_FUNCTION (node->decl));
3797
3798   if (dump_file)
3799     fprintf (dump_file, "\nAnalyzing function: %s/%u\n",
3800              node->name (), node->order);
3801   if (opt_for_fn (node->decl, optimize) && !node->thunk.thunk_p)
3802     inline_indirect_intraprocedural_analysis (node);
3803   compute_fn_summary (node, false);
3804   if (!optimize)
3805     {
3806       struct cgraph_edge *e;
3807       for (e = node->callees; e; e = e->next_callee)
3808         e->inline_failed = CIF_FUNCTION_NOT_OPTIMIZED;
3809       for (e = node->indirect_calls; e; e = e->next_callee)
3810         e->inline_failed = CIF_FUNCTION_NOT_OPTIMIZED;
3811     }
3812
3813   pop_cfun ();
3814 }
3815
3816
3817 /* Called when new function is inserted to callgraph late.  */
3818
3819 void
3820 ipa_fn_summary_t::insert (struct cgraph_node *node, ipa_fn_summary *)
3821 {
3822   inline_analyze_function (node);
3823 }
3824
3825 /* Note function body size.  */
3826
3827 static void
3828 ipa_fn_summary_generate (void)
3829 {
3830   struct cgraph_node *node;
3831
3832   FOR_EACH_DEFINED_FUNCTION (node)
3833     if (DECL_STRUCT_FUNCTION (node->decl))
3834       node->versionable = tree_versionable_function_p (node->decl);
3835
3836   ipa_fn_summary_alloc ();
3837
3838   ipa_fn_summaries->enable_insertion_hook ();
3839
3840   ipa_register_cgraph_hooks ();
3841
3842   FOR_EACH_DEFINED_FUNCTION (node)
3843     if (!node->alias
3844         && (flag_generate_lto || flag_generate_offload|| flag_wpa
3845             || opt_for_fn (node->decl, optimize)))
3846       inline_analyze_function (node);
3847 }
3848
3849
3850 /* Write inline summary for edge E to OB.  */
3851
3852 static void
3853 read_ipa_call_summary (class lto_input_block *ib, struct cgraph_edge *e,
3854                        bool prevails)
3855 {
3856   class ipa_call_summary *es = prevails
3857                                 ? ipa_call_summaries->get_create (e) : NULL;
3858   predicate p;
3859   int length, i;
3860
3861   int size = streamer_read_uhwi (ib);
3862   int time = streamer_read_uhwi (ib);
3863   int depth = streamer_read_uhwi (ib);
3864
3865   if (es)
3866     {
3867       es->call_stmt_size = size;
3868       es->call_stmt_time = time;
3869       es->loop_depth = depth;
3870     }
3871
3872   bitpack_d bp = streamer_read_bitpack (ib);
3873   if (es)
3874     es->is_return_callee_uncaptured = bp_unpack_value (&bp, 1);
3875   else
3876     bp_unpack_value (&bp, 1);
3877
3878   p.stream_in (ib);
3879   if (es)
3880     edge_set_predicate (e, &p);
3881   length = streamer_read_uhwi (ib);
3882   if (length && es && e->possibly_call_in_translation_unit_p ())
3883     {
3884       es->param.safe_grow_cleared (length);
3885       for (i = 0; i < length; i++)
3886         es->param[i].change_prob = streamer_read_uhwi (ib);
3887     }
3888   else
3889     {
3890       for (i = 0; i < length; i++)
3891         streamer_read_uhwi (ib);
3892     }
3893 }
3894
3895
3896 /* Stream in inline summaries from the section.  */
3897
3898 static void
3899 inline_read_section (struct lto_file_decl_data *file_data, const char *data,
3900                      size_t len)
3901 {
3902   const struct lto_function_header *header =
3903     (const struct lto_function_header *) data;
3904   const int cfg_offset = sizeof (struct lto_function_header);
3905   const int main_offset = cfg_offset + header->cfg_size;
3906   const int string_offset = main_offset + header->main_size;
3907   class data_in *data_in;
3908   unsigned int i, count2, j;
3909   unsigned int f_count;
3910
3911   lto_input_block ib ((const char *) data + main_offset, header->main_size,
3912                       file_data->mode_table);
3913
3914   data_in =
3915     lto_data_in_create (file_data, (const char *) data + string_offset,
3916                         header->string_size, vNULL);
3917   f_count = streamer_read_uhwi (&ib);
3918   for (i = 0; i < f_count; i++)
3919     {
3920       unsigned int index;
3921       struct cgraph_node *node;
3922       class ipa_fn_summary *info;
3923       class ipa_node_params *params_summary;
3924       class ipa_size_summary *size_info;
3925       lto_symtab_encoder_t encoder;
3926       struct bitpack_d bp;
3927       struct cgraph_edge *e;
3928       predicate p;
3929
3930       index = streamer_read_uhwi (&ib);
3931       encoder = file_data->symtab_node_encoder;
3932       node = dyn_cast<cgraph_node *> (lto_symtab_encoder_deref (encoder,
3933                                                                 index));
3934       info = node->prevailing_p () ? ipa_fn_summaries->get_create (node) : NULL;
3935       params_summary = node->prevailing_p () ? IPA_NODE_REF (node) : NULL;
3936       size_info = node->prevailing_p ()
3937                   ? ipa_size_summaries->get_create (node) : NULL;
3938
3939       int stack_size = streamer_read_uhwi (&ib);
3940       int size = streamer_read_uhwi (&ib);
3941       sreal time = sreal::stream_in (&ib);
3942
3943       if (info)
3944         {
3945           info->estimated_stack_size
3946             = size_info->estimated_self_stack_size = stack_size;
3947           size_info->size = size_info->self_size = size;
3948           info->time = time;
3949         }
3950
3951       bp = streamer_read_bitpack (&ib);
3952       if (info)
3953         {
3954           info->inlinable = bp_unpack_value (&bp, 1);
3955           info->fp_expressions = bp_unpack_value (&bp, 1);
3956         }
3957       else
3958         {
3959           bp_unpack_value (&bp, 1);
3960           bp_unpack_value (&bp, 1);
3961         }
3962
3963       count2 = streamer_read_uhwi (&ib);
3964       gcc_assert (!info || !info->conds);
3965       if (info)
3966         vec_safe_reserve_exact (info->conds, count2);
3967       for (j = 0; j < count2; j++)
3968         {
3969           struct condition c;
3970           unsigned int k, count3;
3971           c.operand_num = streamer_read_uhwi (&ib);
3972           c.code = (enum tree_code) streamer_read_uhwi (&ib);
3973           c.type = stream_read_tree (&ib, data_in);
3974           c.val = stream_read_tree (&ib, data_in);
3975           bp = streamer_read_bitpack (&ib);
3976           c.agg_contents = bp_unpack_value (&bp, 1);
3977           c.by_ref = bp_unpack_value (&bp, 1);
3978           if (c.agg_contents)
3979             c.offset = streamer_read_uhwi (&ib);
3980           count3 = streamer_read_uhwi (&ib);
3981           c.param_ops = NULL;
3982           if (info)
3983             vec_safe_reserve_exact (c.param_ops, count3);
3984           if (params_summary)
3985             ipa_set_param_used_by_ipa_predicates
3986                     (params_summary, c.operand_num, true);
3987           for (k = 0; k < count3; k++)
3988             {
3989               struct expr_eval_op op;
3990               enum gimple_rhs_class rhs_class;
3991               op.code = (enum tree_code) streamer_read_uhwi (&ib);
3992               op.type = stream_read_tree (&ib, data_in);
3993               switch (rhs_class = get_gimple_rhs_class (op.code))
3994                 {
3995                 case GIMPLE_UNARY_RHS:
3996                   op.index = 0;
3997                   op.val[0] = NULL_TREE;
3998                   op.val[1] = NULL_TREE;
3999                   break;
4000
4001                 case GIMPLE_BINARY_RHS:
4002                 case GIMPLE_TERNARY_RHS:
4003                   bp = streamer_read_bitpack (&ib);
4004                   op.index = bp_unpack_value (&bp, 2);
4005                   op.val[0] = stream_read_tree (&ib, data_in);
4006                   if (rhs_class == GIMPLE_BINARY_RHS)
4007                     op.val[1] = NULL_TREE;
4008                   else
4009                     op.val[1] = stream_read_tree (&ib, data_in);
4010                   break;
4011
4012                 default:
4013                   fatal_error (UNKNOWN_LOCATION,
4014                                "invalid fnsummary in LTO stream");
4015                 }
4016               if (info)
4017                 c.param_ops->quick_push (op);
4018             }
4019           if (info)
4020             info->conds->quick_push (c);
4021         }
4022       count2 = streamer_read_uhwi (&ib);
4023       gcc_assert (!info || !info->size_time_table);
4024       if (info && count2)
4025         vec_safe_reserve_exact (info->size_time_table, count2);
4026       for (j = 0; j < count2; j++)
4027         {
4028           class size_time_entry e;
4029
4030           e.size = streamer_read_uhwi (&ib);
4031           e.time = sreal::stream_in (&ib);
4032           e.exec_predicate.stream_in (&ib);
4033           e.nonconst_predicate.stream_in (&ib);
4034
4035           if (info)
4036             info->size_time_table->quick_push (e);
4037         }
4038
4039       p.stream_in (&ib);
4040       if (info)
4041         set_hint_predicate (&info->loop_iterations, p);
4042       p.stream_in (&ib);
4043       if (info)
4044         set_hint_predicate (&info->loop_stride, p);
4045       for (e = node->callees; e; e = e->next_callee)
4046         read_ipa_call_summary (&ib, e, info != NULL);
4047       for (e = node->indirect_calls; e; e = e->next_callee)
4048         read_ipa_call_summary (&ib, e, info != NULL);
4049     }
4050
4051   lto_free_section_data (file_data, LTO_section_ipa_fn_summary, NULL, data,
4052                          len);
4053   lto_data_in_delete (data_in);
4054 }
4055
4056
4057 /* Read inline summary.  Jump functions are shared among ipa-cp
4058    and inliner, so when ipa-cp is active, we don't need to write them
4059    twice.  */
4060
4061 static void
4062 ipa_fn_summary_read (void)
4063 {
4064   struct lto_file_decl_data **file_data_vec = lto_get_file_decl_data ();
4065   struct lto_file_decl_data *file_data;
4066   unsigned int j = 0;
4067
4068   ipa_fn_summary_alloc ();
4069
4070   while ((file_data = file_data_vec[j++]))
4071     {
4072       size_t len;
4073       const char *data
4074         = lto_get_summary_section_data (file_data, LTO_section_ipa_fn_summary,
4075                                         &len);
4076       if (data)
4077         inline_read_section (file_data, data, len);
4078       else
4079         /* Fatal error here.  We do not want to support compiling ltrans units
4080            with different version of compiler or different flags than the WPA
4081            unit, so this should never happen.  */
4082         fatal_error (input_location,
4083                      "ipa inline summary is missing in input file");
4084     }
4085   ipa_register_cgraph_hooks ();
4086   if (!flag_ipa_cp)
4087     ipa_prop_read_jump_functions ();
4088
4089   gcc_assert (ipa_fn_summaries);
4090   ipa_fn_summaries->enable_insertion_hook ();
4091 }
4092
4093
4094 /* Write inline summary for edge E to OB.  */
4095
4096 static void
4097 write_ipa_call_summary (struct output_block *ob, struct cgraph_edge *e)
4098 {
4099   class ipa_call_summary *es = ipa_call_summaries->get (e);
4100   int i;
4101
4102   streamer_write_uhwi (ob, es->call_stmt_size);
4103   streamer_write_uhwi (ob, es->call_stmt_time);
4104   streamer_write_uhwi (ob, es->loop_depth);
4105
4106   bitpack_d bp = bitpack_create (ob->main_stream);
4107   bp_pack_value (&bp, es->is_return_callee_uncaptured, 1);
4108   streamer_write_bitpack (&bp);
4109
4110   if (es->predicate)
4111     es->predicate->stream_out (ob);
4112   else
4113     streamer_write_uhwi (ob, 0);
4114   streamer_write_uhwi (ob, es->param.length ());
4115   for (i = 0; i < (int) es->param.length (); i++)
4116     streamer_write_uhwi (ob, es->param[i].change_prob);
4117 }
4118
4119
4120 /* Write inline summary for node in SET.
4121    Jump functions are shared among ipa-cp and inliner, so when ipa-cp is
4122    active, we don't need to write them twice.  */
4123
4124 static void
4125 ipa_fn_summary_write (void)
4126 {
4127   struct output_block *ob = create_output_block (LTO_section_ipa_fn_summary);
4128   lto_symtab_encoder_t encoder = ob->decl_state->symtab_node_encoder;
4129   unsigned int count = 0;
4130   int i;
4131
4132   for (i = 0; i < lto_symtab_encoder_size (encoder); i++)
4133     {
4134       symtab_node *snode = lto_symtab_encoder_deref (encoder, i);
4135       cgraph_node *cnode = dyn_cast <cgraph_node *> (snode);
4136       if (cnode && cnode->definition && !cnode->alias)
4137         count++;
4138     }
4139   streamer_write_uhwi (ob, count);
4140
4141   for (i = 0; i < lto_symtab_encoder_size (encoder); i++)
4142     {
4143       symtab_node *snode = lto_symtab_encoder_deref (encoder, i);
4144       cgraph_node *cnode = dyn_cast <cgraph_node *> (snode);
4145       if (cnode && cnode->definition && !cnode->alias)
4146         {
4147           class ipa_fn_summary *info = ipa_fn_summaries->get (cnode);
4148           class ipa_size_summary *size_info = ipa_size_summaries->get (cnode);
4149           struct bitpack_d bp;
4150           struct cgraph_edge *edge;
4151           int i;
4152           size_time_entry *e;
4153           struct condition *c;
4154
4155           streamer_write_uhwi (ob, lto_symtab_encoder_encode (encoder, cnode));
4156           streamer_write_hwi (ob, size_info->estimated_self_stack_size);
4157           streamer_write_hwi (ob, size_info->self_size);
4158           info->time.stream_out (ob);
4159           bp = bitpack_create (ob->main_stream);
4160           bp_pack_value (&bp, info->inlinable, 1);
4161           bp_pack_value (&bp, false, 1);
4162           bp_pack_value (&bp, info->fp_expressions, 1);
4163           streamer_write_bitpack (&bp);
4164           streamer_write_uhwi (ob, vec_safe_length (info->conds));
4165           for (i = 0; vec_safe_iterate (info->conds, i, &c); i++)
4166             {
4167               int j;
4168               struct expr_eval_op *op;
4169
4170               streamer_write_uhwi (ob, c->operand_num);
4171               streamer_write_uhwi (ob, c->code);
4172               stream_write_tree (ob, c->type, true);
4173               stream_write_tree (ob, c->val, true);
4174               bp = bitpack_create (ob->main_stream);
4175               bp_pack_value (&bp, c->agg_contents, 1);
4176               bp_pack_value (&bp, c->by_ref, 1);
4177               streamer_write_bitpack (&bp);
4178               if (c->agg_contents)
4179                 streamer_write_uhwi (ob, c->offset);
4180               streamer_write_uhwi (ob, vec_safe_length (c->param_ops));
4181               for (j = 0; vec_safe_iterate (c->param_ops, j, &op); j++)
4182                 {
4183                   streamer_write_uhwi (ob, op->code);
4184                   stream_write_tree (ob, op->type, true);
4185                   if (op->val[0])
4186                     {
4187                       bp = bitpack_create (ob->main_stream);
4188                       bp_pack_value (&bp, op->index, 2);
4189                       streamer_write_bitpack (&bp);
4190                       stream_write_tree (ob, op->val[0], true);
4191                       if (op->val[1])
4192                         stream_write_tree (ob, op->val[1], true);
4193                     }
4194                 }
4195             }
4196           streamer_write_uhwi (ob, vec_safe_length (info->size_time_table));
4197           for (i = 0; vec_safe_iterate (info->size_time_table, i, &e); i++)
4198             {
4199               streamer_write_uhwi (ob, e->size);
4200               e->time.stream_out (ob);
4201               e->exec_predicate.stream_out (ob);
4202               e->nonconst_predicate.stream_out (ob);
4203             }
4204           if (info->loop_iterations)
4205             info->loop_iterations->stream_out (ob);
4206           else
4207             streamer_write_uhwi (ob, 0);
4208           if (info->loop_stride)
4209             info->loop_stride->stream_out (ob);
4210           else
4211             streamer_write_uhwi (ob, 0);
4212           for (edge = cnode->callees; edge; edge = edge->next_callee)
4213             write_ipa_call_summary (ob, edge);
4214           for (edge = cnode->indirect_calls; edge; edge = edge->next_callee)
4215             write_ipa_call_summary (ob, edge);
4216         }
4217     }
4218   streamer_write_char_stream (ob->main_stream, 0);
4219   produce_asm (ob, NULL);
4220   destroy_output_block (ob);
4221
4222   if (!flag_ipa_cp)
4223     ipa_prop_write_jump_functions ();
4224 }
4225
4226
4227 /* Release function summary.  */
4228
4229 void
4230 ipa_free_fn_summary (void)
4231 {
4232   if (!ipa_call_summaries)
4233     return;
4234   ggc_delete (ipa_fn_summaries);
4235   ipa_fn_summaries = NULL;
4236   delete ipa_call_summaries;
4237   ipa_call_summaries = NULL;
4238   edge_predicate_pool.release ();
4239   /* During IPA this is one of largest datastructures to release.  */
4240   if (flag_wpa)
4241     ggc_trim ();
4242 }
4243
4244 /* Release function summary.  */
4245
4246 void
4247 ipa_free_size_summary (void)
4248 {
4249   if (!ipa_size_summaries)
4250     return;
4251   delete ipa_size_summaries;
4252   ipa_size_summaries = NULL;
4253 }
4254
4255 namespace {
4256
4257 const pass_data pass_data_local_fn_summary =
4258 {
4259   GIMPLE_PASS, /* type */
4260   "local-fnsummary", /* name */
4261   OPTGROUP_INLINE, /* optinfo_flags */
4262   TV_INLINE_PARAMETERS, /* tv_id */
4263   0, /* properties_required */
4264   0, /* properties_provided */
4265   0, /* properties_destroyed */
4266   0, /* todo_flags_start */
4267   0, /* todo_flags_finish */
4268 };
4269
4270 class pass_local_fn_summary : public gimple_opt_pass
4271 {
4272 public:
4273   pass_local_fn_summary (gcc::context *ctxt)
4274     : gimple_opt_pass (pass_data_local_fn_summary, ctxt)
4275   {}
4276
4277   /* opt_pass methods: */
4278   opt_pass * clone () { return new pass_local_fn_summary (m_ctxt); }
4279   virtual unsigned int execute (function *)
4280     {
4281       return compute_fn_summary_for_current ();
4282     }
4283
4284 }; // class pass_local_fn_summary
4285
4286 } // anon namespace
4287
4288 gimple_opt_pass *
4289 make_pass_local_fn_summary (gcc::context *ctxt)
4290 {
4291   return new pass_local_fn_summary (ctxt);
4292 }
4293
4294
4295 /* Free inline summary.  */
4296
4297 namespace {
4298
4299 const pass_data pass_data_ipa_free_fn_summary =
4300 {
4301   SIMPLE_IPA_PASS, /* type */
4302   "free-fnsummary", /* name */
4303   OPTGROUP_NONE, /* optinfo_flags */
4304   TV_IPA_FREE_INLINE_SUMMARY, /* tv_id */
4305   0, /* properties_required */
4306   0, /* properties_provided */
4307   0, /* properties_destroyed */
4308   0, /* todo_flags_start */
4309   0, /* todo_flags_finish */
4310 };
4311
4312 class pass_ipa_free_fn_summary : public simple_ipa_opt_pass
4313 {
4314 public:
4315   pass_ipa_free_fn_summary (gcc::context *ctxt)
4316     : simple_ipa_opt_pass (pass_data_ipa_free_fn_summary, ctxt),
4317       small_p (false)
4318   {}
4319
4320   /* opt_pass methods: */
4321   opt_pass *clone () { return new pass_ipa_free_fn_summary (m_ctxt); }
4322   void set_pass_param (unsigned int n, bool param)
4323     {
4324       gcc_assert (n == 0);
4325       small_p = param;
4326     }
4327   virtual bool gate (function *) { return true; }
4328   virtual unsigned int execute (function *)
4329     {
4330       ipa_free_fn_summary ();
4331       if (!flag_wpa)
4332         ipa_free_size_summary ();
4333       return 0;
4334     }
4335
4336 private:
4337   bool small_p;
4338 }; // class pass_ipa_free_fn_summary
4339
4340 } // anon namespace
4341
4342 simple_ipa_opt_pass *
4343 make_pass_ipa_free_fn_summary (gcc::context *ctxt)
4344 {
4345   return new pass_ipa_free_fn_summary (ctxt);
4346 }
4347
4348 namespace {
4349
4350 const pass_data pass_data_ipa_fn_summary =
4351 {
4352   IPA_PASS, /* type */
4353   "fnsummary", /* name */
4354   OPTGROUP_INLINE, /* optinfo_flags */
4355   TV_IPA_FNSUMMARY, /* tv_id */
4356   0, /* properties_required */
4357   0, /* properties_provided */
4358   0, /* properties_destroyed */
4359   0, /* todo_flags_start */
4360   ( TODO_dump_symtab ), /* todo_flags_finish */
4361 };
4362
4363 class pass_ipa_fn_summary : public ipa_opt_pass_d
4364 {
4365 public:
4366   pass_ipa_fn_summary (gcc::context *ctxt)
4367     : ipa_opt_pass_d (pass_data_ipa_fn_summary, ctxt,
4368                       ipa_fn_summary_generate, /* generate_summary */
4369                       ipa_fn_summary_write, /* write_summary */
4370                       ipa_fn_summary_read, /* read_summary */
4371                       NULL, /* write_optimization_summary */
4372                       NULL, /* read_optimization_summary */
4373                       NULL, /* stmt_fixup */
4374                       0, /* function_transform_todo_flags_start */
4375                       NULL, /* function_transform */
4376                       NULL) /* variable_transform */
4377   {}
4378
4379   /* opt_pass methods: */
4380   virtual unsigned int execute (function *) { return 0; }
4381
4382 }; // class pass_ipa_fn_summary
4383
4384 } // anon namespace
4385
4386 ipa_opt_pass_d *
4387 make_pass_ipa_fn_summary (gcc::context *ctxt)
4388 {
4389   return new pass_ipa_fn_summary (ctxt);
4390 }
4391
4392 /* Reset all state within ipa-fnsummary.c so that we can rerun the compiler
4393    within the same process.  For use by toplev::finalize.  */
4394
4395 void
4396 ipa_fnsummary_c_finalize (void)
4397 {
4398   ipa_free_fn_summary ();
4399 }