gcc/ipa-fnsummary.cc

   1 /* Function summary pass.
   2    Copyright (C) 2003-2024 Free Software Foundation, Inc.
   3    Contributed by Jan Hubicka
   4
   5 This file is part of GCC.
   6
   7 GCC is free software; you can redistribute it and/or modify it under
   8 the terms of the GNU General Public License as published by the Free
   9 Software Foundation; either version 3, or (at your option) any later
  10 version.
  11
  12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  14 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  15 for more details.
  16
  17 You should have received a copy of the GNU General Public License
  18 along with GCC; see the file COPYING3.  If not see
  19 <http://www.gnu.org/licenses/>.  */
  20
  21 /* Analysis of function bodies used by inter-procedural passes
  22
  23    We estimate for each function
  24      - function body size and size after specializing into given context
  25      - average function execution time in a given context
  26      - function frame size
  27    For each call
  28      - call statement size, time and how often the parameters change
  29
  30    ipa_fn_summary data structures store above information locally (i.e.
  31    parameters of the function itself) and globally (i.e. parameters of
  32    the function created by applying all the inline decisions already
  33    present in the callgraph).
  34
  35    We provide access to the ipa_fn_summary data structure and
  36    basic logic updating the parameters when inlining is performed.
  37
  38    The summaries are context sensitive.  Context means
  39      1) partial assignment of known constant values of operands
  40      2) whether function is inlined into the call or not.
  41    It is easy to add more variants.  To represent function size and time
  42    that depends on context (i.e. it is known to be optimized away when
  43    context is known either by inlining or from IP-CP and cloning),
  44    we use predicates.
  45
  46    estimate_edge_size_and_time can be used to query
  47    function size/time in the given context.  ipa_merge_fn_summary_after_inlining merges
  48    properties of caller and callee after inlining.
  49
  50    Finally pass_inline_parameters is exported.  This is used to drive
  51    computation of function parameters used by the early inliner.  The IPA
  52    inliner performs analysis via its analyze_function method.  */
  53
  54 #include "config.h"
  55 #define INCLUDE_VECTOR
  56 #include "system.h"
  57 #include "coretypes.h"
  58 #include "backend.h"
  59 #include "target.h"
  60 #include "tree.h"
  61 #include "gimple.h"
  62 #include "alloc-pool.h"
  63 #include "tree-pass.h"
  64 #include "ssa.h"
  65 #include "tree-streamer.h"
  66 #include "cgraph.h"
  67 #include "diagnostic.h"
  68 #include "fold-const.h"
  69 #include "print-tree.h"
  70 #include "tree-inline.h"
  71 #include "gimple-pretty-print.h"
  72 #include "cfganal.h"
  73 #include "gimple-iterator.h"
  74 #include "tree-cfg.h"
  75 #include "tree-ssa-loop-niter.h"
  76 #include "tree-ssa-loop.h"
  77 #include "symbol-summary.h"
  78 #include "sreal.h"
  79 #include "ipa-cp.h"
  80 #include "ipa-prop.h"
  81 #include "ipa-fnsummary.h"
  82 #include "cfgloop.h"
  83 #include "tree-scalar-evolution.h"
  84 #include "ipa-utils.h"
  85 #include "cfgexpand.h"
  86 #include "gimplify.h"
  87 #include "stringpool.h"
  88 #include "attribs.h"
  89 #include "tree-into-ssa.h"
  90 #include "symtab-clones.h"
  91 #include "gimple-range.h"
  92 #include "tree-dfa.h"
  93
  94 /* Summaries.  All three tables are created together by
        ipa_fn_summary_alloc: the per-function summaries are GC allocated
        (va_gc), while the per-function size summaries and the per-call-edge
        summaries are heap allocated (va_heap).  */
  95 fast_function_summary <ipa_fn_summary *, va_gc> *ipa_fn_summaries;
  96 fast_function_summary <ipa_size_summary *, va_heap> *ipa_size_summaries;
  97 fast_call_summary <ipa_call_summary *, va_heap> *ipa_call_summaries;
  98
  99 /* Edge predicates go here.  The pool also backs the predicates of loop
        hints, which are allocated and released through set_hint_predicate.  */
 100 static object_allocator<ipa_predicate> edge_predicate_pool ("edge predicates");
 101
 102
 103 /* Dump IPA hints.  */
 104 void
 105 ipa_dump_hints (FILE *f, ipa_hints hints)
 106 {
 107   if (!hints)
 108     return;
 109   fprintf (f, "IPA hints:");
 110   if (hints & INLINE_HINT_indirect_call)
 111     {
 112       hints &= ~INLINE_HINT_indirect_call;
 113       fprintf (f, " indirect_call");
 114     }
 115   if (hints & INLINE_HINT_loop_iterations)
 116     {
 117       hints &= ~INLINE_HINT_loop_iterations;
 118       fprintf (f, " loop_iterations");
 119     }
 120   if (hints & INLINE_HINT_loop_stride)
 121     {
 122       hints &= ~INLINE_HINT_loop_stride;
 123       fprintf (f, " loop_stride");
 124     }
 125   if (hints & INLINE_HINT_same_scc)
 126     {
 127       hints &= ~INLINE_HINT_same_scc;
 128       fprintf (f, " same_scc");
 129     }
 130   if (hints & INLINE_HINT_in_scc)
 131     {
 132       hints &= ~INLINE_HINT_in_scc;
 133       fprintf (f, " in_scc");
 134     }
 135   if (hints & INLINE_HINT_cross_module)
 136     {
 137       hints &= ~INLINE_HINT_cross_module;
 138       fprintf (f, " cross_module");
 139     }
 140   if (hints & INLINE_HINT_declared_inline)
 141     {
 142       hints &= ~INLINE_HINT_declared_inline;
 143       fprintf (f, " declared_inline");
 144     }
 145   if (hints & INLINE_HINT_known_hot)
 146     {
 147       hints &= ~INLINE_HINT_known_hot;
 148       fprintf (f, " known_hot");
 149     }
 150   if (hints & INLINE_HINT_builtin_constant_p)
 151     {
 152       hints &= ~INLINE_HINT_builtin_constant_p;
 153       fprintf (f, " builtin_constant_p");
 154     }
 155   gcc_assert (!hints);
 156 }
 157
 158
 159 /* Record SIZE and TIME to SUMMARY.
 160    The accounted code will be executed when EXEC_PRED is true.
 161    When NONCONST_PRED is false the code will evaluate to constant and
 162    will get optimized out in specialized clones of the function.
 163    If CALL is true account to call_size_time_table rather than
 164    size_time_table.   */
 165
 166 void
 167 ipa_fn_summary::account_size_time (int size, sreal time,
 168                                    const ipa_predicate &exec_pred,
 169                                    const ipa_predicate &nonconst_pred_in,
 170                                    bool call)
 171 {
 172   size_time_entry *e;
 173   bool found = false;
 174   int i;
 175   ipa_predicate nonconst_pred;
 176   vec<size_time_entry> *table = call ? &call_size_time_table : &size_time_table;
 177
 178   if (exec_pred == false)
 179     return;
 180
 181   nonconst_pred = nonconst_pred_in & exec_pred;
 182
 183   if (nonconst_pred == false)
 184     return;
 185
 186   /* We need to create initial empty unconditional clause, but otherwise
 187      we don't need to account empty times and sizes.  */
 188   if (!size && time == 0 && table->length ())
 189     return;
 190
 191   /* Only for calls we are unaccounting what we previously recorded.  */
 192   gcc_checking_assert (time >= 0 || call);
 193
 194   for (i = 0; table->iterate (i, &e); i++)
 195     if (e->exec_predicate == exec_pred
 196         && e->nonconst_predicate == nonconst_pred)
 197       {
 198         found = true;
 199         break;
 200       }
 201   if (i == max_size_time_table_size)
 202     {
 203       i = 0;
 204       found = true;
 205       e = &(*table)[0];
 206       if (dump_file && (dump_flags & TDF_DETAILS))
 207         fprintf (dump_file,
 208                  "\t\tReached limit on number of entries, "
 209                  "ignoring the predicate.");
 210     }
 211   if (dump_file && (dump_flags & TDF_DETAILS) && (time != 0 || size))
 212     {
 213       fprintf (dump_file,
 214                "\t\tAccounting size:%3.2f, time:%3.2f on %spredicate exec:",
 215                ((double) size) / ipa_fn_summary::size_scale,
 216                (time.to_double ()), found ? "" : "new ");
 217       exec_pred.dump (dump_file, conds, 0);
 218       if (exec_pred != nonconst_pred)
 219         {
 220           fprintf (dump_file, " nonconst:");
 221           nonconst_pred.dump (dump_file, conds);
 222         }
 223       else
 224         fprintf (dump_file, "\n");
 225     }
 226   if (!found)
 227     {
 228       class size_time_entry new_entry;
 229       new_entry.size = size;
 230       new_entry.time = time;
 231       new_entry.exec_predicate = exec_pred;
 232       new_entry.nonconst_predicate = nonconst_pred;
 233       if (call)
 234         call_size_time_table.safe_push (new_entry);
 235       else
 236         size_time_table.safe_push (new_entry);
 237     }
 238   else
 239     {
 240       e->size += size;
 241       e->time += time;
 242       /* FIXME: PR bootstrap/92653 gcc_checking_assert (e->time >= -1); */
 243       /* Tolerate small roundoff issues.  */
 244       if (e->time < 0)
 245         e->time = 0;
 246     }
 247 }
 248
 249 /* We proved E to be unreachable, redirect it to __builtin_unreachable.  */
 250
 251 static struct cgraph_edge *
 252 redirect_to_unreachable (struct cgraph_edge *e)
 253 {
 254   struct cgraph_node *callee = !e->inline_failed ? e->callee : NULL;
 255   struct cgraph_node *target
 256     = cgraph_node::get_create (builtin_decl_unreachable ());
 257
 258   if (e->speculative)
 259     e = cgraph_edge::resolve_speculation (e, target->decl);
 260   else if (!e->callee)
 261     e = cgraph_edge::make_direct (e, target);
 262   else
 263     e->redirect_callee (target);
 264   class ipa_call_summary *es = ipa_call_summaries->get (e);
 265   e->inline_failed = CIF_UNREACHABLE;
 266   e->count = profile_count::zero ();
 267   es->call_stmt_size = 0;
 268   es->call_stmt_time = 0;
 269   if (callee)
 270     callee->remove_symbol_and_inline_clones ();
 271   return e;
 272 }
 273
 274 /* Set predicate for edge E.  */
 275
 276 static void
 277 edge_set_predicate (struct cgraph_edge *e, ipa_predicate *predicate)
 278 {
 279   /* If the edge is determined to be never executed, redirect it
 280      to BUILTIN_UNREACHABLE to make it clear to IPA passes the call will
 281      be optimized out.  */
 282   if (predicate && *predicate == false
 283       /* When handling speculative edges, we need to do the redirection
 284          just once.  Do it always on the direct edge, so we do not
 285          attempt to resolve speculation while duplicating the edge.  */
 286       && (!e->speculative || e->callee))
 287     e = redirect_to_unreachable (e);
 288
 289   class ipa_call_summary *es = ipa_call_summaries->get (e);
 290   if (predicate && *predicate != true)
 291     {
 292       if (!es->predicate)
 293         es->predicate = edge_predicate_pool.allocate ();
 294       *es->predicate = *predicate;
 295     }
 296   else
 297     {
 298       if (es->predicate)
 299         edge_predicate_pool.remove (es->predicate);
 300       es->predicate = NULL;
 301     }
 302 }
 303
 304 /* Set predicate for hint *P.  */
 305
 306 static void
 307 set_hint_predicate (ipa_predicate **p, ipa_predicate new_predicate)
 308 {
 309   if (new_predicate == false || new_predicate == true)
 310     {
 311       if (*p)
 312         edge_predicate_pool.remove (*p);
 313       *p = NULL;
 314     }
 315   else
 316     {
 317       if (!*p)
 318         *p = edge_predicate_pool.allocate ();
 319       **p = new_predicate;
 320     }
 321 }
 322
 323 /* Find if NEW_PREDICATE is already in V and if so, increment its freq.
 324    Otherwise add a new item to the vector with this predicate and frerq equal
 325    to add_freq, unless the number of predicates would exceed MAX_NUM_PREDICATES
 326    in which case the function does nothing.  */
 327
 328 static void
 329 add_freqcounting_predicate (vec<ipa_freqcounting_predicate, va_gc> **v,
 330                             const ipa_predicate &new_predicate, sreal add_freq,
 331                             unsigned max_num_predicates)
 332 {
 333   if (new_predicate == false || new_predicate == true)
 334     return;
 335   ipa_freqcounting_predicate *f;
 336   for (int i = 0; vec_safe_iterate (*v, i, &f); i++)
 337     if (new_predicate == f->predicate)
 338       {
 339         f->freq += add_freq;
 340         return;
 341       }
 342   if (vec_safe_length (*v) >= max_num_predicates)
 343     /* Too many different predicates to account for.  */
 344     return;
 345
 346   ipa_freqcounting_predicate fcp;
 347   fcp.predicate = NULL;
 348   set_hint_predicate (&fcp.predicate, new_predicate);
 349   fcp.freq = add_freq;
 350   vec_safe_push (*v, fcp);
 351   return;
 352 }
 353
 354 /* Compute what conditions may or may not hold given information about
 355    parameters.  RET_CLAUSE returns truths that may hold in a specialized copy,
 356    while RET_NONSPEC_CLAUSE returns truths that may hold in an nonspecialized
 357    copy when called in a given context.  It is a bitmask of conditions. Bit
 358    0 means that condition is known to be false, while bit 1 means that condition
 359    may or may not be true.  These differ - for example NOT_INLINED condition
 360    is always false in the second and also builtin_constant_p tests cannot use
 361    the fact that parameter is indeed a constant.
 362
 363    When INLINE_P is true, assume that we are inlining.  AVAL contains known
 364    information about argument values.  The function does not modify its content
 365    and so AVALs could also be of type ipa_call_arg_values but so far all
 366    callers work with the auto version and so we avoid the conversion for
 367    convenience.
 368
 369    ERROR_MARK value of an argument means compile time invariant.

        NODE is the function whose conditions (taken from its ipa_fn_summary)
        are evaluated.  ES, when non-NULL, is a call summary; it is consulted
        only for not_sra_candidate conditions.  RET_CLAUSE is always written,
        RET_NONSPEC_CLAUSE only when it is non-NULL.

        NOTE(review): as implemented below, the not_inlined_condition bit is
        always set in the nonspecialized clause and is set in the specialized
        clause exactly when INLINE_P is false; the sentence about NOT_INLINED
        above should be checked against this.  */
 370
 371 static void
 372 evaluate_conditions_for_known_args (struct cgraph_node *node,
 373                                     bool inline_p,
 374                                     ipa_auto_call_arg_values *avals,
 375                                     clause_t *ret_clause,
 376                                     clause_t *ret_nonspec_clause,
 377                                     ipa_call_summary *es)
 378 {
 379   clause_t clause = inline_p ? 0 : 1 << ipa_predicate::not_inlined_condition;
 380   clause_t nonspec_clause = 1 << ipa_predicate::not_inlined_condition;
 381   class ipa_fn_summary *info = ipa_fn_summaries->get (node);
 382   int i;
 383   struct condition *c;
 384
       /* Condition number I is represented by bit
          I + ipa_predicate::first_dynamic_condition of both clauses.  An
          iteration that leaves via `continue' without setting a bit has
          proved the condition false for the corresponding copy.  */
 385   for (i = 0; vec_safe_iterate (info->conds, i, &c); i++)
 386     {
 387       tree val = NULL;
 388       tree res;
 389       int j;
 390       struct expr_eval_op *op;
 391
           /* not_sra_candidate is always possible in the nonspecialized
              copy.  In the specialized copy it is ruled out only when
              inlining and ES records that the operand points to a possible
              SRA candidate.  */
 392       if (c->code == ipa_predicate::not_sra_candidate)
 393         {
 394           if (!inline_p
 395               || !es
 396               || (int)es->param.length () <= c->operand_num
 397               || !es->param[c->operand_num].points_to_possible_sra_candidate)
 398             clause |= 1 << (i + ipa_predicate::first_dynamic_condition);
 399           nonspec_clause |= 1 << (i + ipa_predicate::first_dynamic_condition);
 400           continue;
 401         }
 402
           /* Find the known value VAL the condition is about, if any.  For
              conditions on aggregate contents look first into the known
              scalar value of the operand and then into the known aggregate
              values.  */
 403       if (c->agg_contents)
 404         {
               /* A by-value aggregate whose argument is marked invariant
                  (error_mark_node) did not change: the condition is false in
                  both copies.  */
 405           if (c->code == ipa_predicate::changed
 406               && !c->by_ref
 407               && (avals->safe_sval_at(c->operand_num) == error_mark_node))
 408             continue;
 409
 410           if (tree sval = avals->safe_sval_at (c->operand_num))
 411             val = ipa_find_agg_cst_from_init (sval, c->offset, c->by_ref);
 412           if (!val)
 413             {
 414               ipa_argagg_value_list avs (avals);
 415               val = avs.get_value (c->operand_num, c->offset / BITS_PER_UNIT,
 416                                    c->by_ref);
 417             }
 418         }
 419       else
 420         {
 421           val = avals->safe_sval_at (c->operand_num);
               /* The invariant marker is a usable "value" only for `changed'
                  conditions; for everything else it means no value is
                  known.  */
 422           if (val && val == error_mark_node
 423               && c->code != ipa_predicate::changed)
 424             val = NULL_TREE;
 425         }
 426
           /* Nothing is known about the operand: `changed' and
              `is_not_constant' may hold in both copies.  */
 427       if (!val
 428           && (c->code == ipa_predicate::changed
 429               || c->code == ipa_predicate::is_not_constant))
 430         {
 431           clause |= 1 << (i + ipa_predicate::first_dynamic_condition);
 432           nonspec_clause |= 1 << (i + ipa_predicate::first_dynamic_condition);
 433           continue;
 434         }
           /* Here VAL is known, so the two conditions below are false in the
              specialized copy; the nonspecialized copy cannot rely on the
              value and keeps them as possibly true.  */
 435       if (c->code == ipa_predicate::changed)
 436         {
 437           nonspec_clause |= 1 << (i + ipa_predicate::first_dynamic_condition);
 438           continue;
 439         }
 440
 441       if (c->code == ipa_predicate::is_not_constant)
 442         {
 443           nonspec_clause |= 1 << (i + ipa_predicate::first_dynamic_condition);
 444           continue;
 445         }
 446
           /* Try to decide the comparison by folding: view-convert VAL to the
              type of the condition (only when the sizes agree), apply the
              recorded operations in order and compare the result with
              C->val.  A failed fold leaves VAL NULL and the condition
              undecided.  */
 447       if (val && TYPE_SIZE (c->type) == TYPE_SIZE (TREE_TYPE (val)))
 448         {
 449           if (c->type != TREE_TYPE (val))
 450             val = fold_unary (VIEW_CONVERT_EXPR, c->type, val);
 451           for (j = 0; vec_safe_iterate (c->param_ops, j, &op); j++)
 452             {
 453               if (!val)
 454                 break;
                   /* OP->index selects the operand position taken by the
                      value computed so far; OP->val[] supply the others.  */
 455               if (!op->val[0])
 456                 val = fold_unary (op->code, op->type, val);
 457               else if (!op->val[1])
 458                 val = fold_binary (op->code, op->type,
 459                                    op->index ? op->val[0] : val,
 460                                    op->index ? val : op->val[0]);
 461               else if (op->index == 0)
 462                 val = fold_ternary (op->code, op->type,
 463                                     val, op->val[0], op->val[1]);
 464               else if (op->index == 1)
 465                 val = fold_ternary (op->code, op->type,
 466                                     op->val[0], val, op->val[1]);
 467               else if (op->index == 2)
 468                 val = fold_ternary (op->code, op->type,
 469                                     op->val[0], op->val[1], val);
 470               else
 471                 val = NULL_TREE;
 472             }
 473
 474           res = val
 475             ? fold_binary_to_constant (c->code, boolean_type_node, val, c->val)
 476             : NULL;
 477
               /* Folded to zero: the condition is false in both copies.  */
 478           if (res && integer_zerop (res))
 479             continue;
               /* Folded to one: the condition holds in both copies.  */
 480           if (res && integer_onep (res))
 481             {
 482               clause |= 1 << (i + ipa_predicate::first_dynamic_condition);
 483               nonspec_clause
 484                 |= 1 << (i + ipa_predicate::first_dynamic_condition);
 485               continue;
 486             }
 487         }
           /* Folding did not decide the condition.  For a non-aggregate
              operand without a known integer constant, try to disprove the
              condition from the known value range instead.  */
 488       if (c->operand_num < (int) avals->m_known_value_ranges.length ()
 489           && !c->agg_contents
 490           && (!val || TREE_CODE (val) != INTEGER_CST))
 491         {
 492           Value_Range vr (avals->m_known_value_ranges[c->operand_num]);
 493           if (!vr.undefined_p ()
 494               && !vr.varying_p ()
 495               && (TYPE_SIZE (c->type) == TYPE_SIZE (vr.type ())))
 496             {
 497               if (!useless_type_conversion_p (c->type, vr.type ()))
 498                 range_cast (vr, c->type);
 499
                   /* Propagate the range through the recorded operations.
                      Only unary and binary operations are handled; anything
                      else, or an unsupported operation, yields a varying
                      range, which stops the walk.  */
 500               for (j = 0; vec_safe_iterate (c->param_ops, j, &op); j++)
 501                 {
 502                   if (vr.varying_p () || vr.undefined_p ())
 503                     break;
 504
 505                   Value_Range res (op->type);
 506                   if (!op->val[0])
 507                     {
 508                       Value_Range varying (op->type);
 509                       varying.set_varying (op->type);
 510                       range_op_handler handler (op->code);
 511                       if (!handler
 512                           || !res.supports_type_p (op->type)
 513                           || !handler.fold_range (res, op->type, vr, varying))
 514                         res.set_varying (op->type);
 515                     }
 516                   else if (!op->val[1])
 517                     {
 518                       Value_Range op0 (op->type);
 519                       range_op_handler handler (op->code);
 520
 521                       ipa_range_set_and_normalize (op0, op->val[0]);
 522
 523                       if (!handler
 524                           || !res.supports_type_p (op->type)
 525                           || !handler.fold_range (res, op->type,
 526                                                   op->index ? op0 : vr,
 527                                                   op->index ? vr : op0))
 528                         res.set_varying (op->type);
 529                     }
 530                   else
 531                     res.set_varying (op->type);
 532                   vr = res;
 533                 }
 534               if (!vr.varying_p () && !vr.undefined_p ())
 535                 {
 536                   int_range<2> res;
 537                   Value_Range val_vr (TREE_TYPE (c->val));
 538                   range_op_handler handler (c->code);
 539
 540                   ipa_range_set_and_normalize (val_vr, c->val);
 541
 542                   if (!handler
 543                       || !val_vr.supports_type_p (TREE_TYPE (c->val))
 544                       || !handler.fold_range (res, boolean_type_node, vr, val_vr))
 545                     res.set_varying (boolean_type_node);
 546
                       /* The range proves the comparison false, so the
                          condition is false in both copies.  Ranges are not
                          used to prove a condition true.  */
 547                   if (res.zero_p ())
 548                     continue;
 549                 }
 550             }
 551         }
 552
           /* The condition could not be disproved; it may hold in both
              copies.  */
 553       clause |= 1 << (i + ipa_predicate::first_dynamic_condition);
 554       nonspec_clause |= 1 << (i + ipa_predicate::first_dynamic_condition);
 555     }
 556   *ret_clause = clause;
 557   if (ret_nonspec_clause)
 558     *ret_nonspec_clause = nonspec_clause;
 559 }
 560
 561 /* Return true if VRP will be exectued on the function.
 562    We do not want to anticipate optimizations that will not happen.
 563
 564    FIXME: This can be confused with -fdisable and debug counters and thus
 565    it should not be used for correctness (only to make heuristics work).
 566    This means that inliner should do its own optimizations of expressions
 567    that it predicts to be constant so wrong code can not be triggered by
 568    builtin_constant_p.  */
 569
 570 static bool
 571 vrp_will_run_p (struct cgraph_node *node)
 572 {
 573   return (opt_for_fn (node->decl, optimize)
 574           && !opt_for_fn (node->decl, optimize_debug)
 575           && opt_for_fn (node->decl, flag_tree_vrp));
 576 }
 577
 578 /* Similarly about FRE.  */
 579
 580 static bool
 581 fre_will_run_p (struct cgraph_node *node)
 582 {
 583   return (opt_for_fn (node->decl, optimize)
 584           && !opt_for_fn (node->decl, optimize_debug)
 585           && opt_for_fn (node->decl, flag_tree_fre));
 586 }
 587
 588 /* Work out what conditions might be true at invocation of E.
 589    Compute costs for inlined edge if INLINE_P is true.
 590
 591    Return in CLAUSE_PTR the evaluated conditions and in NONSPEC_CLAUSE_PTR
 592    (if non-NULL) conditions evaluated for nonspecialized clone called
 593    in a given context.
 594
 595    Vectors in AVALS will be populated with useful known information about
 596    argument values - information not known to have any uses will be omitted -
 597    except for m_known_contexts which will only be calculated if
 598    COMPUTE_CONTEXTS is true.  */
 599
 600 void
 601 evaluate_properties_for_edge (struct cgraph_edge *e, bool inline_p,
 602                               clause_t *clause_ptr,
 603                               clause_t *nonspec_clause_ptr,
 604                               ipa_auto_call_arg_values *avals,
 605                               bool compute_contexts)
 606 {
 607   struct cgraph_node *callee = e->callee->ultimate_alias_target ();
 608   class ipa_fn_summary *info = ipa_fn_summaries->get (callee);
 609   class ipa_edge_args *args;
 610   class ipa_call_summary *es = NULL;
 611
 612   if (clause_ptr)
 613     *clause_ptr = inline_p ? 0 : 1 << ipa_predicate::not_inlined_condition;
 614
 615   if (ipa_node_params_sum
 616       && !e->call_stmt_cannot_inline_p
 617       && (info->conds || compute_contexts)
 618       && (args = ipa_edge_args_sum->get (e)) != NULL)
 619     {
 620       struct cgraph_node *caller;
 621       class ipa_node_params *caller_parms_info, *callee_pi = NULL;
 622       int i, count = ipa_get_cs_argument_count (args);
 623       es = ipa_call_summaries->get (e);
 624
 625       if (count)
 626         {
 627           if (e->caller->inlined_to)
 628             caller = e->caller->inlined_to;
 629           else
 630             caller = e->caller;
 631           caller_parms_info = ipa_node_params_sum->get (caller);
 632           callee_pi = ipa_node_params_sum->get (callee);
 633
 634           /* Watch for thunks.  */
 635           if (callee_pi)
 636             /* Watch for variadic functions.  */
 637             count = MIN (count, ipa_get_param_count (callee_pi));
 638         }
 639
 640       if (callee_pi)
 641         for (i = 0; i < count; i++)
 642           {
 643             struct ipa_jump_func *jf = ipa_get_ith_jump_func (args, i);
 644
 645             if (ipa_is_param_used_by_indirect_call (callee_pi, i)
 646                 || ipa_is_param_used_by_ipa_predicates (callee_pi, i))
 647               {
 648                 /* Determine if we know constant value of the parameter.  */
 649                 tree type = ipa_get_type (callee_pi, i);
 650                 tree cst = ipa_value_from_jfunc (caller_parms_info, jf, type);
 651
 652                 if (!cst && e->call_stmt
 653                     && i < (int)gimple_call_num_args (e->call_stmt))
 654                   {
 655                     cst = gimple_call_arg (e->call_stmt, i);
 656                     if (!is_gimple_min_invariant (cst))
 657                       cst = NULL;
 658                   }
 659                 if (cst)
 660                   {
 661                     gcc_checking_assert (TREE_CODE (cst) != TREE_BINFO);
 662                     if (!avals->m_known_vals.length ())
 663                       avals->m_known_vals.safe_grow_cleared (count, true);
 664                     avals->m_known_vals[i] = cst;
 665                   }
 666                 else if (inline_p && !es->param[i].change_prob)
 667                   {
 668                     if (!avals->m_known_vals.length ())
 669                       avals->m_known_vals.safe_grow_cleared (count, true);
 670                     avals->m_known_vals[i] = error_mark_node;
 671                   }
 672
 673                 /* If we failed to get simple constant, try value range.  */
 674                 if ((!cst || TREE_CODE (cst) != INTEGER_CST)
 675                     && vrp_will_run_p (caller)
 676                     && ipa_is_param_used_by_ipa_predicates (callee_pi, i))
 677                   {
 678                     Value_Range vr (type);
 679
 680                     ipa_value_range_from_jfunc (vr, caller_parms_info, e, jf, type);
 681                     if (!vr.undefined_p () && !vr.varying_p ())
 682                       {
 683                         if (!avals->m_known_value_ranges.length ())
 684                           {
 685                             avals->m_known_value_ranges.safe_grow_cleared (count,
 686                                                                            true);
 687                             for (int i = 0; i < count; ++i)
 688                               avals->m_known_value_ranges[i].set_type (void_type_node);
 689                           }
 690                         avals->m_known_value_ranges[i] = vr;
 691                       }
 692                   }
 693
 694                 /* Determine known aggregate values.  */
 695                 if (fre_will_run_p (caller))
 696                   ipa_push_agg_values_from_jfunc (caller_parms_info,
 697                                                   caller, &jf->agg, i,
 698                                                   &avals->m_known_aggs);
 699               }
 700
 701             /* For calls used in polymorphic calls we further determine
 702                polymorphic call context.  */
 703             if (compute_contexts
 704                 && ipa_is_param_used_by_polymorphic_call (callee_pi, i))
 705               {
 706                 ipa_polymorphic_call_context
 707                    ctx = ipa_context_from_jfunc (caller_parms_info, e, i, jf);
 708                 if (!ctx.useless_p ())
 709                   {
 710                     if (!avals->m_known_contexts.length ())
 711                       avals->m_known_contexts.safe_grow_cleared (count, true);
 712                     avals->m_known_contexts[i]
 713                       = ipa_context_from_jfunc (caller_parms_info, e, i, jf);
 714                   }
 715                }
 716           }
 717         else
 718           gcc_assert (!count || callee->thunk);
 719     }
 720   else if (e->call_stmt && !e->call_stmt_cannot_inline_p && info->conds)
 721     {
 722       int i, count = (int)gimple_call_num_args (e->call_stmt);
 723
 724       for (i = 0; i < count; i++)
 725         {
 726           tree cst = gimple_call_arg (e->call_stmt, i);
 727           if (!is_gimple_min_invariant (cst))
 728             cst = NULL;
 729           if (cst)
 730             {
 731               if (!avals->m_known_vals.length ())
 732                 avals->m_known_vals.safe_grow_cleared (count, true);
 733               avals->m_known_vals[i] = cst;
 734             }
 735         }
 736     }
 737
 738   evaluate_conditions_for_known_args (callee, inline_p, avals, clause_ptr,
 739                                       nonspec_clause_ptr, es);
 740 }
 741
 742
 743 /* Allocate the function summary. */
 744
 745 static void
 746 ipa_fn_summary_alloc (void)
 747 {
 748   gcc_checking_assert (!ipa_fn_summaries);
 749   ipa_size_summaries = new ipa_size_summary_t (symtab);
 750   ipa_fn_summaries = ipa_fn_summary_t::create_ggc (symtab);
 751   ipa_call_summaries = new ipa_call_summary_t (symtab);
 752 }
 753
 754 ipa_call_summary::~ipa_call_summary ()
 755 {
 756   if (predicate)
 757     edge_predicate_pool.remove (predicate);
 758
 759   param.release ();
 760 }
 761
 762 ipa_fn_summary::~ipa_fn_summary ()
 763 {
 764   unsigned len = vec_safe_length (loop_iterations);
 765   for (unsigned i = 0; i < len; i++)
 766     edge_predicate_pool.remove ((*loop_iterations)[i].predicate);
 767   len = vec_safe_length (loop_strides);
 768   for (unsigned i = 0; i < len; i++)
 769     edge_predicate_pool.remove ((*loop_strides)[i].predicate);
 770   vec_free (conds);
 771   call_size_time_table.release ();
 772   vec_free (loop_iterations);
 773   vec_free (loop_strides);
 774   builtin_constant_p_parms.release ();
 775 }
 776
 777 void
 778 ipa_fn_summary_t::remove_callees (cgraph_node *node)
 779 {
 780   cgraph_edge *e;
 781   for (e = node->callees; e; e = e->next_callee)
 782     ipa_call_summaries->remove (e);
 783   for (e = node->indirect_calls; e; e = e->next_callee)
 784     ipa_call_summaries->remove (e);
 785 }
 786
 787 /* Return a copy of loop hint vector V in which each predicate is remapped
 788    for POSSIBLE_TRUTHS and stored in newly allocated memory.  Uninteresting
 789    (true or false) predicates are dropped.  Return NULL if V is empty.  */
 790
 791 static vec<ipa_freqcounting_predicate, va_gc> *
 792 remap_freqcounting_preds_after_dup (vec<ipa_freqcounting_predicate, va_gc> *v,
 793                                     clause_t possible_truths)
 794 {
 795   if (!vec_safe_length (v))
 796     return NULL;
 797
 798   vec<ipa_freqcounting_predicate, va_gc> *copy = v->copy ();
 799   for (int ix = (int) copy->length () - 1; ix >= 0; ix--)
 800     {
 801       ipa_freqcounting_predicate &hint = (*copy)[ix];
 802       ipa_predicate remapped
 803         = hint.predicate->remap_after_duplication (possible_truths);
 804
 805       /* The old predicate still belongs to the node we copied from, so
 806          forget the pointer instead of freeing it.  */
 807       hint.predicate = NULL;
 808       set_hint_predicate (&hint.predicate, remapped);
 809       if (!hint.predicate)
 810         copy->unordered_remove (ix);
 811     }
 812
 813   return copy;
 814 }
 815
 816
 817 /* Hook that is called by cgraph.cc when a node is duplicated.  SRC_INFO is
        the summary of the original node SRC; INFO is the storage for the
        summary of the new node DST and is constructed here as a copy of
        SRC_INFO.  When DST has parameter replacements recorded in its clone
        info, the predicates are re-evaluated under those known values;
        otherwise the tables are simply copied.  */
 818 void
 819 ipa_fn_summary_t::duplicate (cgraph_node *src,
 820                              cgraph_node *dst,
 821                              ipa_fn_summary *src_info,
 822                              ipa_fn_summary *info)
 823 {
       /* Copy-construct the new summary in place.  */
 824   new (info) ipa_fn_summary (*src_info);
 825   /* TODO: as an optimization, we may avoid copying conditions
 826      that are known to be false or true.  */
 827   info->conds = vec_safe_copy (info->conds);
 828
 829   clone_info *cinfo = clone_info::get (dst);
 830   /* When there are any replacements in the function body, see if we can figure
 831      out that something was optimized out.  */
 832   if (ipa_node_params_sum && cinfo && cinfo->tree_map)
 833     {
 834       /* Use SRC parm info since it may not be copied yet.  */
 835       ipa_node_params *parms_info = ipa_node_params_sum->get (src);
 836       ipa_auto_call_arg_values avals;
 837       int count = ipa_get_param_count (parms_info);
 838       int i, j;
 839       clause_t possible_truths;
 840       ipa_predicate true_pred = true;
 841       size_time_entry *e;
 842       int optimized_out_size = 0;
 843       bool inlined_to_p = false;
 844       struct cgraph_edge *edge, *next;
 845
           /* The size/time table is rebuilt below from SRC_INFO's entries.  */
 846       info->size_time_table.release ();
           /* For each parameter index, record the replacement value found in
              the clone's tree map, if there is one.  */
 847       avals.m_known_vals.safe_grow_cleared (count, true);
 848       for (i = 0; i < count; i++)
 849         {
 850           struct ipa_replace_map *r;
 851
 852           for (j = 0; vec_safe_iterate (cinfo->tree_map, j, &r); j++)
 853             {
 854               if (r->parm_num == i)
 855                 {
 856                   avals.m_known_vals[i] = r->new_tree;
 857                   break;
 858                 }
 859             }
 860         }
 861       evaluate_conditions_for_known_args (dst, false,
 862                                           &avals,
 863                                           &possible_truths,
 864                                           /* We are going to specialize,
 865                                              so ignore nonspec truths.  */
 866                                           NULL,
 867                                           NULL);
 868
           /* Start the rebuilt table with a zero-size, zero-time entry guarded
              by the always-true predicate.  */
 869       info->account_size_time (0, 0, true_pred, true_pred);
 870
 871       /* Remap size_time vectors.
 872          Simplify the predicate by pruning out alternatives that are known
 873          to be false.
 874          TODO: as an optimization, we can also eliminate conditions known
 875          to be true.  */
 876       for (i = 0; src_info->size_time_table.iterate (i, &e); i++)
 877         {
 878           ipa_predicate new_exec_pred;
 879           ipa_predicate new_nonconst_pred;
 880           new_exec_pred = e->exec_predicate.remap_after_duplication
 881                                  (possible_truths);
 882           new_nonconst_pred = e->nonconst_predicate.remap_after_duplication
 883                                  (possible_truths);
               /* An entry whose predicate became false is counted as optimized
                  out instead of being carried over.  */
 884           if (new_exec_pred == false || new_nonconst_pred == false)
 885             optimized_out_size += e->size;
 886           else
 887             info->account_size_time (e->size, e->time, new_exec_pred,
 888                                      new_nonconst_pred);
 889         }
 890
 891       /* Remap edge predicates with the same simplification as above.
 892          Also copy constantness arrays.   */
 893       for (edge = dst->callees; edge; edge = next)
 894         {
 895           ipa_predicate new_predicate;
 896           class ipa_call_summary *es = ipa_call_summaries->get (edge);
 897           next = edge->next_callee;
 898
               /* Remember whether any callee has already been inlined.  */
 899           if (!edge->inline_failed)
 900             inlined_to_p = true;
 901           if (!es->predicate)
 902             continue;
 903           new_predicate = es->predicate->remap_after_duplication
 904             (possible_truths);
               /* Count the call as optimized out only if its predicate was not
                  false already.  */
 905           if (new_predicate == false && *es->predicate != false)
 906             optimized_out_size += es->call_stmt_size * ipa_fn_summary::size_scale;
 907           edge_set_predicate (edge, &new_predicate);
 908         }
 909
 910       /* Remap indirect edge predicates with the same simplification as above.
 911          Also copy constantness arrays.   */
 912       for (edge = dst->indirect_calls; edge; edge = next)
 913         {
 914           ipa_predicate new_predicate;
 915           class ipa_call_summary *es = ipa_call_summaries->get (edge);
 916           next = edge->next_callee;
 917
 918           gcc_checking_assert (edge->inline_failed);
 919           if (!es->predicate)
 920             continue;
 921           new_predicate = es->predicate->remap_after_duplication
 922                                  (possible_truths);
 923           if (new_predicate == false && *es->predicate != false)
 924             optimized_out_size
 925                  += es->call_stmt_size * ipa_fn_summary::size_scale;
 926           edge_set_predicate (edge, &new_predicate);
 927         }
           /* Give INFO remapped loop hint vectors of its own.  */
 928       info->loop_iterations
 929         = remap_freqcounting_preds_after_dup (info->loop_iterations,
 930                                               possible_truths);
 931       info->loop_strides
 932         = remap_freqcounting_preds_after_dup (info->loop_strides,
 933                                               possible_truths);
 934       if (info->builtin_constant_p_parms.length())
 935         {
               /* PARMS is the vector INFO got from the copy construction
                  above.  Build a new vector for INFO that keeps only the
                  parameters for which no replacement value is known.  */
 936           vec <int, va_heap, vl_ptr> parms = info->builtin_constant_p_parms;
 937           int ip;
 938           info->builtin_constant_p_parms = vNULL;
 939           for (i = 0; parms.iterate (i, &ip); i++)
 940             if (!avals.m_known_vals[ip])
 941               info->builtin_constant_p_parms.safe_push (ip);
 942         }
 943
 944       /* If inliner or someone after inliner will ever start producing
 945          non-trivial clones, we will get trouble with lack of information
 946          about updating self sizes, because size vectors already contains
 947          sizes of the callees.  */
 948       gcc_assert (!inlined_to_p || !optimized_out_size);
 949     }
 950   else
 951     {
           /* No replacements to account for: give INFO its own copies of the
              tables.  */
 952       info->size_time_table = src_info->size_time_table.copy ();
 953       info->loop_iterations = vec_safe_copy (src_info->loop_iterations);
 954       info->loop_strides = vec_safe_copy (info->loop_strides);
 955
 956       info->builtin_constant_p_parms
 957              = info->builtin_constant_p_parms.copy ();
 958
           /* The copied hint entries still point at the predicates they were
              copied from.  Re-create each predicate through
              set_hint_predicate so that INFO has its own.  */
 959       ipa_freqcounting_predicate *f;
 960       for (int i = 0; vec_safe_iterate (info->loop_iterations, i, &f); i++)
 961         {
 962           ipa_predicate p = *f->predicate;
 963           f->predicate = NULL;
 964           set_hint_predicate (&f->predicate, p);
 965         }
 966       for (int i = 0; vec_safe_iterate (info->loop_strides, i, &f); i++)
 967         {
 968           ipa_predicate p = *f->predicate;
 969           f->predicate = NULL;
 970           set_hint_predicate (&f->predicate, p);
 971         }
 972     }
       /* The overall summary is recomputed only for nodes that are not
          inlined into another one.  */
 973   if (!dst->inlined_to)
 974     ipa_update_overall_fn_summary (dst);
 975 }
 976
 977
 978 /* Hook that is called by cgraph.cc when an edge is duplicated.  */
 979
 980 void
 981 ipa_call_summary_t::duplicate (struct cgraph_edge *src,
 982                                struct cgraph_edge *dst,
 983                                class ipa_call_summary *srcinfo,
 984                                class ipa_call_summary *info)
 985 {
 986   new (info) ipa_call_summary (*srcinfo);
 987   info->predicate = NULL;
 988   edge_set_predicate (dst, srcinfo->predicate);
 989   info->param = srcinfo->param.copy ();
 990   if (dst->indirect_unknown_callee || !src->indirect_unknown_callee)
 991     return;
 992   /* SRC was an indirect call but DST is not; drop the indirect surcharge.  */
 993   info->call_stmt_size -= (eni_size_weights.indirect_call_cost
 994                            - eni_size_weights.call_cost);
 995   info->call_stmt_time -= (eni_time_weights.indirect_call_cost
 996                            - eni_time_weights.call_cost);
 997 }
 998
  999 /* Dump to F the call summaries of all edges leaving NODE, recursing into
 1000    callees that have been inlined.  Indent by INDENT.  INFO is the function
         summary whose conditions are used when printing edge predicates.  */
 1001
 1002 static void
 1003 dump_ipa_call_summary (FILE *f, int indent, struct cgraph_node *node,
 1004                        class ipa_fn_summary *info)
 1005 {
 1006   struct cgraph_edge *edge;
        /* Direct calls first.  */
 1007   for (edge = node->callees; edge; edge = edge->next_callee)
 1008     {
 1009       class ipa_call_summary *es = ipa_call_summaries->get (edge);
 1010       struct cgraph_node *callee = edge->callee->ultimate_alias_target ();
 1011       int i;
 1012
            /* Callee name, inline status (or the reason inlining failed) and,
               on the next line, the edge frequency.  */
 1013       fprintf (f,
 1014                "%*s%s %s\n%*s  freq:%4.2f",
 1015                indent, "", callee->dump_name (),
 1016                !edge->inline_failed
 1017                ? "inlined" : cgraph_inline_failed_string (edge-> inline_failed),
 1018                indent, "", edge->sreal_frequency ().to_double ());
 1019
 1020       if (cross_module_call_p (edge))
 1021         fprintf (f, " cross module");
 1022
 1023       if (es)
 1024         fprintf (f, " loop depth:%2i size:%2i time: %2i",
 1025                  es->loop_depth, es->call_stmt_size, es->call_stmt_time);
 1026
            /* NOTE(review): SS is dereferenced whenever S is non-NULL;
               presumably a size summary exists whenever a function summary
               does -- confirm.  */
 1027       ipa_fn_summary *s = ipa_fn_summaries->get (callee);
 1028       ipa_size_summary *ss = ipa_size_summaries->get (callee);
 1029       if (s != NULL)
 1030         fprintf (f, " callee size:%2i stack:%2i",
 1031                  (int) (ss->size / ipa_fn_summary::size_scale),
 1032                  (int) s->estimated_stack_size);
 1033
            /* The line is ended explicitly only when no predicate is printed;
               presumably the predicate dump terminates the line itself.  */
 1034       if (es && es->predicate)
 1035         {
 1036           fprintf (f, " predicate: ");
 1037           es->predicate->dump (f, info->conds);
 1038         }
 1039       else
 1040         fprintf (f, "\n");
            /* Per-operand facts recorded for the call.  */
 1041       if (es && es->param.exists ())
 1042         for (i = 0; i < (int) es->param.length (); i++)
 1043           {
 1044             int prob = es->param[i].change_prob;
 1045
                  /* A zero probability is reported as invariant, and a
                     probability equal to REG_BR_PROB_BASE is not reported.  */
 1046             if (!prob)
 1047               fprintf (f, "%*s op%i is compile time invariant\n",
 1048                        indent + 2, "", i);
 1049             else if (prob != REG_BR_PROB_BASE)
 1050               fprintf (f, "%*s op%i change %f%% of time\n", indent + 2, "", i,
 1051                        prob * 100.0 / REG_BR_PROB_BASE);
 1052             if (es->param[i].points_to_local_or_readonly_memory)
 1053               fprintf (f, "%*s op%i points to local or readonly memory\n",
 1054                        indent + 2, "", i);
 1055             if (es->param[i].points_to_possible_sra_candidate)
 1056               fprintf (f, "%*s op%i points to possible sra candidate\n",
 1057                        indent + 2, "", i);
 1058           }
            /* For an inlined call, print the callee's stack data and then dump
               the callee's own edges one level deeper.  */
 1059       if (!edge->inline_failed)
 1060         {
 1061           ipa_size_summary *ss = ipa_size_summaries->get (callee);
 1062           fprintf (f, "%*sStack frame offset %i, callee self size %i\n",
 1063                    indent + 2, "",
 1064                    (int) ipa_get_stack_frame_offset (callee),
 1065                    (int) ss->estimated_self_stack_size);
 1066           dump_ipa_call_summary (f, indent + 2, callee, info);
 1067         }
 1068     }
        /* Indirect calls.  Unlike above, ES is used here without a NULL
           check.  */
 1069   for (edge = node->indirect_calls; edge; edge = edge->next_callee)
 1070     {
 1071       class ipa_call_summary *es = ipa_call_summaries->get (edge);
 1072       fprintf (f, "%*sindirect call loop depth:%2i freq:%4.2f size:%2i"
 1073                " time: %2i",
 1074                indent, "",
 1075                es->loop_depth,
 1076                edge->sreal_frequency ().to_double (), es->call_stmt_size,
 1077                es->call_stmt_time);
 1078       if (es->predicate)
 1079         {
 1080           fprintf (f, "predicate: ");
 1081           es->predicate->dump (f, info->conds);
 1082         }
 1083       else
 1084         fprintf (f, "\n");
 1085     }
 1086 }
1087
1088
1089 void
1090 ipa_dump_fn_summary (FILE *f, struct cgraph_node *node)
1091 {
       /* Dump the IPA function summary of NODE to F.  Nothing is printed for
          a node without a definition; a defined node that has no summary
          gets a one-line note saying so.  */
1092   if (node->definition)
1093     {
1094       class ipa_fn_summary *s = ipa_fn_summaries->get (node);
           /* NOTE(review): SS is dereferenced below without a NULL check;
              presumably a size summary exists whenever S does -- confirm.  */
1095       class ipa_size_summary *ss = ipa_size_summaries->get (node);
1096       if (s != NULL)
1097         {
1098           size_time_entry *e;
1099           int i;
               /* Header line: the name followed by the flags that are set.  */
1100           fprintf (f, "IPA function summary for %s", node->dump_name ());
1101           if (DECL_DISREGARD_INLINE_LIMITS (node->decl))
1102             fprintf (f, " always_inline");
1103           if (s->inlinable)
1104             fprintf (f, " inlinable");
1105           if (s->fp_expressions)
1106             fprintf (f, " fp_expression");
1107           if (s->builtin_constant_p_parms.length ())
1108             {
1109               fprintf (f, " builtin_constant_p_parms");
1110               for (unsigned int i = 0;
1111                    i < s->builtin_constant_p_parms.length (); i++)
1112                 fprintf (f, " %i", s->builtin_constant_p_parms[i]);
1113             }
               /* Scalar size, time and stack figures.  Growth and SCC number
                  are printed only when nonzero.  */
1114           fprintf (f, "\n  global time:     %f\n", s->time.to_double ());
1115           fprintf (f, "  self size:       %i\n", ss->self_size);
1116           fprintf (f, "  global size:     %i\n", ss->size);
1117           fprintf (f, "  min size:       %i\n", s->min_size);
1118           fprintf (f, "  self stack:      %i\n",
1119                    (int) ss->estimated_self_stack_size);
1120           fprintf (f, "  global stack:    %i\n", (int) s->estimated_stack_size);
1121           if (s->growth)
1122             fprintf (f, "  estimated growth:%i\n", (int) s->growth);
1123           if (s->scc_no)
1124             fprintf (f, "  In SCC:          %i\n", (int) s->scc_no);
               /* One line per size/time table entry.  Sizes are stored scaled
                  by ipa_fn_summary::size_scale.  */
1125           for (i = 0; s->size_time_table.iterate (i, &e); i++)
1126             {
1127               fprintf (f, "    size:%f, time:%f",
1128                        (double) e->size / ipa_fn_summary::size_scale,
1129                        e->time.to_double ());
1130               if (e->exec_predicate != true)
1131                 {
1132                   fprintf (f, ",  executed if:");
1133                   e->exec_predicate.dump (f, s->conds, 0);
1134                 }
                   /* The nonconst predicate is shown only when it differs from
                      the exec predicate.  */
1135               if (e->exec_predicate != e->nonconst_predicate)
1136                 {
1137                   fprintf (f, ",  nonconst if:");
1138                   e->nonconst_predicate.dump (f, s->conds, 0);
1139                 }
1140               fprintf (f, "\n");
1141             }
               /* Loop hints.  Each heading is printed once, and only if the
                  corresponding vector has at least one entry.  */
1142           ipa_freqcounting_predicate *fcp;
1143           bool first_fcp = true;
1144           for (int i = 0; vec_safe_iterate (s->loop_iterations, i, &fcp); i++)
1145             {
1146               if (first_fcp)
1147                 {
1148                   fprintf (f, "  loop iterations:");
1149                   first_fcp = false;
1150                 }
1151               fprintf (f, "  %3.2f for ", fcp->freq.to_double ());
1152               fcp->predicate->dump (f, s->conds);
1153             }
1154           first_fcp = true;
1155           for (int i = 0; vec_safe_iterate (s->loop_strides, i, &fcp); i++)
1156             {
1157               if (first_fcp)
1158                 {
1159                   fprintf (f, "  loop strides:");
1160                   first_fcp = false;
1161                 }
1162               fprintf (f, "  %3.2f for :", fcp->freq.to_double ());
1163               fcp->predicate->dump (f, s->conds);
1164             }
               /* Finally the summaries of the calls made by NODE.  */
1165           fprintf (f, "  calls:\n");
1166           dump_ipa_call_summary (f, 4, node, s);
1167           fprintf (f, "\n");
1168           if (s->target_info)
1169             fprintf (f, "  target_info: %x\n", s->target_info);
1170         }
1171       else
1172         fprintf (f, "IPA summary for %s is missing.\n", node->dump_name ());
1173     }
1174 }
1175
1176 DEBUG_FUNCTION void
1177 ipa_debug_fn_summary (struct cgraph_node *node)
1178 {
       /* Dump the function summary of NODE to stderr.  */
1179   ipa_dump_fn_summary (stderr, node);
1180 }
1181
1182 void
1183 ipa_dump_fn_summaries (FILE *f)
1184 {
1185   /* Dump every defined function that is not inlined into another one.  */
1186   struct cgraph_node *fn;
1187   FOR_EACH_DEFINED_FUNCTION (fn)
1188     if (fn->inlined_to == NULL)
1189       ipa_dump_fn_summary (f, fn);
1190 }
1191
1192 /* Callback for walk_aliased_vdefs.  Set the boolean that DATA points to,
1193    recording that the callback was invoked, and return true.  */
1194
1195 static bool
1196 mark_modified (ao_ref *ao ATTRIBUTE_UNUSED, tree vdef ATTRIBUTE_UNUSED,
1197                void *data)
1198 {
1199   /* AO and VDEF are not looked at; being called at all is the signal.  */
1200   *static_cast <bool *> (data) = true;
1201   return true;
1202 }
1203
1204 /* Return the PARM_DECL whose unmodified value OP holds at STMT, or NULL_TREE
1205    if OP is not known to be such a value.  When a parameter is returned and
1206    SIZE_P is non-NULL, the size of OP's type is stored to *SIZE_P.  */
1207
1208 static tree
1209 unmodified_parm_1 (ipa_func_body_info *fbi, gimple *stmt, tree op,
1210                    poly_int64 *size_p)
1211 {
1212   /* Default definition SSA_NAME of a parameter.  */
1213   if (TREE_CODE (op) == SSA_NAME
1214       && SSA_NAME_IS_DEFAULT_DEF (op)
1215       && TREE_CODE (SSA_NAME_VAR (op)) == PARM_DECL)
1216     {
1217       if (size_p)
1218         *size_p = tree_to_poly_int64 (TYPE_SIZE (TREE_TYPE (op)));
1219       return SSA_NAME_VAR (op);
1220     }
1221
1222   /* Otherwise only a direct PARM_DECL reference can qualify, and only while
1223      some alias-walk budget is left to check that it was not modified.  */
1224   if (TREE_CODE (op) != PARM_DECL || !(fbi->aa_walk_budget > 0))
1225     return NULL_TREE;
1226
1227   bool clobbered = false;
1228   ao_ref parm_ref;
1229   ao_ref_init (&parm_ref, op);
1230   int cost = walk_aliased_vdefs (&parm_ref, gimple_vuse (stmt), mark_modified,
1231                                  &clobbered, NULL, NULL,
1232                                  fbi->aa_walk_budget);
1233   if (cost < 0)
1234     {
1235       /* A negative result zeroes the budget, which disables later walks.  */
1236       fbi->aa_walk_budget = 0;
1237       return NULL_TREE;
1238     }
1239   fbi->aa_walk_budget -= cost;
1240   if (clobbered)
1241     return NULL_TREE;
1242
1243   if (size_p)
1244     *size_p = tree_to_poly_int64 (TYPE_SIZE (TREE_TYPE (op)));
1245   return op;
1246 }
1247
1248 /* If OP holds the unmodified value of a function parameter, return that
1249    parameter, looking through chains of single-rhs SSA assignments as needed;
1250    otherwise return NULL_TREE.  If SIZE_P is non-NULL, the size found for the
1251    parameter value is stored to *SIZE_P on success.  */
1252
1253 static tree
1254 unmodified_parm (ipa_func_body_info *fbi, gimple *stmt, tree op,
1255                  poly_int64 *size_p)
1256 {
1257   for (;;)
1258     {
1259       if (tree parm = unmodified_parm_1 (fbi, stmt, op, size_p))
1260         return parm;
1261       if (TREE_CODE (op) != SSA_NAME || SSA_NAME_IS_DEFAULT_DEF (op))
1262         return NULL_TREE;
1263       stmt = SSA_NAME_DEF_STMT (op);
1264       if (!gimple_assign_single_p (stmt))
1265         return NULL_TREE;
1266       op = gimple_assign_rhs1 (stmt);
1267     }
1268 }
1269
1270 /* Return TRUE if OP is the value of a function parameter, or a value loaded
1271    from an aggregate passed in a parameter (by value or by reference).  On
1272    success the parameter number is stored to *INDEX_P, the access size to
1273    *SIZE_P, and *AGGPOS says whether and how the value was loaded from an
1274    aggregate.  FBI carries the function body info, including the parameter
1275    descriptors; STMT is the statement in which OP is used or loaded.  */
1276
1277 static bool
1278 unmodified_parm_or_parm_agg_item (struct ipa_func_body_info *fbi,
1279                                   gimple *stmt, tree op, int *index_p,
1280                                   poly_int64 *size_p,
1281                                   struct agg_position_info *aggpos)
1282 {
1283   for (;;)
1284     {
1285       tree parm = unmodified_parm_1 (fbi, stmt, op, size_p);
1286       gcc_checking_assert (aggpos);
1287       if (parm)
1288         {
1289           *index_p = ipa_get_param_decl_index (fbi->info, parm);
1290           if (*index_p < 0)
1291             return false;
1292           aggpos->agg_contents = false;
1293           aggpos->by_ref = false;
1294           return true;
1295         }
1296       if (TREE_CODE (op) != SSA_NAME)
1297         break;
1298       if (SSA_NAME_IS_DEFAULT_DEF (op))
1299         return false;
1300       stmt = SSA_NAME_DEF_STMT (op);
1301       if (!gimple_assign_single_p (stmt))
1302         return false;
1303       op = gimple_assign_rhs1 (stmt);
1304       if (REFERENCE_CLASS_P (op))
1305         break;
1306     }
1307   /* Whatever is left in OP is checked as a load from an aggregate.  */
1308   aggpos->agg_contents = true;
1309   return ipa_load_from_parm_agg (fbi, fbi->info->descriptors,
1310                                  stmt, op, index_p, &aggpos->offset,
1311                                  size_p, &aggpos->by_ref);
1312 }
1313
1314 /* If STMT is a simple load or store of a value pointed to by a function
1315    parameter, return the index of that parameter; otherwise return -1.  */
1316
1317 static int
1318 load_or_store_of_ptr_parameter (ipa_func_body_info *fbi, gimple *stmt)
1319 {
1320   if (!optimize || !dyn_cast <gassign *> (stmt))
1321     return -1;
1322   /* Take the memory operand: source of a load or target of a store.  */
1323   tree mem;
1324   if (gimple_assign_load_p (stmt))
1325     mem = gimple_assign_rhs1 (stmt);
1326   else if (gimple_store_p (stmt))
1327     mem = gimple_assign_lhs (stmt);
1328   else
1329     return -1;
1330   /* The access must go through a default-definition SSA_NAME pointer.  */
1331   tree base = get_base_address (mem);
1332   if (TREE_CODE (base) != MEM_REF)
1333     return -1;
1334   tree ptr = TREE_OPERAND (base, 0);
1335   if (TREE_CODE (ptr) != SSA_NAME || !SSA_NAME_IS_DEFAULT_DEF (ptr))
1336     return -1;
1337   tree decl = SSA_NAME_VAR (ptr);
1338   if (TREE_CODE (decl) != PARM_DECL)
1339     return -1;
1340   return ipa_get_param_decl_index (fbi->info, decl);
1341 }
1342
1343 /* See if statement might disappear after inlining.
1344    0 - means not eliminated
1345    1 - half of statements goes away
1346    2 - for sure it is eliminated.
1347    We are not terribly sophisticated, basically looking for simple abstraction
1348    penalty wrappers.  STMT is the statement being classified and FBI is the
        function body info handed to the parameter queries.  The result is
        always 0 when not optimizing.  */
1349
1350 static int
1351 eliminated_by_inlining_prob (ipa_func_body_info *fbi, gimple *stmt)
1352 {
1353   enum gimple_code code = gimple_code (stmt);
1354   enum tree_code rhs_code;
1355
1356   if (!optimize)
1357     return 0;
1358
1359   switch (code)
1360     {
1361     case GIMPLE_RETURN:
1362       return 2;
1363     case GIMPLE_ASSIGN:
           /* Only assignments with exactly two operands are considered
              (presumably the lhs plus a single rhs operand -- confirm).  */
1364       if (gimple_num_ops (stmt) != 2)
1365         return 0;
1366
1367       rhs_code = gimple_assign_rhs_code (stmt);
1368
1369       /* Casts of parameters, loads from parameters passed by reference
1370          and stores to return value or parameters are often free after
1371          inlining due to SRA and further combining.
1372          Assume that half of statements goes away.  */
1373       if (CONVERT_EXPR_CODE_P (rhs_code)
1374           || rhs_code == VIEW_CONVERT_EXPR
1375           || rhs_code == ADDR_EXPR
1376           || gimple_assign_rhs_class (stmt) == GIMPLE_SINGLE_RHS)
1377         {
1378           tree rhs = gimple_assign_rhs1 (stmt);
1379           tree lhs = gimple_assign_lhs (stmt);
1380           tree inner_rhs = get_base_address (rhs);
1381           tree inner_lhs = get_base_address (lhs);
1382           bool rhs_free = false;
1383           bool lhs_free = false;
1384
               /* Fall back to the whole operand when no base address was
                  returned.  */
1385           if (!inner_rhs)
1386             inner_rhs = rhs;
1387           if (!inner_lhs)
1388             inner_lhs = lhs;
1389
1390           /* Reads of parameter are expected to be free.  */
1391           if (unmodified_parm (fbi, stmt, inner_rhs, NULL))
1392             rhs_free = true;
1393           /* Match expressions of form &this->field. Those will most likely
1394              combine with something upstream after inlining.  */
1395           else if (TREE_CODE (inner_rhs) == ADDR_EXPR)
1396             {
1397               tree op = get_base_address (TREE_OPERAND (inner_rhs, 0));
1398               if (TREE_CODE (op) == PARM_DECL)
1399                 rhs_free = true;
1400               else if (TREE_CODE (op) == MEM_REF
1401                        && unmodified_parm (fbi, stmt, TREE_OPERAND (op, 0),
1402                                            NULL))
1403                 rhs_free = true;
1404             }
1405
1406           /* When parameter is not SSA register because its address is taken
1407              and it is just copied into one, the statement will be completely
1408              free after inlining (we will copy propagate backward).   */
1409           if (rhs_free && is_gimple_reg (lhs))
1410             return 2;
1411
1412           /* Reads of parameters passed by reference
1413              expected to be free (i.e. optimized out after inlining).  */
1414           if (TREE_CODE (inner_rhs) == MEM_REF
1415               && unmodified_parm (fbi, stmt, TREE_OPERAND (inner_rhs, 0), NULL))
1416             rhs_free = true;
1417
1418           /* Copying parameter passed by reference into gimple register is
1419              probably also going to copy propagate, but we can't be quite
1420              sure.  */
1421           if (rhs_free && is_gimple_reg (lhs))
1422             lhs_free = true;
1423
1424           /* Writes to parameters, parameters passed by value and return value
1425              (either directly or passed via invisible reference) are free.
1426
1427              TODO: We ought to handle testcase like
1428              struct a {int a,b;};
1429              struct a
1430              returnstruct (void)
1431              {
1432              struct a a ={1,2};
1433              return a;
1434              }
1435
1436              This translate into:
1437
1438              returnstruct ()
1439              {
1440              int a$b;
1441              int a$a;
1442              struct a a;
1443              struct a D.2739;
1444
1445              <bb 2>:
1446              D.2739.a = 1;
1447              D.2739.b = 2;
1448              return D.2739;
1449
1450              }
1451              For that we either need to copy ipa-split logic detecting writes
1452              to return value.  */
1453           if (TREE_CODE (inner_lhs) == PARM_DECL
1454               || TREE_CODE (inner_lhs) == RESULT_DECL
1455               || (TREE_CODE (inner_lhs) == MEM_REF
1456                   && (unmodified_parm (fbi, stmt, TREE_OPERAND (inner_lhs, 0),
1457                                        NULL)
1458                       || (TREE_CODE (TREE_OPERAND (inner_lhs, 0)) == SSA_NAME
1459                           && SSA_NAME_VAR (TREE_OPERAND (inner_lhs, 0))
1460                           && TREE_CODE (SSA_NAME_VAR (TREE_OPERAND
1461                                                       (inner_lhs,
1462                                                        0))) == RESULT_DECL))))
1463             lhs_free = true;
               /* With a free destination, a register or invariant source is
                  treated as free too.  */
1464           if (lhs_free
1465               && (is_gimple_reg (rhs) || is_gimple_min_invariant (rhs)))
1466             rhs_free = true;
               /* Both sides look free: report the "half goes away" estimate.  */
1467           if (lhs_free && rhs_free)
1468             return 1;
1469         }
1470       return 0;
1471     default:
1472       return 0;
1473     }
1474 }
1475
1476 /* Analyze EXPR if it represents a series of simple operations performed on
1477    a function parameter and return true if so.  FBI, STMT, EXPR, INDEX_P and
1478    AGGPOS have the same meaning like in unmodified_parm_or_parm_agg_item.
1479    Type of the parameter or load from an aggregate via the parameter is
1480    stored in *TYPE_P.  Operations on the parameter are recorded to
1481    PARAM_OPS_P if it is not NULL.  On failure false is returned and any
        operations already recorded in *PARAM_OPS_P are freed.  */
1482
1483 static bool
1484 decompose_param_expr (struct ipa_func_body_info *fbi,
1485                       gimple *stmt, tree expr,
1486                       int *index_p, tree *type_p,
1487                       struct agg_position_info *aggpos,
1488                       expr_eval_ops *param_ops_p = NULL)
1489 {
1490   int op_limit = opt_for_fn (fbi->node->decl, param_ipa_max_param_expr_ops);
1491   int op_count = 0;
1492
1493   if (param_ops_p)
1494     *param_ops_p = NULL;
1495
       /* Each iteration looks through one statement defining EXPR.  */
1496   while (true)
1497     {
1498       expr_eval_op eval_op;
1499       unsigned rhs_count;
1500       unsigned cst_count = 0;
1501
           /* Reached a parameter or a load from one: succeed, unless the load
              involves a bit-field.  */
1502       if (unmodified_parm_or_parm_agg_item (fbi, stmt, expr, index_p, NULL,
1503                                             aggpos))
1504         {
1505           tree type = TREE_TYPE (expr);
1506
1507           if (aggpos->agg_contents)
1508             {
1509               /* Stop if containing bit-field.  */
1510               if (TREE_CODE (expr) == BIT_FIELD_REF
1511                   || contains_bitfld_component_ref_p (expr))
1512                 break;
1513             }
1514
1515           *type_p = type;
1516           return true;
1517         }
1518
1519       if (TREE_CODE (expr) != SSA_NAME || SSA_NAME_IS_DEFAULT_DEF (expr))
1520         break;
1521       stmt = SSA_NAME_DEF_STMT (expr);
1522
           /* Look through a call whose return flags say that it returns one
              of its arguments; continue with that argument.  */
1523       if (gcall *call = dyn_cast <gcall *> (stmt))
1524         {
1525           int flags = gimple_call_return_flags (call);
1526           if (!(flags & ERF_RETURNS_ARG))
1527             goto fail;
1528           int arg = flags & ERF_RETURN_ARG_MASK;
1529           if (arg >= (int)gimple_call_num_args (call))
1530             goto fail;
1531           expr = gimple_call_arg (stmt, arg);
1532           continue;
1533         }
1534
1535       if (!is_gimple_assign (stmt = SSA_NAME_DEF_STMT (expr)))
1536         break;
1537
1538       switch (gimple_assign_rhs_class (stmt))
1539         {
             /* A single-rhs assignment is followed without being counted or
                recorded as an operation.  */
1540         case GIMPLE_SINGLE_RHS:
1541           expr = gimple_assign_rhs1 (stmt);
1542           continue;
1543
1544         case GIMPLE_UNARY_RHS:
1545           rhs_count = 1;
1546           break;
1547
1548         case GIMPLE_BINARY_RHS:
1549           rhs_count = 2;
1550           break;
1551
1552         case GIMPLE_TERNARY_RHS:
1553           rhs_count = 3;
1554           break;
1555
1556         default:
1557           goto fail;
1558         }
1559
1560       /* Stop if expression is too complex.  */
1561       if (op_count++ == op_limit)
1562         break;
1563
1564       if (param_ops_p)
1565         {
1566           eval_op.code = gimple_assign_rhs_code (stmt);
1567           eval_op.type = TREE_TYPE (gimple_assign_lhs (stmt));
1568           eval_op.val[0] = NULL_TREE;
1569           eval_op.val[1] = NULL_TREE;
1570         }
1571
           /* Exactly one rhs operand may be non-constant; it becomes the next
              EXPR.  Constant operands are stored in EVAL_OP in the order they
              are seen.  An rhs made only of constants is rejected.  */
1572       expr = NULL_TREE;
1573       for (unsigned i = 0; i < rhs_count; i++)
1574         {
1575           tree op = gimple_op (stmt, i + 1);
1576
1577           gcc_assert (op && !TYPE_P (op));
1578           if (is_gimple_ip_invariant (op))
1579             {
1580               if (++cst_count == rhs_count)
1581                 goto fail;
1582
1583               eval_op.val[cst_count - 1] = op;
1584             }
1585           else if (!expr)
1586             {
1587               /* Found a non-constant operand, and record its index in rhs
1588                  operands.  */
1589               eval_op.index = i;
1590               expr = op;
1591             }
1592           else
1593             {
1594               /* Found more than one non-constant operands.  */
1595               goto fail;
1596             }
1597         }
1598
           /* Statements found later are closer to the parameter, so insert at
              the front to keep the operation nearest the parameter first.  */
1599       if (param_ops_p)
1600         vec_safe_insert (*param_ops_p, 0, eval_op);
1601     }
1602
1603   /* Failed to decompose, free resource and return.  */
       /* Both a `break' out of the loop above and `goto fail' end up here.  */
1604 fail:
1605   if (param_ops_p)
1606     vec_free (*param_ops_p);
1607
1608   return false;
1609 }
1610
1611 /* Note in SUMMARY that parameter number PARM is used by builtin_constant_p,
1612    unless it has been recorded already.  */
1613
1614 static void
1615 add_builtin_constant_p_parm (class ipa_fn_summary *summary, int parm)
1616 {
1617   vec <int, va_heap, vl_ptr> &parms = summary->builtin_constant_p_parms;
1618
1619   /* Nothing to do if PARM is already present.  */
1620   for (unsigned int ix = 0; ix < parms.length (); ix++)
1621     if (parms[ix] == parm)
1622       return;
1623   parms.safe_push (parm);
1624 }
1625
1626 /* If BB ends by a conditional we can turn into predicates, attach corresponding
1627    predicates to the CFG edges.   */
1628
1629 static void
1630 set_cond_stmt_execution_predicate (struct ipa_func_body_info *fbi,
1631                                    class ipa_fn_summary *summary,
1632                                    class ipa_node_params *params_summary,
1633                                    basic_block bb)
1634 {
1635   tree op, op2;
1636   int index;
1637   struct agg_position_info aggpos;
1638   enum tree_code code, inverted_code;
1639   edge e;
1640   edge_iterator ei;
1641   gimple *set_stmt;
1642   tree param_type;
1643   expr_eval_ops param_ops;
1644
1645   gcond *last = safe_dyn_cast <gcond *> (*gsi_last_bb (bb));
1646   if (!last)
1647     return;
1648   if (!is_gimple_ip_invariant (gimple_cond_rhs (last)))
1649     return;
1650   op = gimple_cond_lhs (last);
1651
1652   if (decompose_param_expr (fbi, last, op, &index, &param_type, &aggpos,
1653                             &param_ops))
1654     {
1655       code = gimple_cond_code (last);
1656       inverted_code = invert_tree_comparison (code, HONOR_NANS (op));
1657
1658       FOR_EACH_EDGE (e, ei, bb->succs)
1659         {
1660           enum tree_code this_code = (e->flags & EDGE_TRUE_VALUE
1661                                       ? code : inverted_code);
1662           /* invert_tree_comparison will return ERROR_MARK on FP
1663              comparisons that are not EQ/NE instead of returning proper
1664              unordered one.  Be sure it is not confused with NON_CONSTANT.
1665
1666              And if the edge's target is the final block of diamond CFG graph
1667              of this conditional statement, we do not need to compute
1668              predicate for the edge because the final block's predicate must
1669              be at least as that of the first block of the statement.  */
1670           if (this_code != ERROR_MARK
1671               && !dominated_by_p (CDI_POST_DOMINATORS, bb, e->dest))
1672             {
1673               ipa_predicate p
1674                 = add_condition (summary, params_summary, index,
1675                                  param_type, &aggpos,
1676                                  this_code, gimple_cond_rhs (last), param_ops);
1677               e->aux = edge_predicate_pool.allocate ();
1678               *(ipa_predicate *) e->aux = p;
1679             }
1680         }
1681       vec_free (param_ops);
1682       return;
1683     }
1684
1685   if (TREE_CODE (op) != SSA_NAME)
1686     return;
1687   /* Special case
1688      if (builtin_constant_p (op))
1689      constant_code
1690      else
1691      nonconstant_code.
1692      Here we can predicate nonconstant_code.  We can't
1693      really handle constant_code since we have no predicate
1694      for this and also the constant code is not known to be
1695      optimized away when inliner doesn't see operand is constant.
1696      Other optimizers might think otherwise.  */
1697   if (gimple_cond_code (last) != NE_EXPR
1698       || !integer_zerop (gimple_cond_rhs (last)))
1699     return;
1700   set_stmt = SSA_NAME_DEF_STMT (op);
1701   if (!gimple_call_builtin_p (set_stmt, BUILT_IN_CONSTANT_P)
1702       || gimple_call_num_args (set_stmt) != 1)
1703     return;
1704   op2 = gimple_call_arg (set_stmt, 0);
1705   if (!decompose_param_expr (fbi, set_stmt, op2, &index, &param_type, &aggpos))
1706     return;
1707   if (!aggpos.by_ref)
1708     add_builtin_constant_p_parm (summary, index);
1709   FOR_EACH_EDGE (e, ei, bb->succs) if (e->flags & EDGE_FALSE_VALUE)
1710     {
1711       ipa_predicate p = add_condition (summary, params_summary, index,
1712                                    param_type, &aggpos,
1713                                    ipa_predicate::is_not_constant, NULL_TREE);
1714       e->aux = edge_predicate_pool.allocate ();
1715       *(ipa_predicate *) e->aux = p;
1716     }
1717 }
1718
1719
1720 /* If BB ends by a switch we can turn into predicates, attach corresponding
1721    predicates to the CFG edges.   */
1722
1723 static void
1724 set_switch_stmt_execution_predicate (struct ipa_func_body_info *fbi,
1725                                      class ipa_fn_summary *summary,
1726                                      class ipa_node_params *params_summary,
1727                                      basic_block bb)
1728 {
1729   tree op;
1730   int index;
1731   struct agg_position_info aggpos;
1732   edge e;
1733   edge_iterator ei;
1734   size_t n;
1735   size_t case_idx;
1736   tree param_type;
1737   expr_eval_ops param_ops;
1738
1739   gswitch *last = safe_dyn_cast <gswitch *> (*gsi_last_bb (bb));
1740   if (!last)
1741     return;
1742   op = gimple_switch_index (last);
1743   if (!decompose_param_expr (fbi, last, op, &index, &param_type, &aggpos,
1744                              &param_ops))
1745     return;
1746
1747   auto_vec<std::pair<tree, tree> > ranges;
1748   tree type = TREE_TYPE (op);
1749   int bound_limit = opt_for_fn (fbi->node->decl,
1750                                 param_ipa_max_switch_predicate_bounds);
1751   int bound_count = 0;
1752   // This can safely be an integer range, as switches can only hold
1753   // integers.
1754   int_range<2> vr;
1755
1756   get_range_query (cfun)->range_of_expr (vr, op);
1757   if (vr.undefined_p ())
1758     vr.set_varying (TREE_TYPE (op));
1759   tree vr_min, vr_max;
1760   // TODO: This entire function could use a rewrite to use the irange
1761   // API, instead of trying to recreate its intersection/union logic.
1762   // Any use of get_legacy_range() is a serious code smell.
1763   value_range_kind vr_type = get_legacy_range (vr, vr_min, vr_max);
1764   wide_int vr_wmin = wi::to_wide (vr_min);
1765   wide_int vr_wmax = wi::to_wide (vr_max);
1766
1767   FOR_EACH_EDGE (e, ei, bb->succs)
1768     {
1769       e->aux = edge_predicate_pool.allocate ();
1770       *(ipa_predicate *) e->aux = false;
1771     }
1772
1773   e = gimple_switch_edge (cfun, last, 0);
1774   /* Set BOUND_COUNT to maximum count to bypass computing predicate for
1775      default case if its target basic block is in convergence point of all
1776      switch cases, which can be determined by checking whether it
1777      post-dominates the switch statement.  */
1778   if (dominated_by_p (CDI_POST_DOMINATORS, bb, e->dest))
1779     bound_count = INT_MAX;
1780
1781   n = gimple_switch_num_labels (last);
1782   for (case_idx = 1; case_idx < n; ++case_idx)
1783     {
1784       tree cl = gimple_switch_label (last, case_idx);
1785       tree min = CASE_LOW (cl);
1786       tree max = CASE_HIGH (cl);
1787       ipa_predicate p;
1788
1789       e = gimple_switch_edge (cfun, last, case_idx);
1790
1791       /* The case value might not have same type as switch expression,
1792          extend the value based on the expression type.  */
1793       if (TREE_TYPE (min) != type)
1794         min = wide_int_to_tree (type, wi::to_wide (min));
1795
1796       if (!max)
1797         max = min;
1798       else if (TREE_TYPE (max) != type)
1799         max = wide_int_to_tree (type, wi::to_wide (max));
1800
1801       /* The case's target basic block is in convergence point of all switch
1802          cases, its predicate should be at least as that of the switch
1803          statement.  */
1804       if (dominated_by_p (CDI_POST_DOMINATORS, bb, e->dest))
1805         p = true;
1806       else if (min == max)
1807         p = add_condition (summary, params_summary, index, param_type,
1808                            &aggpos, EQ_EXPR, min, param_ops);
1809       else
1810         {
1811           ipa_predicate p1, p2;
1812           p1 = add_condition (summary, params_summary, index, param_type,
1813                               &aggpos, GE_EXPR, min, param_ops);
1814           p2 = add_condition (summary,  params_summary,index, param_type,
1815                               &aggpos, LE_EXPR, max, param_ops);
1816           p = p1 & p2;
1817         }
1818       *(ipa_predicate *) e->aux
1819         = p.or_with (summary->conds, *(ipa_predicate *) e->aux);
1820
1821       /* If there are too many disjoint case ranges, predicate for default
1822          case might become too complicated.  So add a limit here.  */
1823       if (bound_count > bound_limit)
1824         continue;
1825
1826       bool new_range = true;
1827
1828       if (!ranges.is_empty ())
1829         {
1830           wide_int curr_wmin = wi::to_wide (min);
1831           wide_int last_wmax = wi::to_wide (ranges.last ().second);
1832
1833           /* Merge case ranges if they are continuous.  */
1834           if (curr_wmin == last_wmax + 1)
1835             new_range = false;
1836           else if (vr_type == VR_ANTI_RANGE)
1837             {
1838               /* If two disjoint case ranges can be connected by anti-range
1839                  of switch index, combine them to one range.  */
1840               if (wi::lt_p (vr_wmax, curr_wmin - 1, TYPE_SIGN (type)))
1841                 vr_type = VR_UNDEFINED;
1842               else if (wi::le_p (vr_wmin, last_wmax + 1, TYPE_SIGN (type)))
1843                 new_range = false;
1844             }
1845         }
1846
1847       /* Create/extend a case range.  And we count endpoints of range set,
1848          this number nearly equals to number of conditions that we will create
1849          for predicate of default case.  */
1850       if (new_range)
1851         {
1852           bound_count += (min == max) ? 1 : 2;
1853           ranges.safe_push (std::make_pair (min, max));
1854         }
1855       else
1856         {
1857           bound_count += (ranges.last ().first == ranges.last ().second);
1858           ranges.last ().second = max;
1859         }
1860     }
1861
1862   e = gimple_switch_edge (cfun, last, 0);
1863   if (bound_count > bound_limit)
1864     {
1865       *(ipa_predicate *) e->aux = true;
1866       vec_free (param_ops);
1867       return;
1868     }
1869
1870   ipa_predicate p_seg = true;
1871   ipa_predicate p_all = false;
1872
1873   if (vr_type != VR_RANGE)
1874     {
1875       vr_wmin = wi::to_wide (TYPE_MIN_VALUE (type));
1876       vr_wmax = wi::to_wide (TYPE_MAX_VALUE (type));
1877     }
1878
1879   /* Construct predicate to represent default range set that is negation of
1880      all case ranges.  Case range is classified as containing single/non-single
1881      values.  Suppose a piece of case ranges in the following.
1882
1883                 [D1...D2]  [S1] ... [Sn]  [D3...D4]
1884
1885      To represent default case's range sets between two non-single value
1886      case ranges (From D2 to D3), we construct predicate as:
1887
1888               D2 < x < D3 && x != S1 && ... && x != Sn
1889    */
1890   for (size_t i = 0; i < ranges.length (); i++)
1891     {
1892       tree min = ranges[i].first;
1893       tree max = ranges[i].second;
1894
1895       if (min == max)
1896         p_seg &= add_condition (summary, params_summary, index,
1897                                 param_type, &aggpos, NE_EXPR,
1898                                 min, param_ops);
1899       else
1900         {
1901           /* Do not create sub-predicate for range that is beyond low bound
1902              of switch index.  */
1903           if (wi::lt_p (vr_wmin, wi::to_wide (min), TYPE_SIGN (type)))
1904             {
1905               p_seg &= add_condition (summary, params_summary, index,
1906                                       param_type, &aggpos,
1907                                       LT_EXPR, min, param_ops);
1908               p_all = p_all.or_with (summary->conds, p_seg);
1909             }
1910
1911           /* Do not create sub-predicate for range that is beyond up bound
1912              of switch index.  */
1913           if (wi::le_p (vr_wmax, wi::to_wide (max), TYPE_SIGN (type)))
1914             {
1915               p_seg = false;
1916               break;
1917             }
1918
1919           p_seg = add_condition (summary, params_summary, index,
1920                                  param_type, &aggpos, GT_EXPR,
1921                                  max, param_ops);
1922         }
1923     }
1924
1925   p_all = p_all.or_with (summary->conds, p_seg);
1926   *(ipa_predicate *) e->aux
1927     = p_all.or_with (summary->conds, *(ipa_predicate *) e->aux);
1928
1929   vec_free (param_ops);
1930 }
1931
1932
1933 /* For each BB in NODE attach to its AUX pointer predicate under
1934    which it is executable.  */
1935
1936 static void
1937 compute_bb_predicates (struct ipa_func_body_info *fbi,
1938                        struct cgraph_node *node,
1939                        class ipa_fn_summary *summary,
1940                        class ipa_node_params *params_summary)
1941 {
1942   struct function *my_function = DECL_STRUCT_FUNCTION (node->decl);
1943   bool done = false;
1944   basic_block bb;
1945
1946   FOR_EACH_BB_FN (bb, my_function)
1947     {
1948       set_cond_stmt_execution_predicate (fbi, summary, params_summary, bb);
1949       set_switch_stmt_execution_predicate (fbi, summary, params_summary, bb);
1950     }
1951
1952   /* Entry block is always executable.  */
1953   ENTRY_BLOCK_PTR_FOR_FN (my_function)->aux
1954     = edge_predicate_pool.allocate ();
1955   *(ipa_predicate *) ENTRY_BLOCK_PTR_FOR_FN (my_function)->aux = true;
1956
1957   /* A simple dataflow propagation of predicates forward in the CFG.
1958      TODO: work in reverse postorder.  */
1959   while (!done)
1960     {
1961       done = true;
1962       FOR_EACH_BB_FN (bb, my_function)
1963         {
1964           ipa_predicate p = false;
1965           edge e;
1966           edge_iterator ei;
1967           FOR_EACH_EDGE (e, ei, bb->preds)
1968             {
1969               if (e->src->aux)
1970                 {
1971                   ipa_predicate this_bb_predicate
1972                     = *(ipa_predicate *) e->src->aux;
1973                   if (e->aux)
1974                     this_bb_predicate &= (*(ipa_predicate *) e->aux);
1975                   p = p.or_with (summary->conds, this_bb_predicate);
1976                   if (p == true)
1977                     break;
1978                 }
1979             }
1980           if (p != false)
1981             {
1982               basic_block pdom_bb;
1983
1984               if (!bb->aux)
1985                 {
1986                   done = false;
1987                   bb->aux = edge_predicate_pool.allocate ();
1988                   *((ipa_predicate *) bb->aux) = p;
1989                 }
1990               else if (p != *(ipa_predicate *) bb->aux)
1991                 {
1992                   /* This OR operation is needed to ensure monotonous data flow
1993                      in the case we hit the limit on number of clauses and the
1994                      and/or operations above give approximate answers.  */
1995                   p = p.or_with (summary->conds, *(ipa_predicate *)bb->aux);
1996                   if (p != *(ipa_predicate *)bb->aux)
1997                     {
1998                       done = false;
1999                       *((ipa_predicate *)bb->aux) = p;
2000                     }
2001                 }
2002
2003               /* For switch/if statement, we can OR-combine predicates of all
2004                  its cases/branches to get predicate for basic block in their
2005                  convergence point, but sometimes this will generate very
2006                  complicated predicate.  Actually, we can get simplified
2007                  predicate in another way by using the fact that predicate
2008                  for a basic block must also hold true for its post dominators.
2009                  To be specific, basic block in convergence point of
2010                  conditional statement should include predicate of the
2011                  statement.  */
2012               pdom_bb = get_immediate_dominator (CDI_POST_DOMINATORS, bb);
2013               if (pdom_bb == EXIT_BLOCK_PTR_FOR_FN (my_function) || !pdom_bb)
2014                 ;
2015               else if (!pdom_bb->aux)
2016                 {
2017                   done = false;
2018                   pdom_bb->aux = edge_predicate_pool.allocate ();
2019                   *((ipa_predicate *)pdom_bb->aux) = p;
2020                 }
2021               else if (p != *(ipa_predicate *)pdom_bb->aux)
2022                 {
2023                   p = p.or_with (summary->conds,
2024                                  *(ipa_predicate *)pdom_bb->aux);
2025                   if (p != *(ipa_predicate *)pdom_bb->aux)
2026                     {
2027                       done = false;
2028                       *((ipa_predicate *)pdom_bb->aux) = p;
2029                     }
2030                 }
2031             }
2032         }
2033     }
2034 }
2035
2036
2037 /* Return predicate specifying when the STMT might have result that is not
2038    a compile time constant.  */
2039
2040 static ipa_predicate
2041 will_be_nonconstant_expr_predicate (ipa_func_body_info *fbi,
2042                                     class ipa_fn_summary *summary,
2043                                     class ipa_node_params *params_summary,
2044                                     tree expr,
2045                                     vec<ipa_predicate> nonconstant_names)
2046 {
2047   tree parm;
2048   int index;
2049
2050   while (UNARY_CLASS_P (expr))
2051     expr = TREE_OPERAND (expr, 0);
2052
2053   parm = unmodified_parm (fbi, NULL, expr, NULL);
2054   if (parm && (index = ipa_get_param_decl_index (fbi->info, parm)) >= 0)
2055     return add_condition (summary, params_summary, index, TREE_TYPE (parm), NULL,
2056                           ipa_predicate::changed, NULL_TREE);
2057   if (is_gimple_min_invariant (expr))
2058     return false;
2059   if (TREE_CODE (expr) == SSA_NAME)
2060     return nonconstant_names[SSA_NAME_VERSION (expr)];
2061   if (BINARY_CLASS_P (expr) || COMPARISON_CLASS_P (expr))
2062     {
2063       ipa_predicate p1
2064         = will_be_nonconstant_expr_predicate (fbi, summary,
2065                                               params_summary,
2066                                               TREE_OPERAND (expr, 0),
2067                                               nonconstant_names);
2068       if (p1 == true)
2069         return p1;
2070
2071       ipa_predicate p2
2072         = will_be_nonconstant_expr_predicate (fbi, summary,
2073                                               params_summary,
2074                                               TREE_OPERAND (expr, 1),
2075                                               nonconstant_names);
2076       return p1.or_with (summary->conds, p2);
2077     }
2078   else if (TREE_CODE (expr) == COND_EXPR)
2079     {
2080       ipa_predicate p1
2081         = will_be_nonconstant_expr_predicate (fbi, summary,
2082                                               params_summary,
2083                                               TREE_OPERAND (expr, 0),
2084                                               nonconstant_names);
2085       if (p1 == true)
2086         return p1;
2087
2088       ipa_predicate p2
2089         = will_be_nonconstant_expr_predicate (fbi, summary,
2090                                               params_summary,
2091                                               TREE_OPERAND (expr, 1),
2092                                               nonconstant_names);
2093       if (p2 == true)
2094         return p2;
2095       p1 = p1.or_with (summary->conds, p2);
2096       p2 = will_be_nonconstant_expr_predicate (fbi, summary,
2097                                                params_summary,
2098                                                TREE_OPERAND (expr, 2),
2099                                                nonconstant_names);
2100       return p2.or_with (summary->conds, p1);
2101     }
2102   else if (TREE_CODE (expr) == CALL_EXPR)
2103     return true;
2104   else
2105     {
2106       debug_tree (expr);
2107       gcc_unreachable ();
2108     }
2109 }
2110
2111
2112 /* Return predicate specifying when the STMT might have result that is not
2113    a compile time constant.  */
2114
2115 static ipa_predicate
2116 will_be_nonconstant_predicate (struct ipa_func_body_info *fbi,
2117                                class ipa_fn_summary *summary,
2118                                class ipa_node_params *params_summary,
2119                                gimple *stmt,
2120                                vec<ipa_predicate> nonconstant_names)
2121 {
2122   ipa_predicate p = true;
2123   ssa_op_iter iter;
2124   tree use;
2125   tree param_type = NULL_TREE;
2126   ipa_predicate op_non_const;
2127   bool is_load;
2128   int base_index;
2129   struct agg_position_info aggpos;
2130
2131   /* What statements might be optimized away
2132      when their arguments are constant.  */
2133   if (gimple_code (stmt) != GIMPLE_ASSIGN
2134       && gimple_code (stmt) != GIMPLE_COND
2135       && gimple_code (stmt) != GIMPLE_SWITCH
2136       && (gimple_code (stmt) != GIMPLE_CALL
2137           || !(gimple_call_flags (stmt) & ECF_CONST)))
2138     return p;
2139
2140   /* Stores will stay anyway.  */
2141   if (gimple_store_p (stmt))
2142     return p;
2143
2144   is_load = gimple_assign_load_p (stmt);
2145
2146   /* Loads can be optimized when the value is known.  */
2147   if (is_load)
2148     {
2149       tree op = gimple_assign_rhs1 (stmt);
2150       if (!decompose_param_expr (fbi, stmt, op, &base_index, &param_type,
2151                                  &aggpos))
2152         return p;
2153     }
2154   else
2155     base_index = -1;
2156
2157   /* See if we understand all operands before we start
2158      adding conditionals.  */
2159   FOR_EACH_SSA_TREE_OPERAND (use, stmt, iter, SSA_OP_USE)
2160     {
2161       tree parm = unmodified_parm (fbi, stmt, use, NULL);
2162       /* For arguments we can build a condition.  */
2163       if (parm && ipa_get_param_decl_index (fbi->info, parm) >= 0)
2164         continue;
2165       if (TREE_CODE (use) != SSA_NAME)
2166         return p;
2167       /* If we know when operand is constant,
2168          we still can say something useful.  */
2169       if (nonconstant_names[SSA_NAME_VERSION (use)] != true)
2170         continue;
2171       return p;
2172     }
2173
2174   if (is_load)
2175     op_non_const =
2176       add_condition (summary, params_summary,
2177                      base_index, param_type, &aggpos,
2178                      ipa_predicate::changed, NULL_TREE);
2179   else
2180     op_non_const = false;
2181   FOR_EACH_SSA_TREE_OPERAND (use, stmt, iter, SSA_OP_USE)
2182     {
2183       tree parm = unmodified_parm (fbi, stmt, use, NULL);
2184       int index;
2185
2186       if (parm && (index = ipa_get_param_decl_index (fbi->info, parm)) >= 0)
2187         {
2188           if (index != base_index)
2189             p = add_condition (summary, params_summary, index,
2190                                TREE_TYPE (parm), NULL,
2191                                ipa_predicate::changed, NULL_TREE);
2192           else
2193             continue;
2194         }
2195       else
2196         p = nonconstant_names[SSA_NAME_VERSION (use)];
2197       op_non_const = p.or_with (summary->conds, op_non_const);
2198     }
2199   if ((gimple_code (stmt) == GIMPLE_ASSIGN || gimple_code (stmt) == GIMPLE_CALL)
2200       && gimple_op (stmt, 0)
2201       && TREE_CODE (gimple_op (stmt, 0)) == SSA_NAME)
2202     nonconstant_names[SSA_NAME_VERSION (gimple_op (stmt, 0))]
2203       = op_non_const;
2204   return op_non_const;
2205 }
2206
/* Data passed to the record_modified callback by param_change_prob.  */

struct record_modified_bb_info
{
  /* The operand being analyzed; record_modified only prints it in dump
     output.  */
  tree op;
  /* Indexes of basic blocks where the value may be set.  */
  bitmap bb_set;
  /* The statement the analysis is done for; a virtual definition made by
     this very statement is not recorded.  */
  gimple *stmt;
};
2213
2214 /* Value is initialized in INIT_BB and used in USE_BB.  We want to compute
2215    probability how often it changes between USE_BB.
2216    INIT_BB->count/USE_BB->count is an estimate, but if INIT_BB
2217    is in different loop nest, we can do better.
2218    This is all just estimate.  In theory we look for minimal cut separating
2219    INIT_BB and USE_BB, but we only want to anticipate loop invariant motion
2220    anyway.  */
2221
2222 static basic_block
2223 get_minimal_bb (basic_block init_bb, basic_block use_bb)
2224 {
2225   class loop *l = find_common_loop (init_bb->loop_father, use_bb->loop_father);
2226   if (l && l->header->count < init_bb->count)
2227     return l->header;
2228   return init_bb;
2229 }
2230
2231 /* Callback of walk_aliased_vdefs.  Records basic blocks where the value may be
2232    set except for info->stmt.  */
2233
2234 static bool
2235 record_modified (ao_ref *ao ATTRIBUTE_UNUSED, tree vdef, void *data)
2236 {
2237   struct record_modified_bb_info *info =
2238     (struct record_modified_bb_info *) data;
2239   if (SSA_NAME_DEF_STMT (vdef) == info->stmt)
2240     return false;
2241   if (gimple_clobber_p (SSA_NAME_DEF_STMT (vdef)))
2242     return false;
2243   bitmap_set_bit (info->bb_set,
2244                   SSA_NAME_IS_DEFAULT_DEF (vdef)
2245                   ? ENTRY_BLOCK_PTR_FOR_FN (cfun)->index
2246                   : get_minimal_bb
2247                          (gimple_bb (SSA_NAME_DEF_STMT (vdef)),
2248                           gimple_bb (info->stmt))->index);
2249   if (dump_file)
2250     {
2251       fprintf (dump_file, "     Param ");
2252       print_generic_expr (dump_file, info->op, TDF_SLIM);
2253       fprintf (dump_file, " changed at bb %i, minimal: %i stmt: ",
2254                gimple_bb (SSA_NAME_DEF_STMT (vdef))->index,
2255                get_minimal_bb
2256                          (gimple_bb (SSA_NAME_DEF_STMT (vdef)),
2257                           gimple_bb (info->stmt))->index);
2258       print_gimple_stmt (dump_file, SSA_NAME_DEF_STMT (vdef), 0);
2259     }
2260   return false;
2261 }
2262
2263 /* Return probability (based on REG_BR_PROB_BASE) that I-th parameter of STMT
2264    will change since last invocation of STMT.
2265
2266    Value 0 is reserved for compile time invariants.
2267    For common parameters it is REG_BR_PROB_BASE.  For loop invariants it
2268    ought to be REG_BR_PROB_BASE / estimated_iters.  */
2269
2270 static int
2271 param_change_prob (ipa_func_body_info *fbi, gimple *stmt, int i)
2272 {
2273   tree op = gimple_call_arg (stmt, i);
2274   basic_block bb = gimple_bb (stmt);
2275
2276   if (TREE_CODE (op) == WITH_SIZE_EXPR)
2277     op = TREE_OPERAND (op, 0);
2278
2279   tree base = get_base_address (op);
2280
2281   /* Global invariants never change.  */
2282   if (is_gimple_min_invariant (base))
2283     return 0;
2284
2285   /* We would have to do non-trivial analysis to really work out what
2286      is the probability of value to change (i.e. when init statement
2287      is in a sibling loop of the call).
2288
2289      We do an conservative estimate: when call is executed N times more often
2290      than the statement defining value, we take the frequency 1/N.  */
2291   if (TREE_CODE (base) == SSA_NAME)
2292     {
2293       profile_count init_count;
2294
2295       if (!bb->count.nonzero_p ())
2296         return REG_BR_PROB_BASE;
2297
2298       if (SSA_NAME_IS_DEFAULT_DEF (base))
2299         init_count = ENTRY_BLOCK_PTR_FOR_FN (cfun)->count;
2300       else
2301         init_count = get_minimal_bb
2302                       (gimple_bb (SSA_NAME_DEF_STMT (base)),
2303                        gimple_bb (stmt))->count;
2304
2305       if (init_count < bb->count)
2306         return MAX ((init_count.to_sreal_scale (bb->count)
2307                      * REG_BR_PROB_BASE).to_int (), 1);
2308       return REG_BR_PROB_BASE;
2309     }
2310   else
2311     {
2312       ao_ref refd;
2313       profile_count max = ENTRY_BLOCK_PTR_FOR_FN (cfun)->count;
2314       struct record_modified_bb_info info;
2315       tree init = ctor_for_folding (base);
2316
2317       if (init != error_mark_node)
2318         return 0;
2319       if (!bb->count.nonzero_p () || fbi->aa_walk_budget == 0)
2320         return REG_BR_PROB_BASE;
2321       if (dump_file)
2322         {
2323           fprintf (dump_file, "     Analyzing param change probability of ");
2324           print_generic_expr (dump_file, op, TDF_SLIM);
2325           fprintf (dump_file, "\n");
2326         }
2327       ao_ref_init (&refd, op);
2328       info.op = op;
2329       info.stmt = stmt;
2330       info.bb_set = BITMAP_ALLOC (NULL);
2331       int walked
2332         = walk_aliased_vdefs (&refd, gimple_vuse (stmt), record_modified, &info,
2333                               NULL, NULL, fbi->aa_walk_budget);
2334       if (walked > 0)
2335         fbi->aa_walk_budget -= walked;
2336       if (walked < 0 || bitmap_bit_p (info.bb_set, bb->index))
2337         {
2338           if (walked < 0)
2339             fbi->aa_walk_budget = 0;
2340           if (dump_file)
2341             {
2342               if (walked < 0)
2343                 fprintf (dump_file, "     Ran out of AA walking budget.\n");
2344               else
2345                 fprintf (dump_file, "     Set in same BB as used.\n");
2346             }
2347           BITMAP_FREE (info.bb_set);
2348           return REG_BR_PROB_BASE;
2349         }
2350
2351       bitmap_iterator bi;
2352       unsigned index;
2353       /* Lookup the most frequent update of the value and believe that
2354          it dominates all the other; precise analysis here is difficult.  */
2355       EXECUTE_IF_SET_IN_BITMAP (info.bb_set, 0, index, bi)
2356         max = max.max (BASIC_BLOCK_FOR_FN (cfun, index)->count);
2357       if (dump_file)
2358         {
2359           fprintf (dump_file, "     Set with count ");
2360           max.dump (dump_file);
2361           fprintf (dump_file, " and used with count ");
2362           bb->count.dump (dump_file);
2363           fprintf (dump_file, " freq %f\n",
2364                    max.to_sreal_scale (bb->count).to_double ());
2365         }
2366
2367       BITMAP_FREE (info.bb_set);
2368       if (max < bb->count)
2369         return MAX ((max.to_sreal_scale (bb->count)
2370                      * REG_BR_PROB_BASE).to_int (), 1);
2371       return REG_BR_PROB_BASE;
2372     }
2373 }
2374
2375 /* Find whether a basic block BB is the final block of a (half) diamond CFG
2376    sub-graph and if the predicate the condition depends on is known.  If so,
2377    return true and store the pointer the predicate in *P.  */
2378
2379 static bool
2380 phi_result_unknown_predicate (ipa_func_body_info *fbi,
2381                               ipa_fn_summary *summary,
2382                               class ipa_node_params *params_summary,
2383                               basic_block bb,
2384                               ipa_predicate *p,
2385                               vec<ipa_predicate> nonconstant_names)
2386 {
2387   edge e;
2388   edge_iterator ei;
2389   basic_block first_bb = NULL;
2390
2391   if (single_pred_p (bb))
2392     {
2393       *p = false;
2394       return true;
2395     }
2396
2397   FOR_EACH_EDGE (e, ei, bb->preds)
2398     {
2399       if (single_succ_p (e->src))
2400         {
2401           if (!single_pred_p (e->src))
2402             return false;
2403           if (!first_bb)
2404             first_bb = single_pred (e->src);
2405           else if (single_pred (e->src) != first_bb)
2406             return false;
2407         }
2408       else
2409         {
2410           if (!first_bb)
2411             first_bb = e->src;
2412           else if (e->src != first_bb)
2413             return false;
2414         }
2415     }
2416
2417   if (!first_bb)
2418     return false;
2419
2420   gcond *stmt = safe_dyn_cast <gcond *> (*gsi_last_bb (first_bb));
2421   if (!stmt
2422       || !is_gimple_ip_invariant (gimple_cond_rhs (stmt)))
2423     return false;
2424
2425   *p = will_be_nonconstant_expr_predicate (fbi, summary, params_summary,
2426                                            gimple_cond_lhs (stmt),
2427                                            nonconstant_names);
2428   if (*p == true)
2429     return false;
2430   else
2431     return true;
2432 }
2433
2434 /* Given a PHI statement in a function described by inline properties SUMMARY
2435    and *P being the predicate describing whether the selected PHI argument is
2436    known, store a predicate for the result of the PHI statement into
2437    NONCONSTANT_NAMES, if possible.  */
2438
2439 static void
2440 predicate_for_phi_result (class ipa_fn_summary *summary, gphi *phi,
2441                           ipa_predicate *p,
2442                           vec<ipa_predicate> nonconstant_names)
2443 {
2444   unsigned i;
2445
2446   for (i = 0; i < gimple_phi_num_args (phi); i++)
2447     {
2448       tree arg = gimple_phi_arg (phi, i)->def;
2449       if (!is_gimple_min_invariant (arg))
2450         {
2451           gcc_assert (TREE_CODE (arg) == SSA_NAME);
2452           *p = p->or_with (summary->conds,
2453                            nonconstant_names[SSA_NAME_VERSION (arg)]);
2454           if (*p == true)
2455             return;
2456         }
2457     }
2458
2459   if (dump_file && (dump_flags & TDF_DETAILS))
2460     {
2461       fprintf (dump_file, "\t\tphi predicate: ");
2462       p->dump (dump_file, summary->conds);
2463     }
2464   nonconstant_names[SSA_NAME_VERSION (gimple_phi_result (phi))] = *p;
2465 }
2466
2467 /* For a typical usage of __builtin_expect (a<b, 1), we
2468    may introduce an extra relation stmt:
2469    With the builtin, we have
2470      t1 = a <= b;
2471      t2 = (long int) t1;
2472      t3 = __builtin_expect (t2, 1);
2473      if (t3 != 0)
2474        goto ...
2475    Without the builtin, we have
2476      if (a<=b)
2477        goto...
2478    This affects the size/time estimation and may have
2479    an impact on the earlier inlining.
2480    Here find this pattern and fix it up later.  */
2481
2482 static gimple *
2483 find_foldable_builtin_expect (basic_block bb)
2484 {
2485   gimple_stmt_iterator bsi;
2486
2487   for (bsi = gsi_start_bb (bb); !gsi_end_p (bsi); gsi_next (&bsi))
2488     {
2489       gimple *stmt = gsi_stmt (bsi);
2490       if (gimple_call_builtin_p (stmt, BUILT_IN_EXPECT)
2491           || gimple_call_builtin_p (stmt, BUILT_IN_EXPECT_WITH_PROBABILITY)
2492           || gimple_call_internal_p (stmt, IFN_BUILTIN_EXPECT))
2493         {
2494           tree var = gimple_call_lhs (stmt);
2495           tree arg = gimple_call_arg (stmt, 0);
2496           use_operand_p use_p;
2497           gimple *use_stmt;
2498           bool match = false;
2499           bool done = false;
2500
2501           if (!var || !arg)
2502             continue;
2503           gcc_assert (TREE_CODE (var) == SSA_NAME);
2504
2505           while (TREE_CODE (arg) == SSA_NAME)
2506             {
2507               gimple *stmt_tmp = SSA_NAME_DEF_STMT (arg);
2508               if (!is_gimple_assign (stmt_tmp))
2509                 break;
2510               switch (gimple_assign_rhs_code (stmt_tmp))
2511                 {
2512                   case LT_EXPR:
2513                   case LE_EXPR:
2514                   case GT_EXPR:
2515                   case GE_EXPR:
2516                   case EQ_EXPR:
2517                   case NE_EXPR:
2518                     match = true;
2519                     done = true;
2520                     break;
2521                   CASE_CONVERT:
2522                     break;
2523                   default:
2524                     done = true;
2525                     break;
2526                 }
2527               if (done)
2528                 break;
2529               arg = gimple_assign_rhs1 (stmt_tmp);
2530             }
2531
2532           if (match && single_imm_use (var, &use_p, &use_stmt)
2533               && gimple_code (use_stmt) == GIMPLE_COND)
2534             return use_stmt;
2535         }
2536     }
2537   return NULL;
2538 }
2539
2540 /* Return true when the basic blocks contains only clobbers followed by RESX.
2541    Such BBs are kept around to make removal of dead stores possible with
2542    presence of EH and will be optimized out by optimize_clobbers later in the
2543    game.
2544
2545    NEED_EH is used to recurse in case the clobber has non-EH predecessors
2546    that can be clobber only, too.. When it is false, the RESX is not necessary
2547    on the end of basic block.  */
2548
2549 static bool
2550 clobber_only_eh_bb_p (basic_block bb, bool need_eh = true)
2551 {
2552   gimple_stmt_iterator gsi = gsi_last_bb (bb);
2553   edge_iterator ei;
2554   edge e;
2555
2556   if (need_eh)
2557     {
2558       if (gsi_end_p (gsi))
2559         return false;
2560       if (gimple_code (gsi_stmt (gsi)) != GIMPLE_RESX)
2561         return false;
2562       gsi_prev (&gsi);
2563     }
2564   else if (!single_succ_p (bb))
2565     return false;
2566
2567   for (; !gsi_end_p (gsi); gsi_prev (&gsi))
2568     {
2569       gimple *stmt = gsi_stmt (gsi);
2570       if (is_gimple_debug (stmt))
2571         continue;
2572       if (gimple_clobber_p (stmt))
2573         continue;
2574       if (gimple_code (stmt) == GIMPLE_LABEL)
2575         break;
2576       return false;
2577     }
2578
2579   /* See if all predecessors are either throws or clobber only BBs.  */
2580   FOR_EACH_EDGE (e, ei, bb->preds)
2581     if (!(e->flags & EDGE_EH)
2582         && !clobber_only_eh_bb_p (e->src, false))
2583       return false;
2584
2585   return true;
2586 }
2587
2588 /* Return true if STMT compute a floating point expression that may be affected
2589    by -ffast-math and similar flags.  */
2590
2591 static bool
2592 fp_expression_p (gimple *stmt)
2593 {
2594   ssa_op_iter i;
2595   tree op;
2596
2597   FOR_EACH_SSA_TREE_OPERAND (op, stmt, i, SSA_OP_DEF|SSA_OP_USE)
2598     if (FLOAT_TYPE_P (TREE_TYPE (op)))
2599       return true;
2600   return false;
2601 }
2602
2603 /* Return true if T references memory location that is local
2604    for the function (that means, dead after return) or read-only.  */
2605
2606 bool
2607 refs_local_or_readonly_memory_p (tree t)
2608 {
2609   /* Non-escaping memory is fine.  */
2610   t = get_base_address (t);
2611   if ((TREE_CODE (t) == MEM_REF
2612       || TREE_CODE (t) == TARGET_MEM_REF))
2613     return points_to_local_or_readonly_memory_p (TREE_OPERAND (t, 0));
2614
2615   /* Automatic variables are fine.  */
2616   if (DECL_P (t)
2617       && auto_var_in_fn_p (t, current_function_decl))
2618     return true;
2619
2620   /* Read-only variables are fine.  */
2621   if (DECL_P (t) && TREE_READONLY (t))
2622     return true;
2623
2624   return false;
2625 }
2626
2627 /* Return true if T is a pointer pointing to memory location that is local
2628    for the function (that means, dead after return) or read-only.  */
2629
2630 bool
2631 points_to_local_or_readonly_memory_p (tree t)
2632 {
2633   /* See if memory location is clearly invalid.  */
2634   if (integer_zerop (t))
2635     return flag_delete_null_pointer_checks;
2636   if (TREE_CODE (t) == SSA_NAME)
2637     {
2638       /* For IPA passes we can consinder accesses to return slot local
2639          even if it is not local in the sense that memory is dead by
2640          the end of founction.
2641          The outer function will see a store in the call assignment
2642          and thus this will do right thing for all uses of this
2643          function in the current IPA passes (modref, pure/const discovery
2644          and inlining heuristics).  */
2645       if (DECL_RESULT (current_function_decl)
2646           && DECL_BY_REFERENCE (DECL_RESULT (current_function_decl))
2647           && t == ssa_default_def (cfun, DECL_RESULT (current_function_decl)))
2648         return true;
2649       return !ptr_deref_may_alias_global_p (t, false);
2650     }
2651   if (TREE_CODE (t) == ADDR_EXPR)
2652     return refs_local_or_readonly_memory_p (TREE_OPERAND (t, 0));
2653   return false;
2654 }
2655
2656 /* Return true if T is a pointer pointing to memory location that is possible
2657    sra candidate if all functions it is passed to are inlined.  */
2658
2659 static bool
2660 points_to_possible_sra_candidate_p (tree t)
2661 {
2662   if (TREE_CODE (t) != ADDR_EXPR)
2663     return false;
2664
2665   t = get_base_address (TREE_OPERAND (t, 0));
2666
2667   /* Automatic variables are fine.  */
2668   if (DECL_P (t)
2669       && auto_var_in_fn_p (t, current_function_decl))
2670     return true;
2671   return false;
2672 }
2673
2674 /* Analyze function body for NODE.
2675    EARLY indicates run from early optimization pipeline.  */
2676
2677 static void
2678 analyze_function_body (struct cgraph_node *node, bool early)
2679 {
2680   sreal time = opt_for_fn (node->decl, param_uninlined_function_time);
2681   /* Estimate static overhead for function prologue/epilogue and alignment. */
2682   int size = opt_for_fn (node->decl, param_uninlined_function_insns);
2683   /* Benefits are scaled by probability of elimination that is in range
2684      <0,2>.  */
2685   basic_block bb;
2686   struct function *my_function = DECL_STRUCT_FUNCTION (node->decl);
2687   sreal freq;
2688   class ipa_fn_summary *info = ipa_fn_summaries->get_create (node);
2689   ipa_node_params *params_summary
2690     = early ? NULL : ipa_node_params_sum->get (node);
2691   ipa_predicate bb_predicate;
2692   struct ipa_func_body_info fbi;
2693   vec<ipa_predicate> nonconstant_names = vNULL;
2694   int nblocks, n;
2695   int *order;
2696   gimple *fix_builtin_expect_stmt;
2697
2698   gcc_assert (my_function && my_function->cfg);
2699   gcc_assert (cfun == my_function);
2700
2701   memset(&fbi, 0, sizeof(fbi));
2702   vec_free (info->conds);
2703   info->conds = NULL;
2704   info->size_time_table.release ();
2705   info->call_size_time_table.release ();
2706
2707   /* When optimizing and analyzing for IPA inliner, initialize loop optimizer
2708      so we can produce proper inline hints.
2709
2710      When optimizing and analyzing for early inliner, initialize node params
2711      so we can produce correct BB predicates.  */
2712
2713   if (opt_for_fn (node->decl, optimize))
2714     {
2715       calculate_dominance_info (CDI_DOMINATORS);
2716       calculate_dominance_info (CDI_POST_DOMINATORS);
2717       if (!early)
2718         loop_optimizer_init (LOOPS_NORMAL | LOOPS_HAVE_RECORDED_EXITS);
2719       else
2720         {
2721           ipa_check_create_node_params ();
2722           ipa_initialize_node_params (node);
2723         }
2724
2725       if (ipa_node_params_sum)
2726         {
2727           fbi.node = node;
2728           fbi.info = ipa_node_params_sum->get (node);
2729           fbi.bb_infos = vNULL;
2730           fbi.bb_infos.safe_grow_cleared (last_basic_block_for_fn (cfun), true);
2731           fbi.param_count = count_formal_params (node->decl);
2732           fbi.aa_walk_budget = opt_for_fn (node->decl, param_ipa_max_aa_steps);
2733
2734           nonconstant_names.safe_grow_cleared
2735             (SSANAMES (my_function)->length (), true);
2736         }
2737     }
2738
2739   if (dump_file)
2740     fprintf (dump_file, "\nAnalyzing function body size: %s\n",
2741              node->dump_name ());
2742
2743   /* When we run into maximal number of entries, we assign everything to the
2744      constant truth case.  Be sure to have it in list. */
2745   bb_predicate = true;
2746   info->account_size_time (0, 0, bb_predicate, bb_predicate);
2747
2748   bb_predicate = ipa_predicate::not_inlined ();
2749   info->account_size_time (opt_for_fn (node->decl,
2750                                 param_uninlined_function_insns)
2751                            * ipa_fn_summary::size_scale,
2752                            opt_for_fn (node->decl,
2753                                 param_uninlined_function_time),
2754                            bb_predicate,
2755                            bb_predicate);
2756
2757   /* Only look for target information for inlinable functions.  */
2758   bool scan_for_target_info =
2759     info->inlinable
2760     && targetm.target_option.need_ipa_fn_target_info (node->decl,
2761                                                       info->target_info);
2762
2763   if (fbi.info)
2764     compute_bb_predicates (&fbi, node, info, params_summary);
2765   const profile_count entry_count = ENTRY_BLOCK_PTR_FOR_FN (cfun)->count;
2766   order = XNEWVEC (int, n_basic_blocks_for_fn (cfun));
2767   nblocks = pre_and_rev_post_order_compute (NULL, order, false);
2768   for (n = 0; n < nblocks; n++)
2769     {
2770       bb = BASIC_BLOCK_FOR_FN (cfun, order[n]);
2771       freq = bb->count.to_sreal_scale (entry_count);
2772       if (clobber_only_eh_bb_p (bb))
2773         {
2774           if (dump_file && (dump_flags & TDF_DETAILS))
2775             fprintf (dump_file, "\n Ignoring BB %i;"
2776                      " it will be optimized away by cleanup_clobbers\n",
2777                      bb->index);
2778           continue;
2779         }
2780
2781       /* TODO: Obviously predicates can be propagated down across CFG.  */
2782       if (fbi.info)
2783         {
2784           if (bb->aux)
2785             bb_predicate = *(ipa_predicate *)bb->aux;
2786           else
2787             bb_predicate = false;
2788         }
2789       else
2790         bb_predicate = true;
2791
2792       if (dump_file && (dump_flags & TDF_DETAILS))
2793         {
2794           fprintf (dump_file, "\n BB %i predicate:", bb->index);
2795           bb_predicate.dump (dump_file, info->conds);
2796         }
2797
2798       if (fbi.info && nonconstant_names.exists ())
2799         {
2800           ipa_predicate phi_predicate;
2801           bool first_phi = true;
2802
2803           for (gphi_iterator bsi = gsi_start_phis (bb); !gsi_end_p (bsi);
2804                gsi_next (&bsi))
2805             {
2806               if (first_phi
2807                   && !phi_result_unknown_predicate (&fbi, info,
2808                                                     params_summary,
2809                                                     bb,
2810                                                     &phi_predicate,
2811                                                     nonconstant_names))
2812                 break;
2813               first_phi = false;
2814               if (dump_file && (dump_flags & TDF_DETAILS))
2815                 {
2816                   fprintf (dump_file, "  ");
2817                   print_gimple_stmt (dump_file, gsi_stmt (bsi), 0);
2818                 }
2819               predicate_for_phi_result (info, bsi.phi (), &phi_predicate,
2820                                         nonconstant_names);
2821             }
2822         }
2823
2824       fix_builtin_expect_stmt = find_foldable_builtin_expect (bb);
2825
2826       for (gimple_stmt_iterator bsi = gsi_start_nondebug_bb (bb);
2827            !gsi_end_p (bsi); gsi_next_nondebug (&bsi))
2828         {
2829           gimple *stmt = gsi_stmt (bsi);
2830           int this_size = estimate_num_insns (stmt, &eni_size_weights);
2831           int this_time = estimate_num_insns (stmt, &eni_time_weights);
2832           int prob;
2833           ipa_predicate will_be_nonconstant;
2834
2835           /* This relation stmt should be folded after we remove
2836              __builtin_expect call. Adjust the cost here.  */
2837           if (stmt == fix_builtin_expect_stmt)
2838             {
2839               this_size--;
2840               this_time--;
2841             }
2842
2843           if (dump_file && (dump_flags & TDF_DETAILS))
2844             {
2845               fprintf (dump_file, "  ");
2846               print_gimple_stmt (dump_file, stmt, 0);
2847               fprintf (dump_file, "\t\tfreq:%3.2f size:%3i time:%3i\n",
2848                        freq.to_double (), this_size,
2849                        this_time);
2850             }
2851
2852           if (is_gimple_call (stmt)
2853               && !gimple_call_internal_p (stmt))
2854             {
2855               struct cgraph_edge *edge = node->get_edge (stmt);
2856               ipa_call_summary *es = ipa_call_summaries->get_create (edge);
2857
2858               /* Special case: results of BUILT_IN_CONSTANT_P will be always
2859                  resolved as constant.  We however don't want to optimize
2860                  out the cgraph edges.  */
2861               if (nonconstant_names.exists ()
2862                   && gimple_call_builtin_p (stmt, BUILT_IN_CONSTANT_P)
2863                   && gimple_call_lhs (stmt)
2864                   && TREE_CODE (gimple_call_lhs (stmt)) == SSA_NAME)
2865                 {
2866                   ipa_predicate false_p = false;
2867                   nonconstant_names[SSA_NAME_VERSION (gimple_call_lhs (stmt))]
2868                     = false_p;
2869                 }
2870               if (ipa_node_params_sum)
2871                 {
2872                   int count = gimple_call_num_args (stmt);
2873                   int i;
2874
2875                   if (count)
2876                     es->param.safe_grow_cleared (count, true);
2877                   for (i = 0; i < count; i++)
2878                     {
2879                       int prob = param_change_prob (&fbi, stmt, i);
2880                       gcc_assert (prob >= 0 && prob <= REG_BR_PROB_BASE);
2881                       es->param[i].change_prob = prob;
2882                       es->param[i].points_to_local_or_readonly_memory
2883                          = points_to_local_or_readonly_memory_p
2884                              (gimple_call_arg (stmt, i));
2885                       es->param[i].points_to_possible_sra_candidate
2886                          = points_to_possible_sra_candidate_p
2887                              (gimple_call_arg (stmt, i));
2888                     }
2889                 }
2890               /* We cannot setup VLA parameters during inlining.  */
2891               for (unsigned int i = 0; i < gimple_call_num_args (stmt); ++i)
2892                 if (TREE_CODE (gimple_call_arg (stmt, i)) == WITH_SIZE_EXPR)
2893                   {
2894                     edge->inline_failed = CIF_FUNCTION_NOT_INLINABLE;
2895                     break;
2896                   }
2897               es->call_stmt_size = this_size;
2898               es->call_stmt_time = this_time;
2899               es->loop_depth = bb_loop_depth (bb);
2900               edge_set_predicate (edge, &bb_predicate);
2901               if (edge->speculative)
2902                 {
2903                   cgraph_edge *indirect
2904                         = edge->speculative_call_indirect_edge ();
2905                   ipa_call_summary *es2
2906                          = ipa_call_summaries->get_create (indirect);
2907                   ipa_call_summaries->duplicate (edge, indirect,
2908                                                  es, es2);
2909
2910                   /* Edge is the first direct call.
2911                      create and duplicate call summaries for multiple
2912                      speculative call targets.  */
2913                   for (cgraph_edge *direct
2914                          = edge->next_speculative_call_target ();
2915                        direct;
2916                        direct = direct->next_speculative_call_target ())
2917                     {
2918                       ipa_call_summary *es3
2919                         = ipa_call_summaries->get_create (direct);
2920                       ipa_call_summaries->duplicate (edge, direct,
2921                                                      es, es3);
2922                     }
2923                 }
2924             }
2925
2926           /* TODO: When conditional jump or switch is known to be constant, but
2927              we did not translate it into the predicates, we really can account
2928              just maximum of the possible paths.  */
2929           if (fbi.info)
2930             will_be_nonconstant
2931               = will_be_nonconstant_predicate (&fbi, info, params_summary,
2932                                                stmt, nonconstant_names);
2933           else
2934             will_be_nonconstant = true;
2935           if (this_time || this_size)
2936             {
2937               sreal final_time = (sreal)this_time * freq;
2938               prob = eliminated_by_inlining_prob (&fbi, stmt);
2939               if (prob == 1 && dump_file && (dump_flags & TDF_DETAILS))
2940                 fprintf (dump_file,
2941                          "\t\t50%% will be eliminated by inlining\n");
2942               if (prob == 2 && dump_file && (dump_flags & TDF_DETAILS))
2943                 fprintf (dump_file, "\t\tWill be eliminated by inlining\n");
2944
2945               ipa_predicate p = bb_predicate & will_be_nonconstant;
2946               int parm = load_or_store_of_ptr_parameter (&fbi, stmt);
2947               ipa_predicate sra_predicate = true;
2948               if (parm != -1)
2949                 sra_predicate &= add_condition (info, params_summary, parm,
2950                                                 ptr_type_node, NULL,
2951                                                 ipa_predicate::not_sra_candidate, NULL, 0);
2952
2953               /* We can ignore statement when we proved it is never going
2954                  to happen, but we cannot do that for call statements
2955                  because edges are accounted specially.  */
2956
2957               if (*(is_gimple_call (stmt) ? &bb_predicate : &p) != false)
2958                 {
2959                   time += final_time;
2960                   size += this_size;
2961                 }
2962
2963               /* We account everything but the calls.  Calls have their own
2964                  size/time info attached to cgraph edges.  This is necessary
2965                  in order to make the cost disappear after inlining.  */
2966               if (!is_gimple_call (stmt))
2967                 {
2968                   if (prob)
2969                     {
2970                       ipa_predicate ip
2971                         = bb_predicate & ipa_predicate::not_inlined () & sra_predicate;
2972                       info->account_size_time (this_size * prob,
2973                                                (final_time * prob) / 2, ip,
2974                                                p);
2975                     }
2976                   if (prob != 2)
2977                     info->account_size_time (this_size * (2 - prob),
2978                                              (final_time * (2 - prob) / 2),
2979                                              bb_predicate & sra_predicate,
2980                                              p);
2981                 }
2982
2983               if (!info->fp_expressions && fp_expression_p (stmt))
2984                 {
2985                   info->fp_expressions = true;
2986                   if (dump_file)
2987                     fprintf (dump_file, "   fp_expression set\n");
2988                 }
2989             }
2990
2991           /* For target specific information, we want to scan all statements
2992              rather than those statements with non-zero weights, to avoid
2993              missing to scan something interesting for target information,
2994              such as: internal function calls.  */
2995           if (scan_for_target_info)
2996             scan_for_target_info =
2997               targetm.target_option.update_ipa_fn_target_info
2998               (info->target_info, stmt);
2999
3000           /* Account cost of address calculations in the statements.  */
3001           for (unsigned int i = 0; i < gimple_num_ops (stmt); i++)
3002             {
3003               for (tree op = gimple_op (stmt, i);
3004                    op && handled_component_p (op);
3005                    op = TREE_OPERAND (op, 0))
3006                 if ((TREE_CODE (op) == ARRAY_REF
3007                      || TREE_CODE (op) == ARRAY_RANGE_REF)
3008                     && TREE_CODE (TREE_OPERAND (op, 1)) == SSA_NAME)
3009                   {
3010                     ipa_predicate p = bb_predicate;
3011                     if (fbi.info)
3012                       p = p & will_be_nonconstant_expr_predicate
3013                                  (&fbi, info, params_summary,
3014                                   TREE_OPERAND (op, 1),
3015                                   nonconstant_names);
3016                     if (p != false)
3017                       {
3018                         time += freq;
3019                         size += 1;
3020                         if (dump_file)
3021                           fprintf (dump_file,
3022                                    "\t\tAccounting address calculation.\n");
3023                         info->account_size_time (ipa_fn_summary::size_scale,
3024                                                  freq,
3025                                                  bb_predicate,
3026                                                  p);
3027                       }
3028                   }
3029             }
3030
3031         }
3032     }
3033   free (order);
3034
3035   if (nonconstant_names.exists () && !early)
3036     {
3037       ipa_fn_summary *s = ipa_fn_summaries->get (node);
3038       unsigned max_loop_predicates = opt_for_fn (node->decl,
3039                                                  param_ipa_max_loop_predicates);
3040
3041       if (dump_file && (dump_flags & TDF_DETAILS))
3042         flow_loops_dump (dump_file, NULL, 0);
3043       scev_initialize ();
3044       for (auto loop : loops_list (cfun, 0))
3045         {
3046           ipa_predicate loop_iterations = true;
3047           sreal header_freq;
3048           edge ex;
3049           unsigned int j;
3050           class tree_niter_desc niter_desc;
3051           if (!loop->header->aux)
3052             continue;
3053
3054           profile_count phdr_count = loop_preheader_edge (loop)->count ();
3055           sreal phdr_freq = phdr_count.to_sreal_scale (entry_count);
3056
3057           bb_predicate = *(ipa_predicate *)loop->header->aux;
3058           auto_vec<edge> exits = get_loop_exit_edges (loop);
3059           FOR_EACH_VEC_ELT (exits, j, ex)
3060             if (number_of_iterations_exit (loop, ex, &niter_desc, false)
3061                 && !is_gimple_min_invariant (niter_desc.niter))
3062             {
3063               ipa_predicate will_be_nonconstant
3064                 = will_be_nonconstant_expr_predicate (&fbi, info,
3065                                                       params_summary,
3066                                                       niter_desc.niter,
3067                                                       nonconstant_names);
3068               if (will_be_nonconstant != true)
3069                 will_be_nonconstant = bb_predicate & will_be_nonconstant;
3070               if (will_be_nonconstant != true
3071                   && will_be_nonconstant != false)
3072                 loop_iterations &= will_be_nonconstant;
3073             }
3074           add_freqcounting_predicate (&s->loop_iterations, loop_iterations,
3075                                       phdr_freq, max_loop_predicates);
3076         }
3077
3078       /* To avoid quadratic behavior we analyze stride predicates only
3079          with respect to the containing loop.  Thus we simply iterate
3080          over all defs in the outermost loop body.  */
3081       for (class loop *loop = loops_for_fn (cfun)->tree_root->inner;
3082            loop != NULL; loop = loop->next)
3083         {
3084           ipa_predicate loop_stride = true;
3085           basic_block *body = get_loop_body (loop);
3086           profile_count phdr_count = loop_preheader_edge (loop)->count ();
3087           sreal phdr_freq = phdr_count.to_sreal_scale (entry_count);
3088           for (unsigned i = 0; i < loop->num_nodes; i++)
3089             {
3090               gimple_stmt_iterator gsi;
3091               if (!body[i]->aux)
3092                 continue;
3093
3094               bb_predicate = *(ipa_predicate *)body[i]->aux;
3095               for (gsi = gsi_start_bb (body[i]); !gsi_end_p (gsi);
3096                    gsi_next (&gsi))
3097                 {
3098                   gimple *stmt = gsi_stmt (gsi);
3099
3100                   if (!is_gimple_assign (stmt))
3101                     continue;
3102
3103                   tree def = gimple_assign_lhs (stmt);
3104                   if (TREE_CODE (def) != SSA_NAME)
3105                     continue;
3106
3107                   affine_iv iv;
3108                   if (!simple_iv (loop_containing_stmt (stmt),
3109                                   loop_containing_stmt (stmt),
3110                                   def, &iv, true)
3111                       || is_gimple_min_invariant (iv.step))
3112                     continue;
3113
3114                   ipa_predicate will_be_nonconstant
3115                     = will_be_nonconstant_expr_predicate (&fbi, info,
3116                                                           params_summary,
3117                                                           iv.step,
3118                                                           nonconstant_names);
3119                   if (will_be_nonconstant != true)
3120                     will_be_nonconstant = bb_predicate & will_be_nonconstant;
3121                   if (will_be_nonconstant != true
3122                       && will_be_nonconstant != false)
3123                     loop_stride = loop_stride & will_be_nonconstant;
3124                 }
3125             }
3126           add_freqcounting_predicate (&s->loop_strides, loop_stride,
3127                                       phdr_freq, max_loop_predicates);
3128           free (body);
3129         }
3130       scev_finalize ();
3131     }
3132   FOR_ALL_BB_FN (bb, my_function)
3133     {
3134       edge e;
3135       edge_iterator ei;
3136
3137       if (bb->aux)
3138         edge_predicate_pool.remove ((ipa_predicate *)bb->aux);
3139       bb->aux = NULL;
3140       FOR_EACH_EDGE (e, ei, bb->succs)
3141         {
3142           if (e->aux)
3143             edge_predicate_pool.remove ((ipa_predicate *)e->aux);
3144           e->aux = NULL;
3145         }
3146     }
3147   ipa_fn_summary *s = ipa_fn_summaries->get (node);
3148   ipa_size_summary *ss = ipa_size_summaries->get (node);
3149   s->time = time;
3150   ss->self_size = size;
3151   nonconstant_names.release ();
3152   ipa_release_body_info (&fbi);
3153   if (opt_for_fn (node->decl, optimize))
3154     {
3155       if (!early)
3156         loop_optimizer_finalize ();
3157       else if (!ipa_edge_args_sum)
3158         ipa_free_all_node_params ();
3159       free_dominance_info (CDI_DOMINATORS);
3160       free_dominance_info (CDI_POST_DOMINATORS);
3161     }
3162   if (dump_file)
3163     {
3164       fprintf (dump_file, "\n");
3165       ipa_dump_fn_summary (dump_file, node);
3166     }
3167 }
3168
3169
3170 /* Compute function summary.
3171    EARLY is true when we compute parameters during early opts.  */
3172
3173 void
3174 compute_fn_summary (struct cgraph_node *node, bool early)
3175 {
3176   HOST_WIDE_INT self_stack_size;
3177   struct cgraph_edge *e;
3178
3179   gcc_assert (!node->inlined_to);
3180
3181   if (!ipa_fn_summaries)
3182     ipa_fn_summary_alloc ();
3183
3184   /* Create a new ipa_fn_summary.  */
3185   ((ipa_fn_summary_t *)ipa_fn_summaries)->remove_callees (node);
3186   ipa_fn_summaries->remove (node);
3187   class ipa_fn_summary *info = ipa_fn_summaries->get_create (node);
3188   class ipa_size_summary *size_info = ipa_size_summaries->get_create (node);
3189
3190   /* Estimate the stack size for the function if we're optimizing.  */
3191   self_stack_size = optimize && !node->thunk
3192                     ? estimated_stack_frame_size (node) : 0;
3193   size_info->estimated_self_stack_size = self_stack_size;
3194   info->estimated_stack_size = self_stack_size;
3195
3196   if (node->thunk)
3197     {
3198       ipa_call_summary *es = ipa_call_summaries->get_create (node->callees);
3199       ipa_predicate t = true;
3200
3201       node->can_change_signature = false;
3202       es->call_stmt_size = eni_size_weights.call_cost;
3203       es->call_stmt_time = eni_time_weights.call_cost;
3204       info->account_size_time (ipa_fn_summary::size_scale
3205                                * opt_for_fn (node->decl,
3206                                  param_uninlined_function_thunk_insns),
3207                                opt_for_fn (node->decl,
3208                                  param_uninlined_function_thunk_time), t, t);
3209       t = ipa_predicate::not_inlined ();
3210       info->account_size_time (2 * ipa_fn_summary::size_scale, 0, t, t);
3211       ipa_update_overall_fn_summary (node);
3212       size_info->self_size = size_info->size;
3213       if (stdarg_p (TREE_TYPE (node->decl)))
3214         {
3215           info->inlinable = false;
3216           node->callees->inline_failed = CIF_VARIADIC_THUNK;
3217         }
3218       else
3219         info->inlinable = true;
3220     }
3221   else
3222     {
3223        /* Even is_gimple_min_invariant rely on current_function_decl.  */
3224        push_cfun (DECL_STRUCT_FUNCTION (node->decl));
3225
3226        /* During IPA profile merging we may be called w/o virtual SSA form
3227           built.  */
3228        update_ssa (TODO_update_ssa_only_virtuals);
3229
3230        /* Can this function be inlined at all?  */
3231        if (!opt_for_fn (node->decl, optimize)
3232            && !lookup_attribute ("always_inline",
3233                                  DECL_ATTRIBUTES (node->decl)))
3234          info->inlinable = false;
3235        else
3236          info->inlinable = tree_inlinable_function_p (node->decl);
3237
3238        bool no_signature = false;
3239        /* Type attributes can use parameter indices to describe them.
3240           Special case fn spec since we can safely preserve them in
3241           modref summaries.  */
3242        for (tree list = TYPE_ATTRIBUTES (TREE_TYPE (node->decl));
3243             list && !no_signature; list = TREE_CHAIN (list))
3244         if (!ipa_param_adjustments::type_attribute_allowed_p
3245                         (get_attribute_name (list)))
3246            {
3247              if (dump_file)
3248                 {
3249                   fprintf (dump_file, "No signature change:"
3250                            " function type has unhandled attribute %s.\n",
3251                            IDENTIFIER_POINTER (get_attribute_name (list)));
3252                 }
3253              no_signature = true;
3254            }
3255        for (tree parm = DECL_ARGUMENTS (node->decl);
3256             parm && !no_signature; parm = DECL_CHAIN (parm))
3257          if (variably_modified_type_p (TREE_TYPE (parm), node->decl))
3258            {
3259              if (dump_file)
3260                 {
3261                   fprintf (dump_file, "No signature change:"
3262                            " has parameter with variably modified type.\n");
3263                 }
3264              no_signature = true;
3265            }
3266
3267        /* Likewise for #pragma omp declare simd functions or functions
3268           with simd attribute.  */
3269        if (no_signature
3270            || lookup_attribute ("omp declare simd",
3271                                 DECL_ATTRIBUTES (node->decl)))
3272          node->can_change_signature = false;
3273        else
3274          {
3275            /* Otherwise, inlinable functions always can change signature.  */
3276            if (info->inlinable)
3277              node->can_change_signature = true;
3278            else
3279              {
3280                /* Functions calling builtin_apply cannot change signature.  */
3281                for (e = node->callees; e; e = e->next_callee)
3282                  {
3283                    tree cdecl = e->callee->decl;
3284                    if (fndecl_built_in_p (cdecl, BUILT_IN_APPLY_ARGS,
3285                                                  BUILT_IN_VA_START))
3286                      break;
3287                  }
3288                node->can_change_signature = !e;
3289              }
3290          }
3291        analyze_function_body (node, early);
3292        pop_cfun ();
3293      }
3294
3295   /* Inlining characteristics are maintained by the cgraph_mark_inline.  */
3296   size_info->size = size_info->self_size;
3297   info->estimated_stack_size = size_info->estimated_self_stack_size;
3298
3299   /* Code above should compute exactly the same result as
3300      ipa_update_overall_fn_summary except for case when speculative
3301      edges are present since these are accounted to size but not
3302      self_size. Do not compare time since different order the roundoff
3303      errors result in slight changes.  */
3304   ipa_update_overall_fn_summary (node);
3305   if (flag_checking)
3306     {
3307       for (e = node->indirect_calls; e; e = e->next_callee)
3308        if (e->speculative)
3309          break;
3310       gcc_assert (e || size_info->size == size_info->self_size);
3311     }
3312 }
3313
3314
3315 /* Compute parameters of functions used by inliner using
3316    current_function_decl.  */
3317
3318 static unsigned int
3319 compute_fn_summary_for_current (void)
3320 {
3321   compute_fn_summary (cgraph_node::get (current_function_decl), true);
3322   return 0;
3323 }
3324
3325 /* Estimate benefit devirtualizing indirect edge IE and return true if it can
3326    be devirtualized and inlined, provided m_known_vals, m_known_contexts and
3327    m_known_aggs in AVALS.  Return false straight away if AVALS is NULL.  */
3328
3329 static bool
3330 estimate_edge_devirt_benefit (struct cgraph_edge *ie,
3331                               int *size, int *time,
3332                               ipa_call_arg_values *avals)
3333 {
3334   tree target;
3335   struct cgraph_node *callee;
3336   class ipa_fn_summary *isummary;
3337   enum availability avail;
3338   bool speculative;
3339
3340   if (!avals
3341       || (!avals->m_known_vals.length() && !avals->m_known_contexts.length ()))
3342     return false;
3343   if (!opt_for_fn (ie->caller->decl, flag_indirect_inlining))
3344     return false;
3345
3346   target = ipa_get_indirect_edge_target (ie, avals, &speculative);
3347   if (!target || speculative)
3348     return false;
3349
3350   /* Account for difference in cost between indirect and direct calls.  */
3351   *size -= (eni_size_weights.indirect_call_cost - eni_size_weights.call_cost);
3352   *time -= (eni_time_weights.indirect_call_cost - eni_time_weights.call_cost);
3353   gcc_checking_assert (*time >= 0);
3354   gcc_checking_assert (*size >= 0);
3355
3356   callee = cgraph_node::get (target);
3357   if (!callee || !callee->definition)
3358     return false;
3359   callee = callee->function_symbol (&avail);
3360   if (avail < AVAIL_AVAILABLE)
3361     return false;
3362   isummary = ipa_fn_summaries->get (callee);
3363   if (isummary == NULL)
3364     return false;
3365
3366   return isummary->inlinable;
3367 }
3368
3369 /* Increase SIZE, MIN_SIZE (if non-NULL) and TIME for size and time needed to
3370    handle edge E with probability PROB.  Set HINTS accordingly if edge may be
3371    devirtualized.  AVALS, if non-NULL, describes the context of the call site
3372    as far as values of parameters are concerened.  */
3373
3374 static inline void
3375 estimate_edge_size_and_time (struct cgraph_edge *e, int *size, int *min_size,
3376                              sreal *time, ipa_call_arg_values *avals,
3377                              ipa_hints *hints)
3378 {
3379   class ipa_call_summary *es = ipa_call_summaries->get (e);
3380   int call_size = es->call_stmt_size;
3381   int call_time = es->call_stmt_time;
3382   int cur_size;
3383
3384   if (!e->callee && hints && e->maybe_hot_p ()
3385       && estimate_edge_devirt_benefit (e, &call_size, &call_time, avals))
3386     *hints |= INLINE_HINT_indirect_call;
3387   cur_size = call_size * ipa_fn_summary::size_scale;
3388   *size += cur_size;
3389   if (min_size)
3390     *min_size += cur_size;
3391   if (time)
3392     *time += ((sreal)call_time) * e->sreal_frequency ();
3393 }
3394
3395
3396 /* Increase SIZE, MIN_SIZE and TIME for size and time needed to handle all
3397    calls in NODE.  POSSIBLE_TRUTHS and AVALS describe the context of the call
3398    site.
3399
3400    Helper for estimate_calls_size_and_time which does the same but
3401    (in most cases) faster.  */
3402
3403 static void
3404 estimate_calls_size_and_time_1 (struct cgraph_node *node, int *size,
3405                                 int *min_size, sreal *time,
3406                                 ipa_hints *hints,
3407                                 clause_t possible_truths,
3408                                 ipa_call_arg_values *avals)
3409 {
3410   struct cgraph_edge *e;
3411   for (e = node->callees; e; e = e->next_callee)
3412     {
3413       if (!e->inline_failed)
3414         {
3415           gcc_checking_assert (!ipa_call_summaries->get (e));
3416           estimate_calls_size_and_time_1 (e->callee, size, min_size, time,
3417                                           hints, possible_truths, avals);
3418
3419           continue;
3420         }
3421       class ipa_call_summary *es = ipa_call_summaries->get (e);
3422
3423       /* Do not care about zero sized builtins.  */
3424       if (!es->call_stmt_size)
3425         {
3426           gcc_checking_assert (!es->call_stmt_time);
3427           continue;
3428         }
3429       if (!es->predicate
3430           || es->predicate->evaluate (possible_truths))
3431         {
3432           /* Predicates of calls shall not use NOT_CHANGED codes,
3433              so we do not need to compute probabilities.  */
3434           estimate_edge_size_and_time (e, size,
3435                                        es->predicate ? NULL : min_size,
3436                                        time, avals, hints);
3437         }
3438     }
3439   for (e = node->indirect_calls; e; e = e->next_callee)
3440     {
3441       class ipa_call_summary *es = ipa_call_summaries->get (e);
3442       if (!es->predicate
3443           || es->predicate->evaluate (possible_truths))
3444         estimate_edge_size_and_time (e, size,
3445                                      es->predicate ? NULL : min_size,
3446                                      time, avals, hints);
3447     }
3448 }
3449
3450 /* Populate sum->call_size_time_table for edges from NODE.  */
3451
3452 static void
3453 summarize_calls_size_and_time (struct cgraph_node *node,
3454                                ipa_fn_summary *sum)
3455 {
3456   struct cgraph_edge *e;
3457   for (e = node->callees; e; e = e->next_callee)
3458     {
3459       if (!e->inline_failed)
3460         {
3461           gcc_checking_assert (!ipa_call_summaries->get (e));
3462           summarize_calls_size_and_time (e->callee, sum);
3463           continue;
3464         }
3465       int size = 0;
3466       sreal time = 0;
3467
3468       estimate_edge_size_and_time (e, &size, NULL, &time, NULL, NULL);
3469
3470       ipa_predicate pred = true;
3471       class ipa_call_summary *es = ipa_call_summaries->get (e);
3472
3473       if (es->predicate)
3474         pred = *es->predicate;
3475       sum->account_size_time (size, time, pred, pred, true);
3476     }
3477   for (e = node->indirect_calls; e; e = e->next_callee)
3478     {
3479       int size = 0;
3480       sreal time = 0;
3481
3482       estimate_edge_size_and_time (e, &size, NULL, &time, NULL, NULL);
3483       ipa_predicate pred = true;
3484       class ipa_call_summary *es = ipa_call_summaries->get (e);
3485
3486       if (es->predicate)
3487         pred = *es->predicate;
3488       sum->account_size_time (size, time, pred, pred, true);
3489     }
3490 }
3491
3492 /* Increase SIZE, MIN_SIZE and TIME for size and time needed to handle all
3493    calls in NODE.  POSSIBLE_TRUTHS and AVALS (the latter if non-NULL) describe
3494    context of the call site.  */
3495
3496 static void
3497 estimate_calls_size_and_time (struct cgraph_node *node, int *size,
3498                               int *min_size, sreal *time,
3499                               ipa_hints *hints,
3500                               clause_t possible_truths,
3501                               ipa_call_arg_values *avals)
3502 {
3503   class ipa_fn_summary *sum = ipa_fn_summaries->get (node);
3504   bool use_table = true;
3505
3506   gcc_assert (node->callees || node->indirect_calls);
3507
3508   /* During early inlining we do not calculate info for very
3509      large functions and thus there is no need for producing
3510      summaries.  */
3511   if (!ipa_node_params_sum)
3512     use_table = false;
3513   /* Do not calculate summaries for simple wrappers; it is waste
3514      of memory.  */
3515   else if (node->callees && node->indirect_calls
3516            && node->callees->inline_failed && !node->callees->next_callee)
3517     use_table = false;
3518   /* If there is an indirect edge that may be optimized, we need
3519      to go the slow way.  */
3520   else if (avals && hints
3521            && (avals->m_known_vals.length ()
3522                || avals->m_known_contexts.length ()
3523                || avals->m_known_aggs.length ()))
3524     {
3525       ipa_node_params *params_summary = ipa_node_params_sum->get (node);
3526       unsigned int nargs = params_summary
3527                            ? ipa_get_param_count (params_summary) : 0;
3528
3529       for (unsigned int i = 0; i < nargs && use_table; i++)
3530         {
3531           if (ipa_is_param_used_by_indirect_call (params_summary, i)
3532               && (avals->safe_sval_at (i)
3533                   || (ipa_argagg_value_list (avals).value_for_index_p (i))))
3534             use_table = false;
3535           else if (ipa_is_param_used_by_polymorphic_call (params_summary, i)
3536                    && (avals->m_known_contexts.length () > i
3537                        && !avals->m_known_contexts[i].useless_p ()))
3538             use_table = false;
3539         }
3540     }
3541
3542   /* Fast path is via the call size time table.  */
3543   if (use_table)
3544     {
3545       /* Build summary if it is absent.  */
3546       if (!sum->call_size_time_table.length ())
3547         {
3548           ipa_predicate true_pred = true;
3549           sum->account_size_time (0, 0, true_pred, true_pred, true);
3550           summarize_calls_size_and_time (node, sum);
3551         }
3552
3553       int old_size = *size;
3554       sreal old_time = time ? *time : 0;
3555
3556       if (min_size)
3557         *min_size += sum->call_size_time_table[0].size;
3558
3559       unsigned int i;
3560       size_time_entry *e;
3561
3562       /* Walk the table and account sizes and times.  */
3563       for (i = 0; sum->call_size_time_table.iterate (i, &e);
3564            i++)
3565         if (e->exec_predicate.evaluate (possible_truths))
3566           {
3567             *size += e->size;
3568             if (time)
3569               *time += e->time;
3570           }
3571
3572       /* Be careful and see if both methods agree.  */
3573       if ((flag_checking || dump_file)
3574           /* Do not try to sanity check when we know we lost some
3575              precision.  */
3576           && sum->call_size_time_table.length ()
3577              < ipa_fn_summary::max_size_time_table_size)
3578         {
3579           estimate_calls_size_and_time_1 (node, &old_size, NULL, &old_time, NULL,
3580                                           possible_truths, avals);
3581           gcc_assert (*size == old_size);
3582           if (time && (*time - old_time > 1 || *time - old_time < -1)
3583               && dump_file)
3584             fprintf (dump_file, "Time mismatch in call summary %f!=%f\n",
3585                      old_time.to_double (),
3586                      time->to_double ());
3587         }
3588     }
3589   /* Slow path by walking all edges.  */
3590   else
3591     estimate_calls_size_and_time_1 (node, size, min_size, time, hints,
3592                                     possible_truths, avals);
3593 }
3594
3595 /* Main constructor for ipa call context.  Memory allocation of ARG_VALUES
3596    is owned by the caller.  INLINE_PARAM_SUMMARY is also owned by the
3597    caller.  */
3598
3599 ipa_call_context::ipa_call_context (cgraph_node *node, clause_t possible_truths,
3600                                     clause_t nonspec_possible_truths,
3601                                     vec<inline_param_summary>
3602                                       inline_param_summary,
3603                                     ipa_auto_call_arg_values *arg_values)
3604 : m_node (node), m_possible_truths (possible_truths),
3605   m_nonspec_possible_truths (nonspec_possible_truths),
3606   m_inline_param_summary (inline_param_summary),
3607   m_avals (arg_values)
3608 {
3609 }
3610
3611 /* Set THIS to be a duplicate of CTX.  Copy all relevant info.  */
3612
3613 void
3614 ipa_cached_call_context::duplicate_from (const ipa_call_context &ctx)
3615 {
3616   m_node = ctx.m_node;
3617   m_possible_truths = ctx.m_possible_truths;
3618   m_nonspec_possible_truths = ctx.m_nonspec_possible_truths;
3619   ipa_node_params *params_summary = ipa_node_params_sum->get (m_node);
3620   unsigned int nargs = params_summary
3621                        ? ipa_get_param_count (params_summary) : 0;
3622
3623   m_inline_param_summary = vNULL;
3624   /* Copy the info only if there is at least one useful entry.  */
3625   if (ctx.m_inline_param_summary.exists ())
3626     {
3627       unsigned int n = MIN (ctx.m_inline_param_summary.length (), nargs);
3628
3629       for (unsigned int i = 0; i < n; i++)
3630         if (ipa_is_param_used_by_ipa_predicates (params_summary, i)
3631             && !ctx.m_inline_param_summary[i].useless_p ())
3632           {
3633             m_inline_param_summary
3634                     = ctx.m_inline_param_summary.copy ();
3635             break;
3636           }
3637     }
3638   m_avals.m_known_vals = vNULL;
3639   if (ctx.m_avals.m_known_vals.exists ())
3640     {
3641       unsigned int n = MIN (ctx.m_avals.m_known_vals.length (), nargs);
3642
3643       for (unsigned int i = 0; i < n; i++)
3644         if (ipa_is_param_used_by_indirect_call (params_summary, i)
3645             && ctx.m_avals.m_known_vals[i])
3646           {
3647             m_avals.m_known_vals = ctx.m_avals.m_known_vals.copy ();
3648             break;
3649           }
3650     }
3651
3652   m_avals.m_known_contexts = vNULL;
3653   if (ctx.m_avals.m_known_contexts.exists ())
3654     {
3655       unsigned int n = MIN (ctx.m_avals.m_known_contexts.length (), nargs);
3656
3657       for (unsigned int i = 0; i < n; i++)
3658         if (ipa_is_param_used_by_polymorphic_call (params_summary, i)
3659             && !ctx.m_avals.m_known_contexts[i].useless_p ())
3660           {
3661             m_avals.m_known_contexts = ctx.m_avals.m_known_contexts.copy ();
3662             break;
3663           }
3664     }
3665
3666   m_avals.m_known_aggs = vNULL;
3667   if (ctx.m_avals.m_known_aggs.exists ())
3668     {
3669       const ipa_argagg_value_list avl (&ctx.m_avals);
3670       for (unsigned int i = 0; i < nargs; i++)
3671         if (ipa_is_param_used_by_indirect_call (params_summary, i)
3672             && avl.value_for_index_p (i))
3673           {
3674             m_avals.m_known_aggs = ctx.m_avals.m_known_aggs.copy ();
3675             break;
3676           }
3677     }
3678
3679   m_avals.m_known_value_ranges = vNULL;
3680 }
3681
3682 /* Release memory used by known_vals/contexts/aggs vectors.  and
3683    inline_param_summary.  */
3684
3685 void
3686 ipa_cached_call_context::release ()
3687 {
3688   /* See if context is initialized at first place.  */
3689   if (!m_node)
3690     return;
3691   m_avals.m_known_aggs.release ();
3692   m_avals.m_known_vals.release ();
3693   m_avals.m_known_contexts.release ();
3694   m_inline_param_summary.release ();
3695 }
3696
3697 /* Return true if CTX describes the same call context as THIS.  */
3698
3699 bool
3700 ipa_call_context::equal_to (const ipa_call_context &ctx)
3701 {
3702   if (m_node != ctx.m_node
3703       || m_possible_truths != ctx.m_possible_truths
3704       || m_nonspec_possible_truths != ctx.m_nonspec_possible_truths)
3705     return false;
3706
3707   ipa_node_params *params_summary = ipa_node_params_sum->get (m_node);
3708   unsigned int nargs = params_summary
3709                        ? ipa_get_param_count (params_summary) : 0;
3710
3711   if (m_inline_param_summary.exists () || ctx.m_inline_param_summary.exists ())
3712     {
3713       for (unsigned int i = 0; i < nargs; i++)
3714         {
3715           if (!ipa_is_param_used_by_ipa_predicates (params_summary, i))
3716             continue;
3717           if (i >= m_inline_param_summary.length ()
3718               || m_inline_param_summary[i].useless_p ())
3719             {
3720               if (i < ctx.m_inline_param_summary.length ()
3721                   && !ctx.m_inline_param_summary[i].useless_p ())
3722                 return false;
3723               continue;
3724             }
3725           if (i >= ctx.m_inline_param_summary.length ()
3726               || ctx.m_inline_param_summary[i].useless_p ())
3727             {
3728               if (i < m_inline_param_summary.length ()
3729                   && !m_inline_param_summary[i].useless_p ())
3730                 return false;
3731               continue;
3732             }
3733           if (!m_inline_param_summary[i].equal_to
3734                  (ctx.m_inline_param_summary[i]))
3735             return false;
3736         }
3737     }
3738   if (m_avals.m_known_vals.exists () || ctx.m_avals.m_known_vals.exists ())
3739     {
3740       for (unsigned int i = 0; i < nargs; i++)
3741         {
3742           if (!ipa_is_param_used_by_indirect_call (params_summary, i))
3743             continue;
3744           if (i >= m_avals.m_known_vals.length () || !m_avals.m_known_vals[i])
3745             {
3746               if (i < ctx.m_avals.m_known_vals.length ()
3747                   && ctx.m_avals.m_known_vals[i])
3748                 return false;
3749               continue;
3750             }
3751           if (i >= ctx.m_avals.m_known_vals.length ()
3752               || !ctx.m_avals.m_known_vals[i])
3753             {
3754               if (i < m_avals.m_known_vals.length () && m_avals.m_known_vals[i])
3755                 return false;
3756               continue;
3757             }
3758           if (m_avals.m_known_vals[i] != ctx.m_avals.m_known_vals[i])
3759             return false;
3760         }
3761     }
3762   if (m_avals.m_known_contexts.exists ()
3763       || ctx.m_avals.m_known_contexts.exists ())
3764     {
3765       for (unsigned int i = 0; i < nargs; i++)
3766         {
3767           if (!ipa_is_param_used_by_polymorphic_call (params_summary, i))
3768             continue;
3769           if (i >= m_avals.m_known_contexts.length ()
3770               || m_avals.m_known_contexts[i].useless_p ())
3771             {
3772               if (i < ctx.m_avals.m_known_contexts.length ()
3773                   && !ctx.m_avals.m_known_contexts[i].useless_p ())
3774                 return false;
3775               continue;
3776             }
3777           if (i >= ctx.m_avals.m_known_contexts.length ()
3778               || ctx.m_avals.m_known_contexts[i].useless_p ())
3779             {
3780               if (i < m_avals.m_known_contexts.length ()
3781                   && !m_avals.m_known_contexts[i].useless_p ())
3782                 return false;
3783               continue;
3784             }
3785           if (!m_avals.m_known_contexts[i].equal_to
3786                  (ctx.m_avals.m_known_contexts[i]))
3787             return false;
3788         }
3789     }
3790   if (m_avals.m_known_aggs.exists () || ctx.m_avals.m_known_aggs.exists ())
3791     {
3792       unsigned i = 0, j = 0;
3793       while (i < m_avals.m_known_aggs.length ()
3794              || j < ctx.m_avals.m_known_aggs.length ())
3795         {
3796           if (i >= m_avals.m_known_aggs.length ())
3797             {
3798               int idx2 = ctx.m_avals.m_known_aggs[j].index;
3799               if (ipa_is_param_used_by_indirect_call (params_summary, idx2))
3800                 return false;
3801               j++;
3802               continue;
3803             }
3804           if (j >= ctx.m_avals.m_known_aggs.length ())
3805             {
3806               int idx1 = m_avals.m_known_aggs[i].index;
3807               if (ipa_is_param_used_by_indirect_call (params_summary, idx1))
3808                 return false;
3809               i++;
3810               continue;
3811             }
3812
3813           int idx1 = m_avals.m_known_aggs[i].index;
3814           int idx2 = ctx.m_avals.m_known_aggs[j].index;
3815           if (idx1 < idx2)
3816             {
3817               if (ipa_is_param_used_by_indirect_call (params_summary, idx1))
3818                 return false;
3819               i++;
3820               continue;
3821             }
3822           if (idx1 > idx2)
3823             {
3824               if (ipa_is_param_used_by_indirect_call (params_summary, idx2))
3825                 return false;
3826               j++;
3827               continue;
3828             }
3829           if (!ipa_is_param_used_by_indirect_call (params_summary, idx1))
3830             {
3831               i++;
3832               j++;
3833               continue;
3834             }
3835
3836           if ((m_avals.m_known_aggs[i].unit_offset
3837                != ctx.m_avals.m_known_aggs[j].unit_offset)
3838               || (m_avals.m_known_aggs[i].by_ref
3839                != ctx.m_avals.m_known_aggs[j].by_ref)
3840               || !operand_equal_p (m_avals.m_known_aggs[i].value,
3841                                    ctx.m_avals.m_known_aggs[j].value))
3842             return false;
3843           i++;
3844           j++;
3845         }
3846     }
3847   return true;
3848 }
3849
3850 /* Fill in the selected fields in ESTIMATES with value estimated for call in
3851    this context.  Always compute size and min_size.  Only compute time and
3852    nonspecialized_time if EST_TIMES is true.  Only compute hints if EST_HINTS
3853    is true.  */
3854
3855 void
3856 ipa_call_context::estimate_size_and_time (ipa_call_estimates *estimates,
3857                                           bool est_times, bool est_hints)
3858 {
3859   class ipa_fn_summary *info = ipa_fn_summaries->get (m_node);
3860   size_time_entry *e;
3861   int size = 0;
3862   sreal time = 0;
3863   int min_size = 0;
3864   ipa_hints hints = 0;
3865   sreal loops_with_known_iterations = 0;
3866   sreal loops_with_known_strides = 0;
3867   int i;
3868
3869   if (dump_file && (dump_flags & TDF_DETAILS))
3870     {
3871       bool found = false;
3872       fprintf (dump_file, "   Estimating body: %s\n"
3873                "   Known to be false: ", m_node->dump_name ());
3874
3875       for (i = ipa_predicate::not_inlined_condition;
3876            i < (ipa_predicate::first_dynamic_condition
3877                 + (int) vec_safe_length (info->conds)); i++)
3878         if (!(m_possible_truths & (1 << i)))
3879           {
3880             if (found)
3881               fprintf (dump_file, ", ");
3882             found = true;
3883             dump_condition (dump_file, info->conds, i);
3884           }
3885     }
3886
3887   if (m_node->callees || m_node->indirect_calls)
3888     estimate_calls_size_and_time (m_node, &size, &min_size,
3889                                   est_times ? &time : NULL,
3890                                   est_hints ? &hints : NULL, m_possible_truths,
3891                                   &m_avals);
3892
3893   sreal nonspecialized_time = time;
3894
3895   min_size += info->size_time_table[0].size;
3896   for (i = 0; info->size_time_table.iterate (i, &e); i++)
3897     {
3898       bool exec = e->exec_predicate.evaluate (m_nonspec_possible_truths);
3899
3900       /* Because predicates are conservative, it can happen that nonconst is 1
3901          but exec is 0.  */
3902       if (exec)
3903         {
3904           bool nonconst = e->nonconst_predicate.evaluate (m_possible_truths);
3905
3906           gcc_checking_assert (e->time >= 0);
3907           gcc_checking_assert (time >= 0);
3908
3909           /* We compute specialized size only because size of nonspecialized
3910              copy is context independent.
3911
3912              The difference between nonspecialized execution and specialized is
3913              that nonspecialized is not going to have optimized out computations
3914              known to be constant in a specialized setting.  */
3915           if (nonconst)
3916             size += e->size;
3917           if (!est_times)
3918             continue;
3919           nonspecialized_time += e->time;
3920           if (!nonconst)
3921             ;
3922           else if (!m_inline_param_summary.exists ())
3923             {
3924               if (nonconst)
3925                 time += e->time;
3926             }
3927           else
3928             {
3929               int prob = e->nonconst_predicate.probability
3930                                                (info->conds, m_possible_truths,
3931                                                 m_inline_param_summary);
3932               gcc_checking_assert (prob >= 0);
3933               gcc_checking_assert (prob <= REG_BR_PROB_BASE);
3934               if (prob == REG_BR_PROB_BASE)
3935                 time += e->time;
3936               else
3937                 time += e->time * prob / REG_BR_PROB_BASE;
3938             }
3939           gcc_checking_assert (time >= 0);
3940         }
3941      }
3942   gcc_checking_assert (info->size_time_table[0].exec_predicate == true);
3943   gcc_checking_assert (info->size_time_table[0].nonconst_predicate == true);
3944   gcc_checking_assert (min_size >= 0);
3945   gcc_checking_assert (size >= 0);
3946   gcc_checking_assert (time >= 0);
3947   /* nonspecialized_time should be always bigger than specialized time.
3948      Roundoff issues however may get into the way.  */
3949   gcc_checking_assert ((nonspecialized_time - time * 99 / 100) >= -1);
3950
3951   /* Roundoff issues may make specialized time bigger than nonspecialized
3952      time.  We do not really want that to happen because some heuristics
3953      may get confused by seeing negative speedups.  */
3954   if (time > nonspecialized_time)
3955     time = nonspecialized_time;
3956
3957   if (est_hints)
3958     {
3959       if (info->scc_no)
3960         hints |= INLINE_HINT_in_scc;
3961       if (DECL_DECLARED_INLINE_P (m_node->decl))
3962         hints |= INLINE_HINT_declared_inline;
3963       if (info->builtin_constant_p_parms.length ()
3964           && DECL_DECLARED_INLINE_P (m_node->decl))
3965         hints |= INLINE_HINT_builtin_constant_p;
3966
3967       ipa_freqcounting_predicate *fcp;
3968       for (i = 0; vec_safe_iterate (info->loop_iterations, i, &fcp); i++)
3969         if (!fcp->predicate->evaluate (m_possible_truths))
3970           {
3971             hints |= INLINE_HINT_loop_iterations;
3972             loops_with_known_iterations += fcp->freq;
3973           }
3974       estimates->loops_with_known_iterations = loops_with_known_iterations;
3975
3976       for (i = 0; vec_safe_iterate (info->loop_strides, i, &fcp); i++)
3977         if (!fcp->predicate->evaluate (m_possible_truths))
3978           {
3979             hints |= INLINE_HINT_loop_stride;
3980             loops_with_known_strides += fcp->freq;
3981           }
3982       estimates->loops_with_known_strides = loops_with_known_strides;
3983     }
3984
3985   size = RDIV (size, ipa_fn_summary::size_scale);
3986   min_size = RDIV (min_size, ipa_fn_summary::size_scale);
3987
3988   if (dump_file && (dump_flags & TDF_DETAILS))
3989     {
3990       fprintf (dump_file, "\n   size:%i", (int) size);
3991       if (est_times)
3992         fprintf (dump_file, " time:%f nonspec time:%f",
3993                  time.to_double (), nonspecialized_time.to_double ());
3994       if (est_hints)
3995         fprintf (dump_file, " loops with known iterations:%f "
3996                  "known strides:%f", loops_with_known_iterations.to_double (),
3997                  loops_with_known_strides.to_double ());
3998       fprintf (dump_file, "\n");
3999     }
4000   if (est_times)
4001     {
4002       estimates->time = time;
4003       estimates->nonspecialized_time = nonspecialized_time;
4004     }
4005   estimates->size = size;
4006   estimates->min_size = min_size;
4007   if (est_hints)
4008     estimates->hints = hints;
4009   return;
4010 }
4011
4012
4013 /* Estimate size and time needed to execute callee of EDGE assuming that
4014    parameters known to be constant at caller of EDGE are propagated.
4015    KNOWN_VALS and KNOWN_CONTEXTS are vectors of assumed known constant values
4016    and types for parameters.  */
4017
4018 void
4019 estimate_ipcp_clone_size_and_time (struct cgraph_node *node,
4020                                    ipa_auto_call_arg_values *avals,
4021                                    ipa_call_estimates *estimates)
4022 {
4023   clause_t clause, nonspec_clause;
4024
4025   evaluate_conditions_for_known_args (node, false, avals, &clause,
4026                                       &nonspec_clause, NULL);
4027   ipa_call_context ctx (node, clause, nonspec_clause, vNULL, avals);
4028   ctx.estimate_size_and_time (estimates);
4029 }
4030
4031 /* Return stack frame offset where frame of NODE is supposed to start inside
4032    of the function it is inlined to.
4033    Return 0 for functions that are not inlined.  */
4034
4035 HOST_WIDE_INT
4036 ipa_get_stack_frame_offset (struct cgraph_node *node)
4037 {
4038   HOST_WIDE_INT offset = 0;
4039   if (!node->inlined_to)
4040     return 0;
4041   node = node->callers->caller;
4042   while (true)
4043     {
4044       offset += ipa_size_summaries->get (node)->estimated_self_stack_size;
4045       if (!node->inlined_to)
4046         return offset;
4047       node = node->callers->caller;
4048     }
4049 }
4050
4051
4052 /* Update summary information of inline clones after inlining.
4053    Compute peak stack usage.  */
4054
4055 static void
4056 inline_update_callee_summaries (struct cgraph_node *node, int depth)
4057 {
4058   struct cgraph_edge *e;
4059
4060   ipa_propagate_frequency (node);
4061   for (e = node->callees; e; e = e->next_callee)
4062     {
4063       if (!e->inline_failed)
4064         inline_update_callee_summaries (e->callee, depth);
4065       else
4066         ipa_call_summaries->get (e)->loop_depth += depth;
4067     }
4068   for (e = node->indirect_calls; e; e = e->next_callee)
4069     ipa_call_summaries->get (e)->loop_depth += depth;
4070 }
4071
4072 /* Update change_prob and points_to_local_or_readonly_memory of EDGE after
4073    INLINED_EDGE has been inlined.
4074
4075    When function A is inlined in B and A calls C with parameter that
4076    changes with probability PROB1 and C is known to be passthrough
4077    of argument if B that change with probability PROB2, the probability
4078    of change is now PROB1*PROB2.  */
4079
4080 static void
4081 remap_edge_params (struct cgraph_edge *inlined_edge,
4082                    struct cgraph_edge *edge)
4083 {
4084   if (ipa_node_params_sum)
4085     {
4086       int i;
4087       ipa_edge_args *args = ipa_edge_args_sum->get (edge);
4088       if (!args)
4089         return;
4090       class ipa_call_summary *es = ipa_call_summaries->get (edge);
4091       class ipa_call_summary *inlined_es
4092         = ipa_call_summaries->get (inlined_edge);
4093
4094       if (es->param.length () == 0)
4095         return;
4096
4097       for (i = 0; i < ipa_get_cs_argument_count (args); i++)
4098         {
4099           struct ipa_jump_func *jfunc = ipa_get_ith_jump_func (args, i);
4100           if (jfunc->type == IPA_JF_PASS_THROUGH
4101               || jfunc->type == IPA_JF_ANCESTOR)
4102             {
4103               int id = jfunc->type == IPA_JF_PASS_THROUGH
4104                        ? ipa_get_jf_pass_through_formal_id (jfunc)
4105                        : ipa_get_jf_ancestor_formal_id (jfunc);
4106               if (id < (int) inlined_es->param.length ())
4107                 {
4108                   int prob1 = es->param[i].change_prob;
4109                   int prob2 = inlined_es->param[id].change_prob;
4110                   int prob = combine_probabilities (prob1, prob2);
4111
4112                   if (prob1 && prob2 && !prob)
4113                     prob = 1;
4114
4115                   es->param[i].change_prob = prob;
4116
4117                   if (inlined_es
4118                         ->param[id].points_to_local_or_readonly_memory)
4119                     es->param[i].points_to_local_or_readonly_memory = true;
4120                   if (inlined_es
4121                         ->param[id].points_to_possible_sra_candidate)
4122                     es->param[i].points_to_possible_sra_candidate = true;
4123                 }
4124               if (!es->param[i].points_to_local_or_readonly_memory
4125                   && jfunc->type == IPA_JF_CONST
4126                   && points_to_local_or_readonly_memory_p
4127                          (ipa_get_jf_constant (jfunc)))
4128                 es->param[i].points_to_local_or_readonly_memory = true;
4129             }
4130         }
4131     }
4132 }
4133
4134 /* Update edge summaries of NODE after INLINED_EDGE has been inlined.
4135
4136    Remap predicates of callees of NODE.  Rest of arguments match
4137    remap_predicate.
4138
4139    Also update change probabilities.  */
4140
4141 static void
4142 remap_edge_summaries (struct cgraph_edge *inlined_edge,
4143                       struct cgraph_node *node,
4144                       class ipa_fn_summary *info,
4145                       class ipa_node_params *params_summary,
4146                       class ipa_fn_summary *callee_info,
4147                       const vec<int> &operand_map,
4148                       const vec<HOST_WIDE_INT> &offset_map,
4149                       clause_t possible_truths,
4150                       ipa_predicate *toplev_predicate)
4151 {
4152   struct cgraph_edge *e, *next;
4153   for (e = node->callees; e; e = next)
4154     {
4155       ipa_predicate p;
4156       next = e->next_callee;
4157
4158       if (e->inline_failed)
4159         {
4160           class ipa_call_summary *es = ipa_call_summaries->get (e);
4161           remap_edge_params (inlined_edge, e);
4162
4163           if (es->predicate)
4164             {
4165               p = es->predicate->remap_after_inlining
4166                                      (info, params_summary,
4167                                       callee_info, operand_map,
4168                                       offset_map, possible_truths,
4169                                       *toplev_predicate);
4170               edge_set_predicate (e, &p);
4171             }
4172           else
4173             edge_set_predicate (e, toplev_predicate);
4174         }
4175       else
4176         remap_edge_summaries (inlined_edge, e->callee, info,
4177                               params_summary, callee_info,
4178                               operand_map, offset_map, possible_truths,
4179                               toplev_predicate);
4180     }
4181   for (e = node->indirect_calls; e; e = next)
4182     {
4183       class ipa_call_summary *es = ipa_call_summaries->get (e);
4184       ipa_predicate p;
4185       next = e->next_callee;
4186
4187       remap_edge_params (inlined_edge, e);
4188       if (es->predicate)
4189         {
4190           p = es->predicate->remap_after_inlining
4191                                  (info, params_summary,
4192                                   callee_info, operand_map, offset_map,
4193                                   possible_truths, *toplev_predicate);
4194           edge_set_predicate (e, &p);
4195         }
4196       else
4197         edge_set_predicate (e, toplev_predicate);
4198     }
4199 }
4200
4201 /* Run remap_after_inlining on each predicate in V.  */
4202
4203 static void
4204 remap_freqcounting_predicate (class ipa_fn_summary *info,
4205                               class ipa_node_params *params_summary,
4206                               class ipa_fn_summary *callee_info,
4207                               vec<ipa_freqcounting_predicate, va_gc> *v,
4208                               const vec<int> &operand_map,
4209                               const vec<HOST_WIDE_INT> &offset_map,
4210                               clause_t possible_truths,
4211                               ipa_predicate *toplev_predicate)
4212
4213 {
4214   ipa_freqcounting_predicate *fcp;
4215   for (int i = 0; vec_safe_iterate (v, i, &fcp); i++)
4216     {
4217       ipa_predicate p
4218         = fcp->predicate->remap_after_inlining (info, params_summary,
4219                                                 callee_info, operand_map,
4220                                                 offset_map, possible_truths,
4221                                                 *toplev_predicate);
4222       if (p != false && p != true)
4223         *fcp->predicate &= p;
4224     }
4225 }
4226
4227 /* We inlined EDGE.  Update summary of the function we inlined into.  */
4228
4229 void
4230 ipa_merge_fn_summary_after_inlining (struct cgraph_edge *edge)
4231 {
4232   ipa_fn_summary *callee_info = ipa_fn_summaries->get (edge->callee);
4233   struct cgraph_node *to = (edge->caller->inlined_to
4234                             ? edge->caller->inlined_to : edge->caller);
4235   class ipa_fn_summary *info = ipa_fn_summaries->get (to);
4236   clause_t clause = 0;  /* not_inline is known to be false.  */
4237   size_time_entry *e;
4238   auto_vec<int, 8> operand_map;
4239   auto_vec<HOST_WIDE_INT, 8> offset_map;
4240   int i;
4241   ipa_predicate toplev_predicate;
4242   class ipa_call_summary *es = ipa_call_summaries->get (edge);
4243   ipa_node_params *params_summary = (ipa_node_params_sum
4244                                      ? ipa_node_params_sum->get (to) : NULL);
4245
4246   if (es->predicate)
4247     toplev_predicate = *es->predicate;
4248   else
4249     toplev_predicate = true;
4250
4251   info->fp_expressions |= callee_info->fp_expressions;
4252   info->target_info |= callee_info->target_info;
4253
4254   if (callee_info->conds)
4255     {
4256       ipa_auto_call_arg_values avals;
4257       evaluate_properties_for_edge (edge, true, &clause, NULL, &avals, false);
4258     }
4259   if (ipa_node_params_sum && callee_info->conds)
4260     {
4261       ipa_edge_args *args = ipa_edge_args_sum->get (edge);
4262       int count = args ? ipa_get_cs_argument_count (args) : 0;
4263       int i;
4264
4265       if (count)
4266         {
4267           operand_map.safe_grow_cleared (count, true);
4268           offset_map.safe_grow_cleared (count, true);
4269         }
4270       for (i = 0; i < count; i++)
4271         {
4272           struct ipa_jump_func *jfunc = ipa_get_ith_jump_func (args, i);
4273           int map = -1;
4274
4275           /* TODO: handle non-NOPs when merging.  */
4276           if (jfunc->type == IPA_JF_PASS_THROUGH)
4277             {
4278               if (ipa_get_jf_pass_through_operation (jfunc) == NOP_EXPR)
4279                 map = ipa_get_jf_pass_through_formal_id (jfunc);
4280               if (!ipa_get_jf_pass_through_agg_preserved (jfunc))
4281                 offset_map[i] = -1;
4282             }
4283           else if (jfunc->type == IPA_JF_ANCESTOR)
4284             {
4285               HOST_WIDE_INT offset = ipa_get_jf_ancestor_offset (jfunc);
4286               if (offset >= 0 && offset < INT_MAX)
4287                 {
4288                   map = ipa_get_jf_ancestor_formal_id (jfunc);
4289                   if (!ipa_get_jf_ancestor_agg_preserved (jfunc))
4290                     offset = -1;
4291                   offset_map[i] = offset;
4292                 }
4293             }
4294           operand_map[i] = map;
4295           gcc_assert (map < ipa_get_param_count (params_summary));
4296         }
4297
4298       int ip;
4299       for (i = 0; callee_info->builtin_constant_p_parms.iterate (i, &ip); i++)
4300         if (ip < count && operand_map[ip] >= 0)
4301           add_builtin_constant_p_parm (info, operand_map[ip]);
4302     }
4303   sreal freq = edge->sreal_frequency ();
4304   for (i = 0; callee_info->size_time_table.iterate (i, &e); i++)
4305     {
4306       ipa_predicate p;
4307       p = e->exec_predicate.remap_after_inlining
4308                              (info, params_summary,
4309                               callee_info, operand_map,
4310                               offset_map, clause,
4311                               toplev_predicate);
4312       ipa_predicate nonconstp;
4313       nonconstp = e->nonconst_predicate.remap_after_inlining
4314                                      (info, params_summary,
4315                                       callee_info, operand_map,
4316                                       offset_map, clause,
4317                                       toplev_predicate);
4318       if (p != false && nonconstp != false)
4319         {
4320           sreal add_time = ((sreal)e->time * freq);
4321           int prob = e->nonconst_predicate.probability (callee_info->conds,
4322                                                         clause, es->param);
4323           if (prob != REG_BR_PROB_BASE)
4324             add_time = add_time * prob / REG_BR_PROB_BASE;
4325           if (prob != REG_BR_PROB_BASE
4326               && dump_file && (dump_flags & TDF_DETAILS))
4327             {
4328               fprintf (dump_file, "\t\tScaling time by probability:%f\n",
4329                        (double) prob / REG_BR_PROB_BASE);
4330             }
4331           info->account_size_time (e->size, add_time, p, nonconstp);
4332         }
4333     }
4334   remap_edge_summaries (edge, edge->callee, info, params_summary,
4335                         callee_info, operand_map,
4336                         offset_map, clause, &toplev_predicate);
4337   remap_freqcounting_predicate (info, params_summary, callee_info,
4338                                 info->loop_iterations, operand_map,
4339                                 offset_map, clause, &toplev_predicate);
4340   remap_freqcounting_predicate (info, params_summary, callee_info,
4341                                 info->loop_strides, operand_map,
4342                                 offset_map, clause, &toplev_predicate);
4343
4344   HOST_WIDE_INT stack_frame_offset = ipa_get_stack_frame_offset (edge->callee);
4345   HOST_WIDE_INT peak = stack_frame_offset + callee_info->estimated_stack_size;
4346
4347   if (info->estimated_stack_size < peak)
4348     info->estimated_stack_size = peak;
4349
4350   inline_update_callee_summaries (edge->callee, es->loop_depth);
4351   if (info->call_size_time_table.length ())
4352     {
4353       int edge_size = 0;
4354       sreal edge_time = 0;
4355
4356       estimate_edge_size_and_time (edge, &edge_size, NULL, &edge_time, NULL, 0);
4357       /* Unaccount size and time of the optimized out call.  */
4358       info->account_size_time (-edge_size, -edge_time,
4359                                es->predicate ? *es->predicate : true,
4360                                es->predicate ? *es->predicate : true,
4361                                true);
4362       /* Account new calls.  */
4363       summarize_calls_size_and_time (edge->callee, info);
4364     }
4365
4366   /* Free summaries that are not maintained for inline clones/edges.  */
4367   ipa_call_summaries->remove (edge);
4368   ipa_fn_summaries->remove (edge->callee);
4369   ipa_remove_from_growth_caches (edge);
4370 }
4371
4372 /* For performance reasons ipa_merge_fn_summary_after_inlining is not updating
4373    overall size and time.  Recompute it.
4374    If RESET is true also recompute call_time_size_table.  */
4375
4376 void
4377 ipa_update_overall_fn_summary (struct cgraph_node *node, bool reset)
4378 {
4379   class ipa_fn_summary *info = ipa_fn_summaries->get (node);
4380   class ipa_size_summary *size_info = ipa_size_summaries->get (node);
4381   size_time_entry *e;
4382   int i;
4383
4384   size_info->size = 0;
4385   info->time = 0;
4386   for (i = 0; info->size_time_table.iterate (i, &e); i++)
4387     {
4388       size_info->size += e->size;
4389       info->time += e->time;
4390     }
4391   info->min_size = info->size_time_table[0].size;
4392   if (reset)
4393     info->call_size_time_table.release ();
4394   if (node->callees || node->indirect_calls)
4395     estimate_calls_size_and_time (node, &size_info->size, &info->min_size,
4396                                   &info->time, NULL,
4397                                   ~(clause_t) (1 << ipa_predicate::false_condition),
4398                                   NULL);
4399   size_info->size = RDIV (size_info->size, ipa_fn_summary::size_scale);
4400   info->min_size = RDIV (info->min_size, ipa_fn_summary::size_scale);
4401 }
4402
4403
4404 /* This function performs intraprocedural analysis in NODE that is required to
4405    inline indirect calls.  */
4406
4407 static void
4408 inline_indirect_intraprocedural_analysis (struct cgraph_node *node)
4409 {
4410   ipa_analyze_node (node);
4411   if (dump_file && (dump_flags & TDF_DETAILS))
4412     {
4413       ipa_print_node_params (dump_file, node);
4414       ipa_print_node_jump_functions (dump_file, node);
4415     }
4416 }
4417
4418
4419 /* Note function body size.  */
4420
4421 void
4422 inline_analyze_function (struct cgraph_node *node)
4423 {
4424   push_cfun (DECL_STRUCT_FUNCTION (node->decl));
4425
4426   if (dump_file)
4427     fprintf (dump_file, "\nAnalyzing function: %s\n", node->dump_name ());
4428   if (opt_for_fn (node->decl, optimize) && !node->thunk)
4429     inline_indirect_intraprocedural_analysis (node);
4430   compute_fn_summary (node, false);
4431   if (!optimize)
4432     {
4433       struct cgraph_edge *e;
4434       for (e = node->callees; e; e = e->next_callee)
4435         e->inline_failed = CIF_FUNCTION_NOT_OPTIMIZED;
4436       for (e = node->indirect_calls; e; e = e->next_callee)
4437         e->inline_failed = CIF_FUNCTION_NOT_OPTIMIZED;
4438     }
4439
4440   pop_cfun ();
4441 }
4442
4443
/* Called when new function NODE is inserted to callgraph late.  The
   summary pointer passed as the second argument is unused; NODE is
   simply run through inline_analyze_function.  */

void
ipa_fn_summary_t::insert (struct cgraph_node *node, ipa_fn_summary *)
{
  inline_analyze_function (node);
}
4451
4452 /* Note function body size.  */
4453
4454 static void
4455 ipa_fn_summary_generate (void)
4456 {
4457   struct cgraph_node *node;
4458
4459   FOR_EACH_DEFINED_FUNCTION (node)
4460     if (DECL_STRUCT_FUNCTION (node->decl))
4461       node->versionable = tree_versionable_function_p (node->decl);
4462
4463   ipa_fn_summary_alloc ();
4464
4465   ipa_fn_summaries->enable_insertion_hook ();
4466
4467   ipa_register_cgraph_hooks ();
4468
4469   FOR_EACH_DEFINED_FUNCTION (node)
4470     if (!node->alias
4471         && (flag_generate_lto || flag_generate_offload|| flag_wpa
4472             || opt_for_fn (node->decl, optimize)))
4473       inline_analyze_function (node);
4474 }
4475
4476
4477 /* Write inline summary for edge E to OB.  */
4478
4479 static void
4480 read_ipa_call_summary (class lto_input_block *ib, struct cgraph_edge *e,
4481                        bool prevails)
4482 {
4483   class ipa_call_summary *es = prevails
4484                                 ? ipa_call_summaries->get_create (e) : NULL;
4485   ipa_predicate p;
4486   int length, i;
4487
4488   int size = streamer_read_uhwi (ib);
4489   int time = streamer_read_uhwi (ib);
4490   int depth = streamer_read_uhwi (ib);
4491
4492   if (es)
4493     {
4494       es->call_stmt_size = size;
4495       es->call_stmt_time = time;
4496       es->loop_depth = depth;
4497     }
4498
4499   bitpack_d bp = streamer_read_bitpack (ib);
4500   if (es)
4501     es->is_return_callee_uncaptured = bp_unpack_value (&bp, 1);
4502   else
4503     bp_unpack_value (&bp, 1);
4504
4505   p.stream_in (ib);
4506   if (es)
4507     edge_set_predicate (e, &p);
4508   length = streamer_read_uhwi (ib);
4509   if (length && es
4510       && (e->possibly_call_in_translation_unit_p ()
4511           /* Also stream in jump functions to builtins in hope that they
4512              will get fnspecs.  */
4513           || fndecl_built_in_p (e->callee->decl, BUILT_IN_NORMAL)))
4514     {
4515       es->param.safe_grow_cleared (length, true);
4516       for (i = 0; i < length; i++)
4517         {
4518           es->param[i].change_prob = streamer_read_uhwi (ib);
4519           bitpack_d bp = streamer_read_bitpack (ib);
4520           es->param[i].points_to_local_or_readonly_memory
4521             = bp_unpack_value (&bp, 1);
4522           es->param[i].points_to_possible_sra_candidate
4523             = bp_unpack_value (&bp, 1);
4524         }
4525     }
4526   else
4527     {
4528       for (i = 0; i < length; i++)
4529         {
4530           streamer_read_uhwi (ib);
4531           streamer_read_uhwi (ib);
4532         }
4533     }
4534 }
4535
4536
4537 /* Stream in inline summaries from the section.  */
4538
4539 static void
4540 inline_read_section (struct lto_file_decl_data *file_data, const char *data,
4541                      size_t len)
4542 {
4543   const struct lto_function_header *header =
4544     (const struct lto_function_header *) data;
4545   const int cfg_offset = sizeof (struct lto_function_header);
4546   const int main_offset = cfg_offset + header->cfg_size;
4547   const int string_offset = main_offset + header->main_size;
4548   class data_in *data_in;
4549   unsigned int i, count2, j;
4550   unsigned int f_count;
4551
4552   lto_input_block ib ((const char *) data + main_offset, header->main_size,
4553                       file_data);
4554
4555   data_in =
4556     lto_data_in_create (file_data, (const char *) data + string_offset,
4557                         header->string_size, vNULL);
4558   f_count = streamer_read_uhwi (&ib);
4559   for (i = 0; i < f_count; i++)
4560     {
4561       unsigned int index;
4562       struct cgraph_node *node;
4563       class ipa_fn_summary *info;
4564       class ipa_node_params *params_summary;
4565       class ipa_size_summary *size_info;
4566       lto_symtab_encoder_t encoder;
4567       struct bitpack_d bp;
4568       struct cgraph_edge *e;
4569       ipa_predicate p;
4570
4571       index = streamer_read_uhwi (&ib);
4572       encoder = file_data->symtab_node_encoder;
4573       node = dyn_cast<cgraph_node *> (lto_symtab_encoder_deref (encoder,
4574                                                                 index));
4575       info = node->prevailing_p () ? ipa_fn_summaries->get_create (node) : NULL;
4576       params_summary = node->prevailing_p ()
4577                        ? ipa_node_params_sum->get (node) : NULL;
4578       size_info = node->prevailing_p ()
4579                   ? ipa_size_summaries->get_create (node) : NULL;
4580
4581       int stack_size = streamer_read_uhwi (&ib);
4582       int size = streamer_read_uhwi (&ib);
4583       sreal time = sreal::stream_in (&ib);
4584
4585       if (info)
4586         {
4587           info->estimated_stack_size
4588             = size_info->estimated_self_stack_size = stack_size;
4589           size_info->size = size_info->self_size = size;
4590           info->time = time;
4591         }
4592
4593       bp = streamer_read_bitpack (&ib);
4594       if (info)
4595         {
4596           info->inlinable = bp_unpack_value (&bp, 1);
4597           info->fp_expressions = bp_unpack_value (&bp, 1);
4598           if (!lto_stream_offload_p)
4599             info->target_info = streamer_read_uhwi (&ib);
4600         }
4601       else
4602         {
4603           bp_unpack_value (&bp, 1);
4604           bp_unpack_value (&bp, 1);
4605           if (!lto_stream_offload_p)
4606             streamer_read_uhwi (&ib);
4607         }
4608
4609       count2 = streamer_read_uhwi (&ib);
4610       gcc_assert (!info || !info->conds);
4611       if (info)
4612         vec_safe_reserve_exact (info->conds, count2);
4613       for (j = 0; j < count2; j++)
4614         {
4615           struct condition c;
4616           unsigned int k, count3;
4617           c.operand_num = streamer_read_uhwi (&ib);
4618           c.code = (enum tree_code) streamer_read_uhwi (&ib);
4619           c.type = stream_read_tree (&ib, data_in);
4620           c.val = stream_read_tree (&ib, data_in);
4621           bp = streamer_read_bitpack (&ib);
4622           c.agg_contents = bp_unpack_value (&bp, 1);
4623           c.by_ref = bp_unpack_value (&bp, 1);
4624           if (c.agg_contents)
4625             c.offset = streamer_read_uhwi (&ib);
4626           count3 = streamer_read_uhwi (&ib);
4627           c.param_ops = NULL;
4628           if (info)
4629             vec_safe_reserve_exact (c.param_ops, count3);
4630           if (params_summary)
4631             ipa_set_param_used_by_ipa_predicates
4632                     (params_summary, c.operand_num, true);
4633           for (k = 0; k < count3; k++)
4634             {
4635               struct expr_eval_op op;
4636               enum gimple_rhs_class rhs_class;
4637               op.code = (enum tree_code) streamer_read_uhwi (&ib);
4638               op.type = stream_read_tree (&ib, data_in);
4639               switch (rhs_class = get_gimple_rhs_class (op.code))
4640                 {
4641                 case GIMPLE_UNARY_RHS:
4642                   op.index = 0;
4643                   op.val[0] = NULL_TREE;
4644                   op.val[1] = NULL_TREE;
4645                   break;
4646
4647                 case GIMPLE_BINARY_RHS:
4648                 case GIMPLE_TERNARY_RHS:
4649                   bp = streamer_read_bitpack (&ib);
4650                   op.index = bp_unpack_value (&bp, 2);
4651                   op.val[0] = stream_read_tree (&ib, data_in);
4652                   if (rhs_class == GIMPLE_BINARY_RHS)
4653                     op.val[1] = NULL_TREE;
4654                   else
4655                     op.val[1] = stream_read_tree (&ib, data_in);
4656                   break;
4657
4658                 default:
4659                   fatal_error (UNKNOWN_LOCATION,
4660                                "invalid fnsummary in LTO stream");
4661                 }
4662               if (info)
4663                 c.param_ops->quick_push (op);
4664             }
4665           if (info)
4666             info->conds->quick_push (c);
4667         }
4668       count2 = streamer_read_uhwi (&ib);
4669       gcc_assert (!info || !info->size_time_table.length ());
4670       if (info && count2)
4671         info->size_time_table.reserve_exact (count2);
4672       for (j = 0; j < count2; j++)
4673         {
4674           class size_time_entry e;
4675
4676           e.size = streamer_read_uhwi (&ib);
4677           e.time = sreal::stream_in (&ib);
4678           e.exec_predicate.stream_in (&ib);
4679           e.nonconst_predicate.stream_in (&ib);
4680
4681           if (info)
4682             info->size_time_table.quick_push (e);
4683         }
4684
4685       count2 = streamer_read_uhwi (&ib);
4686       for (j = 0; j < count2; j++)
4687         {
4688           p.stream_in (&ib);
4689           sreal fcp_freq = sreal::stream_in (&ib);
4690           if (info)
4691             {
4692               ipa_freqcounting_predicate fcp;
4693               fcp.predicate = NULL;
4694               set_hint_predicate (&fcp.predicate, p);
4695               fcp.freq = fcp_freq;
4696               vec_safe_push (info->loop_iterations, fcp);
4697             }
4698         }
4699       count2 = streamer_read_uhwi (&ib);
4700       for (j = 0; j < count2; j++)
4701         {
4702           p.stream_in (&ib);
4703           sreal fcp_freq = sreal::stream_in (&ib);
4704           if (info)
4705             {
4706               ipa_freqcounting_predicate fcp;
4707               fcp.predicate = NULL;
4708               set_hint_predicate (&fcp.predicate, p);
4709               fcp.freq = fcp_freq;
4710               vec_safe_push (info->loop_strides, fcp);
4711             }
4712         }
4713       count2 = streamer_read_uhwi (&ib);
4714       if (info && count2)
4715         info->builtin_constant_p_parms.reserve_exact (count2);
4716       for (j = 0; j < count2; j++)
4717         {
4718           int parm = streamer_read_uhwi (&ib);
4719           if (info)
4720             info->builtin_constant_p_parms.quick_push (parm);
4721         }
4722       for (e = node->callees; e; e = e->next_callee)
4723         read_ipa_call_summary (&ib, e, info != NULL);
4724       for (e = node->indirect_calls; e; e = e->next_callee)
4725         read_ipa_call_summary (&ib, e, info != NULL);
4726     }
4727
4728   lto_free_section_data (file_data, LTO_section_ipa_fn_summary, NULL, data,
4729                          len);
4730   lto_data_in_delete (data_in);
4731 }
4732
4733
4734 /* Read inline summary.  Jump functions are shared among ipa-cp
4735    and inliner, so when ipa-cp is active, we don't need to write them
4736    twice.  */
4737
4738 static void
4739 ipa_fn_summary_read (void)
4740 {
4741   struct lto_file_decl_data **file_data_vec = lto_get_file_decl_data ();
4742   struct lto_file_decl_data *file_data;
4743   unsigned int j = 0;
4744
4745   ipa_prop_read_jump_functions ();
4746   ipa_fn_summary_alloc ();
4747
4748   while ((file_data = file_data_vec[j++]))
4749     {
4750       size_t len;
4751       const char *data
4752         = lto_get_summary_section_data (file_data, LTO_section_ipa_fn_summary,
4753                                         &len);
4754       if (data)
4755         inline_read_section (file_data, data, len);
4756       else
4757         /* Fatal error here.  We do not want to support compiling ltrans units
4758            with different version of compiler or different flags than the WPA
4759            unit, so this should never happen.  */
4760         fatal_error (input_location,
4761                      "ipa inline summary is missing in input file");
4762     }
4763   ipa_register_cgraph_hooks ();
4764
4765   gcc_assert (ipa_fn_summaries);
4766   ipa_fn_summaries->enable_insertion_hook ();
4767 }
4768
4769
4770 /* Write inline summary for edge E to OB.  */
4771
4772 static void
4773 write_ipa_call_summary (struct output_block *ob, struct cgraph_edge *e)
4774 {
4775   class ipa_call_summary *es = ipa_call_summaries->get (e);
4776   int i;
4777
4778   streamer_write_uhwi (ob, es->call_stmt_size);
4779   streamer_write_uhwi (ob, es->call_stmt_time);
4780   streamer_write_uhwi (ob, es->loop_depth);
4781
4782   bitpack_d bp = bitpack_create (ob->main_stream);
4783   bp_pack_value (&bp, es->is_return_callee_uncaptured, 1);
4784   streamer_write_bitpack (&bp);
4785
4786   if (es->predicate)
4787     es->predicate->stream_out (ob);
4788   else
4789     streamer_write_uhwi (ob, 0);
4790   streamer_write_uhwi (ob, es->param.length ());
4791   for (i = 0; i < (int) es->param.length (); i++)
4792     {
4793       streamer_write_uhwi (ob, es->param[i].change_prob);
4794       bp = bitpack_create (ob->main_stream);
4795       bp_pack_value (&bp, es->param[i].points_to_local_or_readonly_memory, 1);
4796       bp_pack_value (&bp, es->param[i].points_to_possible_sra_candidate, 1);
4797       streamer_write_bitpack (&bp);
4798     }
4799 }
4800
4801
4802 /* Write inline summary for node in SET.
4803    Jump functions are shared among ipa-cp and inliner, so when ipa-cp is
4804    active, we don't need to write them twice.  */
4805
4806 static void
4807 ipa_fn_summary_write (void)
4808 {
4809   struct output_block *ob = create_output_block (LTO_section_ipa_fn_summary);
4810   lto_symtab_encoder_iterator lsei;
4811   lto_symtab_encoder_t encoder = ob->decl_state->symtab_node_encoder;
4812   unsigned int count = 0;
4813
4814   for (lsei = lsei_start_function_in_partition (encoder); !lsei_end_p (lsei);
4815        lsei_next_function_in_partition (&lsei))
4816     {
4817       cgraph_node *cnode = lsei_cgraph_node (lsei);
4818       if (cnode->definition && !cnode->alias)
4819         count++;
4820     }
4821   streamer_write_uhwi (ob, count);
4822
4823   for (lsei = lsei_start_function_in_partition (encoder); !lsei_end_p (lsei);
4824        lsei_next_function_in_partition (&lsei))
4825     {
4826       cgraph_node *cnode = lsei_cgraph_node (lsei);
4827       if (cnode->definition && !cnode->alias)
4828         {
4829           class ipa_fn_summary *info = ipa_fn_summaries->get (cnode);
4830           class ipa_size_summary *size_info = ipa_size_summaries->get (cnode);
4831           struct bitpack_d bp;
4832           struct cgraph_edge *edge;
4833           int i;
4834           size_time_entry *e;
4835           struct condition *c;
4836
4837           streamer_write_uhwi (ob, lto_symtab_encoder_encode (encoder, cnode));
4838           streamer_write_hwi (ob, size_info->estimated_self_stack_size);
4839           streamer_write_hwi (ob, size_info->self_size);
4840           info->time.stream_out (ob);
4841           bp = bitpack_create (ob->main_stream);
4842           bp_pack_value (&bp, info->inlinable, 1);
4843           bp_pack_value (&bp, info->fp_expressions, 1);
4844           streamer_write_bitpack (&bp);
4845           if (!lto_stream_offload_p)
4846             streamer_write_uhwi (ob, info->target_info);
4847           streamer_write_uhwi (ob, vec_safe_length (info->conds));
4848           for (i = 0; vec_safe_iterate (info->conds, i, &c); i++)
4849             {
4850               int j;
4851               struct expr_eval_op *op;
4852
4853               streamer_write_uhwi (ob, c->operand_num);
4854               streamer_write_uhwi (ob, c->code);
4855               stream_write_tree (ob, c->type, true);
4856               stream_write_tree (ob, c->val, true);
4857               bp = bitpack_create (ob->main_stream);
4858               bp_pack_value (&bp, c->agg_contents, 1);
4859               bp_pack_value (&bp, c->by_ref, 1);
4860               streamer_write_bitpack (&bp);
4861               if (c->agg_contents)
4862                 streamer_write_uhwi (ob, c->offset);
4863               streamer_write_uhwi (ob, vec_safe_length (c->param_ops));
4864               for (j = 0; vec_safe_iterate (c->param_ops, j, &op); j++)
4865                 {
4866                   streamer_write_uhwi (ob, op->code);
4867                   stream_write_tree (ob, op->type, true);
4868                   if (op->val[0])
4869                     {
4870                       bp = bitpack_create (ob->main_stream);
4871                       bp_pack_value (&bp, op->index, 2);
4872                       streamer_write_bitpack (&bp);
4873                       stream_write_tree (ob, op->val[0], true);
4874                       if (op->val[1])
4875                         stream_write_tree (ob, op->val[1], true);
4876                     }
4877                 }
4878             }
4879           streamer_write_uhwi (ob, info->size_time_table.length ());
4880           for (i = 0; info->size_time_table.iterate (i, &e); i++)
4881             {
4882               streamer_write_uhwi (ob, e->size);
4883               e->time.stream_out (ob);
4884               e->exec_predicate.stream_out (ob);
4885               e->nonconst_predicate.stream_out (ob);
4886             }
4887           ipa_freqcounting_predicate *fcp;
4888           streamer_write_uhwi (ob, vec_safe_length (info->loop_iterations));
4889           for (i = 0; vec_safe_iterate (info->loop_iterations, i, &fcp); i++)
4890             {
4891               fcp->predicate->stream_out (ob);
4892               fcp->freq.stream_out (ob);
4893             }
4894           streamer_write_uhwi (ob, vec_safe_length (info->loop_strides));
4895           for (i = 0; vec_safe_iterate (info->loop_strides, i, &fcp); i++)
4896             {
4897               fcp->predicate->stream_out (ob);
4898               fcp->freq.stream_out (ob);
4899             }
4900           streamer_write_uhwi (ob, info->builtin_constant_p_parms.length ());
4901           int ip;
4902           for (i = 0; info->builtin_constant_p_parms.iterate (i, &ip);
4903                i++)
4904             streamer_write_uhwi (ob, ip);
4905           for (edge = cnode->callees; edge; edge = edge->next_callee)
4906             write_ipa_call_summary (ob, edge);
4907           for (edge = cnode->indirect_calls; edge; edge = edge->next_callee)
4908             write_ipa_call_summary (ob, edge);
4909         }
4910     }
4911   streamer_write_char_stream (ob->main_stream, 0);
4912   produce_asm (ob, NULL);
4913   destroy_output_block (ob);
4914
4915   ipa_prop_write_jump_functions ();
4916 }
4917
4918
4919 /* Release function summary.  */
4920
4921 void
4922 ipa_free_fn_summary (void)
4923 {
4924   if (!ipa_call_summaries)
4925     return;
4926   ggc_delete (ipa_fn_summaries);
4927   ipa_fn_summaries = NULL;
4928   delete ipa_call_summaries;
4929   ipa_call_summaries = NULL;
4930   edge_predicate_pool.release ();
4931   /* During IPA this is one of largest datastructures to release.  */
4932   if (flag_wpa)
4933     ggc_trim ();
4934 }
4935
4936 /* Release function summary.  */
4937
4938 void
4939 ipa_free_size_summary (void)
4940 {
4941   if (!ipa_size_summaries)
4942     return;
4943   delete ipa_size_summaries;
4944   ipa_size_summaries = NULL;
4945 }
4946
4947 namespace {
4948
4949 const pass_data pass_data_local_fn_summary =
4950 {
4951   GIMPLE_PASS, /* type */
4952   "local-fnsummary", /* name */
4953   OPTGROUP_INLINE, /* optinfo_flags */
4954   TV_INLINE_PARAMETERS, /* tv_id */
4955   0, /* properties_required */
4956   0, /* properties_provided */
4957   0, /* properties_destroyed */
4958   0, /* todo_flags_start */
4959   0, /* todo_flags_finish */
4960 };
4961
4962 class pass_local_fn_summary : public gimple_opt_pass
4963 {
4964 public:
4965   pass_local_fn_summary (gcc::context *ctxt)
4966     : gimple_opt_pass (pass_data_local_fn_summary, ctxt)
4967   {}
4968
4969   /* opt_pass methods: */
4970   opt_pass * clone () final override
4971   {
4972     return new pass_local_fn_summary (m_ctxt);
4973   }
4974   unsigned int execute (function *) final override
4975     {
4976       return compute_fn_summary_for_current ();
4977     }
4978
4979 }; // class pass_local_fn_summary
4980
4981 } // anon namespace
4982
4983 gimple_opt_pass *
4984 make_pass_local_fn_summary (gcc::context *ctxt)
4985 {
4986   return new pass_local_fn_summary (ctxt);
4987 }
4988
4989
4990 /* Free inline summary.  */
4991
4992 namespace {
4993
4994 const pass_data pass_data_ipa_free_fn_summary =
4995 {
4996   SIMPLE_IPA_PASS, /* type */
4997   "free-fnsummary", /* name */
4998   OPTGROUP_NONE, /* optinfo_flags */
4999   TV_IPA_FREE_INLINE_SUMMARY, /* tv_id */
5000   0, /* properties_required */
5001   0, /* properties_provided */
5002   0, /* properties_destroyed */
5003   0, /* todo_flags_start */
5004   0, /* todo_flags_finish */
5005 };
5006
5007 class pass_ipa_free_fn_summary : public simple_ipa_opt_pass
5008 {
5009 public:
5010   pass_ipa_free_fn_summary (gcc::context *ctxt)
5011     : simple_ipa_opt_pass (pass_data_ipa_free_fn_summary, ctxt),
5012       small_p (false)
5013   {}
5014
5015   /* opt_pass methods: */
5016   opt_pass *clone () final override
5017   {
5018     return new pass_ipa_free_fn_summary (m_ctxt);
5019   }
5020   void set_pass_param (unsigned int n, bool param) final override
5021     {
5022       gcc_assert (n == 0);
5023       small_p = param;
5024     }
5025   bool gate (function *) final override { return true; }
5026   unsigned int execute (function *) final override
5027     {
5028       ipa_free_fn_summary ();
5029       /* Free ipa-prop structures if they are no longer needed.  */
5030       ipa_free_all_structures_after_iinln ();
5031       if (!flag_wpa)
5032         ipa_free_size_summary ();
5033       return 0;
5034     }
5035
5036 private:
5037   bool small_p;
5038 }; // class pass_ipa_free_fn_summary
5039
5040 } // anon namespace
5041
5042 simple_ipa_opt_pass *
5043 make_pass_ipa_free_fn_summary (gcc::context *ctxt)
5044 {
5045   return new pass_ipa_free_fn_summary (ctxt);
5046 }
5047
5048 namespace {
5049
5050 const pass_data pass_data_ipa_fn_summary =
5051 {
5052   IPA_PASS, /* type */
5053   "fnsummary", /* name */
5054   OPTGROUP_INLINE, /* optinfo_flags */
5055   TV_IPA_FNSUMMARY, /* tv_id */
5056   0, /* properties_required */
5057   0, /* properties_provided */
5058   0, /* properties_destroyed */
5059   0, /* todo_flags_start */
5060   ( TODO_dump_symtab ), /* todo_flags_finish */
5061 };
5062
5063 class pass_ipa_fn_summary : public ipa_opt_pass_d
5064 {
5065 public:
5066   pass_ipa_fn_summary (gcc::context *ctxt)
5067     : ipa_opt_pass_d (pass_data_ipa_fn_summary, ctxt,
5068                       ipa_fn_summary_generate, /* generate_summary */
5069                       ipa_fn_summary_write, /* write_summary */
5070                       ipa_fn_summary_read, /* read_summary */
5071                       NULL, /* write_optimization_summary */
5072                       NULL, /* read_optimization_summary */
5073                       NULL, /* stmt_fixup */
5074                       0, /* function_transform_todo_flags_start */
5075                       NULL, /* function_transform */
5076                       NULL) /* variable_transform */
5077   {}
5078
5079   /* opt_pass methods: */
5080   unsigned int execute (function *) final override { return 0; }
5081
5082 }; // class pass_ipa_fn_summary
5083
5084 } // anon namespace
5085
5086 ipa_opt_pass_d *
5087 make_pass_ipa_fn_summary (gcc::context *ctxt)
5088 {
5089   return new pass_ipa_fn_summary (ctxt);
5090 }
5091
5092 /* Reset all state within ipa-fnsummary.cc so that we can rerun the compiler
5093    within the same process.  For use by toplev::finalize.  */
5094
5095 void
5096 ipa_fnsummary_cc_finalize (void)
5097 {
5098   ipa_free_fn_summary ();
5099   ipa_free_size_summary ();
5100 }