[gcc]
[official-gcc.git] / gcc / tree-inline.c
blob4b937ca8daa2ee13ecb6ed054ab4e677b655d027
1 /* Tree inlining.
2 Copyright (C) 2001-2014 Free Software Foundation, Inc.
3 Contributed by Alexandre Oliva <aoliva@redhat.com>
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation; either version 3, or (at your option)
10 any later version.
12 GCC is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
21 #include "config.h"
22 #include "system.h"
23 #include "coretypes.h"
24 #include "tm.h"
25 #include "diagnostic-core.h"
26 #include "tree.h"
27 #include "stor-layout.h"
28 #include "calls.h"
29 #include "tree-inline.h"
30 #include "flags.h"
31 #include "params.h"
32 #include "input.h"
33 #include "insn-config.h"
34 #include "hashtab.h"
35 #include "langhooks.h"
36 #include "predict.h"
37 #include "vec.h"
38 #include "hash-set.h"
39 #include "machmode.h"
40 #include "hard-reg-set.h"
41 #include "function.h"
42 #include "dominance.h"
43 #include "cfg.h"
44 #include "cfganal.h"
45 #include "basic-block.h"
46 #include "tree-iterator.h"
47 #include "intl.h"
48 #include "tree-ssa-alias.h"
49 #include "internal-fn.h"
50 #include "gimple-fold.h"
51 #include "tree-eh.h"
52 #include "gimple-expr.h"
53 #include "is-a.h"
54 #include "gimple.h"
55 #include "gimplify.h"
56 #include "gimple-iterator.h"
57 #include "gimplify-me.h"
58 #include "gimple-walk.h"
59 #include "gimple-ssa.h"
60 #include "tree-cfg.h"
61 #include "tree-phinodes.h"
62 #include "ssa-iterators.h"
63 #include "stringpool.h"
64 #include "tree-ssanames.h"
65 #include "tree-into-ssa.h"
66 #include "expr.h"
67 #include "tree-dfa.h"
68 #include "tree-ssa.h"
69 #include "tree-pretty-print.h"
70 #include "except.h"
71 #include "debug.h"
72 #include "hash-map.h"
73 #include "plugin-api.h"
74 #include "ipa-ref.h"
75 #include "cgraph.h"
76 #include "alloc-pool.h"
77 #include "ipa-prop.h"
78 #include "value-prof.h"
79 #include "tree-pass.h"
80 #include "target.h"
81 #include "cfgloop.h"
82 #include "builtins.h"
83 #include "tree-chkp.h"
85 #include "rtl.h" /* FIXME: For asm_str_count. */
87 /* I'm not real happy about this, but we need to handle gimple and
88 non-gimple trees. */
90 /* Inlining, Cloning, Versioning, Parallelization
92 Inlining: a function body is duplicated, but the PARM_DECLs are
93 remapped into VAR_DECLs, and non-void RETURN_EXPRs become
94 MODIFY_EXPRs that store to a dedicated returned-value variable.
95 The duplicated eh_region info of the copy will later be appended
96 to the info for the caller; the eh_region info in copied throwing
97 statements and RESX statements are adjusted accordingly.
99 Cloning: (only in C++) We have one body for a con/de/structor, and
100 multiple function decls, each with a unique parameter list.
101 Duplicate the body, using the given splay tree; some parameters
102 will become constants (like 0 or 1).
104 Versioning: a function body is duplicated and the result is a new
105 function rather than into blocks of an existing function as with
106 inlining. Some parameters will become constants.
108 Parallelization: a region of a function is duplicated resulting in
109 a new function. Variables may be replaced with complex expressions
110 to enable shared variable semantics.
112 All of these will simultaneously lookup any callgraph edges. If
113 we're going to inline the duplicated function body, and the given
114 function has some cloned callgraph nodes (one for each place this
115 function will be inlined) those callgraph edges will be duplicated.
116 If we're cloning the body, those callgraph edges will be
117 updated to point into the new body. (Note that the original
118 callgraph node and edge list will not be altered.)
120 See the CALL_EXPR handling case in copy_tree_body_r (). */
122 /* To Do:
124 o In order to make inlining-on-trees work, we pessimized
125 function-local static constants. In particular, they are now
126 always output, even when not addressed. Fix this by treating
127 function-local static constants just like global static
128 constants; the back-end already knows not to output them if they
129 are not needed.
131 o Provide heuristics to clamp inlining of recursive template
132 calls? */
135 /* Weights that estimate_num_insns uses to estimate the size of the
136 produced code. */
138 eni_weights eni_size_weights;
140 /* Weights that estimate_num_insns uses to estimate the time necessary
141 to execute the produced code. */
143 eni_weights eni_time_weights;
145 /* Prototypes. */
147 static tree declare_return_variable (copy_body_data *, tree, tree, tree,
148 basic_block);
149 static void remap_block (tree *, copy_body_data *);
150 static void copy_bind_expr (tree *, int *, copy_body_data *);
151 static void declare_inline_vars (tree, tree);
152 static void remap_save_expr (tree *, hash_map<tree, tree> *, int *);
153 static void prepend_lexical_block (tree current_block, tree new_block);
154 static tree copy_decl_to_var (tree, copy_body_data *);
155 static tree copy_result_decl_to_var (tree, copy_body_data *);
156 static tree copy_decl_maybe_to_var (tree, copy_body_data *);
157 static gimple_seq remap_gimple_stmt (gimple, copy_body_data *);
158 static bool delete_unreachable_blocks_update_callgraph (copy_body_data *id);
159 static void insert_init_stmt (copy_body_data *, basic_block, gimple);
161 /* Insert a tree->tree mapping for ID. Despite the name suggests
162 that the trees should be variables, it is used for more than that. */
164 void
165 insert_decl_map (copy_body_data *id, tree key, tree value)
167 id->decl_map->put (key, value);
169 /* Always insert an identity map as well. If we see this same new
170 node again, we won't want to duplicate it a second time. */
171 if (key != value)
172 id->decl_map->put (value, value);
175 /* Insert a tree->tree mapping for ID. This is only used for
176 variables. */
178 static void
179 insert_debug_decl_map (copy_body_data *id, tree key, tree value)
181 if (!gimple_in_ssa_p (id->src_cfun))
182 return;
184 if (!MAY_HAVE_DEBUG_STMTS)
185 return;
187 if (!target_for_debug_bind (key))
188 return;
190 gcc_assert (TREE_CODE (key) == PARM_DECL);
191 gcc_assert (TREE_CODE (value) == VAR_DECL);
193 if (!id->debug_map)
194 id->debug_map = new hash_map<tree, tree>;
196 id->debug_map->put (key, value);
/* Nonzero while the contents of inlined debug statements are being
   remapped.  A negative value signals that an error has occurred,
   such as a reference to a variable that is not available in the
   inlined context.  Starts out as zero.  */
static int processing_debug_stmt;
205 /* Construct new SSA name for old NAME. ID is the inline context. */
207 static tree
208 remap_ssa_name (tree name, copy_body_data *id)
210 tree new_tree, var;
211 tree *n;
213 gcc_assert (TREE_CODE (name) == SSA_NAME);
215 n = id->decl_map->get (name);
216 if (n)
217 return unshare_expr (*n);
219 if (processing_debug_stmt)
221 if (SSA_NAME_IS_DEFAULT_DEF (name)
222 && TREE_CODE (SSA_NAME_VAR (name)) == PARM_DECL
223 && id->entry_bb == NULL
224 && single_succ_p (ENTRY_BLOCK_PTR_FOR_FN (cfun)))
226 tree vexpr = make_node (DEBUG_EXPR_DECL);
227 gimple def_temp;
228 gimple_stmt_iterator gsi;
229 tree val = SSA_NAME_VAR (name);
231 n = id->decl_map->get (val);
232 if (n != NULL)
233 val = *n;
234 if (TREE_CODE (val) != PARM_DECL)
236 processing_debug_stmt = -1;
237 return name;
239 def_temp = gimple_build_debug_source_bind (vexpr, val, NULL);
240 DECL_ARTIFICIAL (vexpr) = 1;
241 TREE_TYPE (vexpr) = TREE_TYPE (name);
242 DECL_MODE (vexpr) = DECL_MODE (SSA_NAME_VAR (name));
243 gsi = gsi_after_labels (single_succ (ENTRY_BLOCK_PTR_FOR_FN (cfun)));
244 gsi_insert_before (&gsi, def_temp, GSI_SAME_STMT);
245 return vexpr;
248 processing_debug_stmt = -1;
249 return name;
252 /* Remap anonymous SSA names or SSA names of anonymous decls. */
253 var = SSA_NAME_VAR (name);
254 if (!var
255 || (!SSA_NAME_IS_DEFAULT_DEF (name)
256 && TREE_CODE (var) == VAR_DECL
257 && !VAR_DECL_IS_VIRTUAL_OPERAND (var)
258 && DECL_ARTIFICIAL (var)
259 && DECL_IGNORED_P (var)
260 && !DECL_NAME (var)))
262 struct ptr_info_def *pi;
263 new_tree = make_ssa_name (remap_type (TREE_TYPE (name), id), NULL);
264 if (!var && SSA_NAME_IDENTIFIER (name))
265 SET_SSA_NAME_VAR_OR_IDENTIFIER (new_tree, SSA_NAME_IDENTIFIER (name));
266 insert_decl_map (id, name, new_tree);
267 SSA_NAME_OCCURS_IN_ABNORMAL_PHI (new_tree)
268 = SSA_NAME_OCCURS_IN_ABNORMAL_PHI (name);
269 /* At least IPA points-to info can be directly transferred. */
270 if (id->src_cfun->gimple_df
271 && id->src_cfun->gimple_df->ipa_pta
272 && (pi = SSA_NAME_PTR_INFO (name))
273 && !pi->pt.anything)
275 struct ptr_info_def *new_pi = get_ptr_info (new_tree);
276 new_pi->pt = pi->pt;
278 return new_tree;
281 /* Do not set DEF_STMT yet as statement is not copied yet. We do that
282 in copy_bb. */
283 new_tree = remap_decl (var, id);
285 /* We might've substituted constant or another SSA_NAME for
286 the variable.
288 Replace the SSA name representing RESULT_DECL by variable during
289 inlining: this saves us from need to introduce PHI node in a case
290 return value is just partly initialized. */
291 if ((TREE_CODE (new_tree) == VAR_DECL || TREE_CODE (new_tree) == PARM_DECL)
292 && (!SSA_NAME_VAR (name)
293 || TREE_CODE (SSA_NAME_VAR (name)) != RESULT_DECL
294 || !id->transform_return_to_modify))
296 struct ptr_info_def *pi;
297 new_tree = make_ssa_name (new_tree, NULL);
298 insert_decl_map (id, name, new_tree);
299 SSA_NAME_OCCURS_IN_ABNORMAL_PHI (new_tree)
300 = SSA_NAME_OCCURS_IN_ABNORMAL_PHI (name);
301 /* At least IPA points-to info can be directly transferred. */
302 if (id->src_cfun->gimple_df
303 && id->src_cfun->gimple_df->ipa_pta
304 && (pi = SSA_NAME_PTR_INFO (name))
305 && !pi->pt.anything)
307 struct ptr_info_def *new_pi = get_ptr_info (new_tree);
308 new_pi->pt = pi->pt;
310 if (SSA_NAME_IS_DEFAULT_DEF (name))
312 /* By inlining function having uninitialized variable, we might
313 extend the lifetime (variable might get reused). This cause
314 ICE in the case we end up extending lifetime of SSA name across
315 abnormal edge, but also increase register pressure.
317 We simply initialize all uninitialized vars by 0 except
318 for case we are inlining to very first BB. We can avoid
319 this for all BBs that are not inside strongly connected
320 regions of the CFG, but this is expensive to test. */
321 if (id->entry_bb
322 && SSA_NAME_OCCURS_IN_ABNORMAL_PHI (name)
323 && (!SSA_NAME_VAR (name)
324 || TREE_CODE (SSA_NAME_VAR (name)) != PARM_DECL)
325 && (id->entry_bb != EDGE_SUCC (ENTRY_BLOCK_PTR_FOR_FN (cfun),
326 0)->dest
327 || EDGE_COUNT (id->entry_bb->preds) != 1))
329 gimple_stmt_iterator gsi = gsi_last_bb (id->entry_bb);
330 gimple init_stmt;
331 tree zero = build_zero_cst (TREE_TYPE (new_tree));
333 init_stmt = gimple_build_assign (new_tree, zero);
334 gsi_insert_after (&gsi, init_stmt, GSI_NEW_STMT);
335 SSA_NAME_IS_DEFAULT_DEF (new_tree) = 0;
337 else
339 SSA_NAME_DEF_STMT (new_tree) = gimple_build_nop ();
340 set_ssa_default_def (cfun, SSA_NAME_VAR (new_tree), new_tree);
344 else
345 insert_decl_map (id, name, new_tree);
346 return new_tree;
349 /* Remap DECL during the copying of the BLOCK tree for the function. */
351 tree
352 remap_decl (tree decl, copy_body_data *id)
354 tree *n;
356 /* We only remap local variables in the current function. */
358 /* See if we have remapped this declaration. */
360 n = id->decl_map->get (decl);
362 if (!n && processing_debug_stmt)
364 processing_debug_stmt = -1;
365 return decl;
368 /* If we didn't already have an equivalent for this declaration,
369 create one now. */
370 if (!n)
372 /* Make a copy of the variable or label. */
373 tree t = id->copy_decl (decl, id);
375 /* Remember it, so that if we encounter this local entity again
376 we can reuse this copy. Do this early because remap_type may
377 need this decl for TYPE_STUB_DECL. */
378 insert_decl_map (id, decl, t);
380 if (!DECL_P (t))
381 return t;
383 /* Remap types, if necessary. */
384 TREE_TYPE (t) = remap_type (TREE_TYPE (t), id);
385 if (TREE_CODE (t) == TYPE_DECL)
386 DECL_ORIGINAL_TYPE (t) = remap_type (DECL_ORIGINAL_TYPE (t), id);
388 /* Remap sizes as necessary. */
389 walk_tree (&DECL_SIZE (t), copy_tree_body_r, id, NULL);
390 walk_tree (&DECL_SIZE_UNIT (t), copy_tree_body_r, id, NULL);
392 /* If fields, do likewise for offset and qualifier. */
393 if (TREE_CODE (t) == FIELD_DECL)
395 walk_tree (&DECL_FIELD_OFFSET (t), copy_tree_body_r, id, NULL);
396 if (TREE_CODE (DECL_CONTEXT (t)) == QUAL_UNION_TYPE)
397 walk_tree (&DECL_QUALIFIER (t), copy_tree_body_r, id, NULL);
400 return t;
403 if (id->do_not_unshare)
404 return *n;
405 else
406 return unshare_expr (*n);
409 static tree
410 remap_type_1 (tree type, copy_body_data *id)
412 tree new_tree, t;
414 /* We do need a copy. build and register it now. If this is a pointer or
415 reference type, remap the designated type and make a new pointer or
416 reference type. */
417 if (TREE_CODE (type) == POINTER_TYPE)
419 new_tree = build_pointer_type_for_mode (remap_type (TREE_TYPE (type), id),
420 TYPE_MODE (type),
421 TYPE_REF_CAN_ALIAS_ALL (type));
422 if (TYPE_ATTRIBUTES (type) || TYPE_QUALS (type))
423 new_tree = build_type_attribute_qual_variant (new_tree,
424 TYPE_ATTRIBUTES (type),
425 TYPE_QUALS (type));
426 insert_decl_map (id, type, new_tree);
427 return new_tree;
429 else if (TREE_CODE (type) == REFERENCE_TYPE)
431 new_tree = build_reference_type_for_mode (remap_type (TREE_TYPE (type), id),
432 TYPE_MODE (type),
433 TYPE_REF_CAN_ALIAS_ALL (type));
434 if (TYPE_ATTRIBUTES (type) || TYPE_QUALS (type))
435 new_tree = build_type_attribute_qual_variant (new_tree,
436 TYPE_ATTRIBUTES (type),
437 TYPE_QUALS (type));
438 insert_decl_map (id, type, new_tree);
439 return new_tree;
441 else
442 new_tree = copy_node (type);
444 insert_decl_map (id, type, new_tree);
446 /* This is a new type, not a copy of an old type. Need to reassociate
447 variants. We can handle everything except the main variant lazily. */
448 t = TYPE_MAIN_VARIANT (type);
449 if (type != t)
451 t = remap_type (t, id);
452 TYPE_MAIN_VARIANT (new_tree) = t;
453 TYPE_NEXT_VARIANT (new_tree) = TYPE_NEXT_VARIANT (t);
454 TYPE_NEXT_VARIANT (t) = new_tree;
456 else
458 TYPE_MAIN_VARIANT (new_tree) = new_tree;
459 TYPE_NEXT_VARIANT (new_tree) = NULL;
462 if (TYPE_STUB_DECL (type))
463 TYPE_STUB_DECL (new_tree) = remap_decl (TYPE_STUB_DECL (type), id);
465 /* Lazily create pointer and reference types. */
466 TYPE_POINTER_TO (new_tree) = NULL;
467 TYPE_REFERENCE_TO (new_tree) = NULL;
469 /* Copy all types that may contain references to local variables; be sure to
470 preserve sharing in between type and its main variant when possible. */
471 switch (TREE_CODE (new_tree))
473 case INTEGER_TYPE:
474 case REAL_TYPE:
475 case FIXED_POINT_TYPE:
476 case ENUMERAL_TYPE:
477 case BOOLEAN_TYPE:
478 if (TYPE_MAIN_VARIANT (new_tree) != new_tree)
480 gcc_checking_assert (TYPE_MIN_VALUE (type) == TYPE_MIN_VALUE (TYPE_MAIN_VARIANT (type)));
481 gcc_checking_assert (TYPE_MAX_VALUE (type) == TYPE_MAX_VALUE (TYPE_MAIN_VARIANT (type)));
483 TYPE_MIN_VALUE (new_tree) = TYPE_MIN_VALUE (TYPE_MAIN_VARIANT (new_tree));
484 TYPE_MAX_VALUE (new_tree) = TYPE_MAX_VALUE (TYPE_MAIN_VARIANT (new_tree));
486 else
488 t = TYPE_MIN_VALUE (new_tree);
489 if (t && TREE_CODE (t) != INTEGER_CST)
490 walk_tree (&TYPE_MIN_VALUE (new_tree), copy_tree_body_r, id, NULL);
492 t = TYPE_MAX_VALUE (new_tree);
493 if (t && TREE_CODE (t) != INTEGER_CST)
494 walk_tree (&TYPE_MAX_VALUE (new_tree), copy_tree_body_r, id, NULL);
496 return new_tree;
498 case FUNCTION_TYPE:
499 if (TYPE_MAIN_VARIANT (new_tree) != new_tree
500 && TREE_TYPE (type) == TREE_TYPE (TYPE_MAIN_VARIANT (type)))
501 TREE_TYPE (new_tree) = TREE_TYPE (TYPE_MAIN_VARIANT (new_tree));
502 else
503 TREE_TYPE (new_tree) = remap_type (TREE_TYPE (new_tree), id);
504 if (TYPE_MAIN_VARIANT (new_tree) != new_tree
505 && TYPE_ARG_TYPES (type) == TYPE_ARG_TYPES (TYPE_MAIN_VARIANT (type)))
506 TYPE_ARG_TYPES (new_tree) = TYPE_ARG_TYPES (TYPE_MAIN_VARIANT (new_tree));
507 else
508 walk_tree (&TYPE_ARG_TYPES (new_tree), copy_tree_body_r, id, NULL);
509 return new_tree;
511 case ARRAY_TYPE:
512 if (TYPE_MAIN_VARIANT (new_tree) != new_tree
513 && TREE_TYPE (type) == TREE_TYPE (TYPE_MAIN_VARIANT (type)))
514 TREE_TYPE (new_tree) = TREE_TYPE (TYPE_MAIN_VARIANT (new_tree));
515 else
516 TREE_TYPE (new_tree) = remap_type (TREE_TYPE (new_tree), id);
518 if (TYPE_MAIN_VARIANT (new_tree) != new_tree)
520 gcc_checking_assert (TYPE_DOMAIN (type) == TYPE_DOMAIN (TYPE_MAIN_VARIANT (type)));
521 TYPE_DOMAIN (new_tree) = TYPE_DOMAIN (TYPE_MAIN_VARIANT (new_tree));
523 else
524 TYPE_DOMAIN (new_tree) = remap_type (TYPE_DOMAIN (new_tree), id);
525 break;
527 case RECORD_TYPE:
528 case UNION_TYPE:
529 case QUAL_UNION_TYPE:
530 if (TYPE_MAIN_VARIANT (type) != type
531 && TYPE_FIELDS (type) == TYPE_FIELDS (TYPE_MAIN_VARIANT (type)))
532 TYPE_FIELDS (new_tree) = TYPE_FIELDS (TYPE_MAIN_VARIANT (new_tree));
533 else
535 tree f, nf = NULL;
537 for (f = TYPE_FIELDS (new_tree); f ; f = DECL_CHAIN (f))
539 t = remap_decl (f, id);
540 DECL_CONTEXT (t) = new_tree;
541 DECL_CHAIN (t) = nf;
542 nf = t;
544 TYPE_FIELDS (new_tree) = nreverse (nf);
546 break;
548 case OFFSET_TYPE:
549 default:
550 /* Shouldn't have been thought variable sized. */
551 gcc_unreachable ();
554 /* All variants of type share the same size, so use the already remaped data. */
555 if (TYPE_MAIN_VARIANT (new_tree) != new_tree)
557 gcc_checking_assert (TYPE_SIZE (type) == TYPE_SIZE (TYPE_MAIN_VARIANT (type)));
558 gcc_checking_assert (TYPE_SIZE_UNIT (type) == TYPE_SIZE_UNIT (TYPE_MAIN_VARIANT (type)));
560 TYPE_SIZE (new_tree) = TYPE_SIZE (TYPE_MAIN_VARIANT (new_tree));
561 TYPE_SIZE_UNIT (new_tree) = TYPE_SIZE_UNIT (TYPE_MAIN_VARIANT (new_tree));
563 else
565 walk_tree (&TYPE_SIZE (new_tree), copy_tree_body_r, id, NULL);
566 walk_tree (&TYPE_SIZE_UNIT (new_tree), copy_tree_body_r, id, NULL);
569 return new_tree;
572 tree
573 remap_type (tree type, copy_body_data *id)
575 tree *node;
576 tree tmp;
578 if (type == NULL)
579 return type;
581 /* See if we have remapped this type. */
582 node = id->decl_map->get (type);
583 if (node)
584 return *node;
586 /* The type only needs remapping if it's variably modified. */
587 if (! variably_modified_type_p (type, id->src_fn))
589 insert_decl_map (id, type, type);
590 return type;
593 id->remapping_type_depth++;
594 tmp = remap_type_1 (type, id);
595 id->remapping_type_depth--;
597 return tmp;
600 /* Decide if DECL can be put into BLOCK_NONLOCAL_VARs. */
602 static bool
603 can_be_nonlocal (tree decl, copy_body_data *id)
605 /* We can not duplicate function decls. */
606 if (TREE_CODE (decl) == FUNCTION_DECL)
607 return true;
609 /* Local static vars must be non-local or we get multiple declaration
610 problems. */
611 if (TREE_CODE (decl) == VAR_DECL
612 && !auto_var_in_fn_p (decl, id->src_fn))
613 return true;
615 return false;
618 static tree
619 remap_decls (tree decls, vec<tree, va_gc> **nonlocalized_list,
620 copy_body_data *id)
622 tree old_var;
623 tree new_decls = NULL_TREE;
625 /* Remap its variables. */
626 for (old_var = decls; old_var; old_var = DECL_CHAIN (old_var))
628 tree new_var;
630 if (can_be_nonlocal (old_var, id))
632 /* We need to add this variable to the local decls as otherwise
633 nothing else will do so. */
634 if (TREE_CODE (old_var) == VAR_DECL
635 && ! DECL_EXTERNAL (old_var))
636 add_local_decl (cfun, old_var);
637 if ((!optimize || debug_info_level > DINFO_LEVEL_TERSE)
638 && !DECL_IGNORED_P (old_var)
639 && nonlocalized_list)
640 vec_safe_push (*nonlocalized_list, old_var);
641 continue;
644 /* Remap the variable. */
645 new_var = remap_decl (old_var, id);
647 /* If we didn't remap this variable, we can't mess with its
648 TREE_CHAIN. If we remapped this variable to the return slot, it's
649 already declared somewhere else, so don't declare it here. */
651 if (new_var == id->retvar)
653 else if (!new_var)
655 if ((!optimize || debug_info_level > DINFO_LEVEL_TERSE)
656 && !DECL_IGNORED_P (old_var)
657 && nonlocalized_list)
658 vec_safe_push (*nonlocalized_list, old_var);
660 else
662 gcc_assert (DECL_P (new_var));
663 DECL_CHAIN (new_var) = new_decls;
664 new_decls = new_var;
666 /* Also copy value-expressions. */
667 if (TREE_CODE (new_var) == VAR_DECL
668 && DECL_HAS_VALUE_EXPR_P (new_var))
670 tree tem = DECL_VALUE_EXPR (new_var);
671 bool old_regimplify = id->regimplify;
672 id->remapping_type_depth++;
673 walk_tree (&tem, copy_tree_body_r, id, NULL);
674 id->remapping_type_depth--;
675 id->regimplify = old_regimplify;
676 SET_DECL_VALUE_EXPR (new_var, tem);
681 return nreverse (new_decls);
684 /* Copy the BLOCK to contain remapped versions of the variables
685 therein. And hook the new block into the block-tree. */
687 static void
688 remap_block (tree *block, copy_body_data *id)
690 tree old_block;
691 tree new_block;
693 /* Make the new block. */
694 old_block = *block;
695 new_block = make_node (BLOCK);
696 TREE_USED (new_block) = TREE_USED (old_block);
697 BLOCK_ABSTRACT_ORIGIN (new_block) = old_block;
698 BLOCK_SOURCE_LOCATION (new_block) = BLOCK_SOURCE_LOCATION (old_block);
699 BLOCK_NONLOCALIZED_VARS (new_block)
700 = vec_safe_copy (BLOCK_NONLOCALIZED_VARS (old_block));
701 *block = new_block;
703 /* Remap its variables. */
704 BLOCK_VARS (new_block) = remap_decls (BLOCK_VARS (old_block),
705 &BLOCK_NONLOCALIZED_VARS (new_block),
706 id);
708 if (id->transform_lang_insert_block)
709 id->transform_lang_insert_block (new_block);
711 /* Remember the remapped block. */
712 insert_decl_map (id, old_block, new_block);
715 /* Copy the whole block tree and root it in id->block. */
716 static tree
717 remap_blocks (tree block, copy_body_data *id)
719 tree t;
720 tree new_tree = block;
722 if (!block)
723 return NULL;
725 remap_block (&new_tree, id);
726 gcc_assert (new_tree != block);
727 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
728 prepend_lexical_block (new_tree, remap_blocks (t, id));
729 /* Blocks are in arbitrary order, but make things slightly prettier and do
730 not swap order when producing a copy. */
731 BLOCK_SUBBLOCKS (new_tree) = blocks_nreverse (BLOCK_SUBBLOCKS (new_tree));
732 return new_tree;
735 /* Remap the block tree rooted at BLOCK to nothing. */
736 static void
737 remap_blocks_to_null (tree block, copy_body_data *id)
739 tree t;
740 insert_decl_map (id, block, NULL_TREE);
741 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
742 remap_blocks_to_null (t, id);
745 static void
746 copy_statement_list (tree *tp)
748 tree_stmt_iterator oi, ni;
749 tree new_tree;
751 new_tree = alloc_stmt_list ();
752 ni = tsi_start (new_tree);
753 oi = tsi_start (*tp);
754 TREE_TYPE (new_tree) = TREE_TYPE (*tp);
755 *tp = new_tree;
757 for (; !tsi_end_p (oi); tsi_next (&oi))
759 tree stmt = tsi_stmt (oi);
760 if (TREE_CODE (stmt) == STATEMENT_LIST)
761 /* This copy is not redundant; tsi_link_after will smash this
762 STATEMENT_LIST into the end of the one we're building, and we
763 don't want to do that with the original. */
764 copy_statement_list (&stmt);
765 tsi_link_after (&ni, stmt, TSI_CONTINUE_LINKING);
769 static void
770 copy_bind_expr (tree *tp, int *walk_subtrees, copy_body_data *id)
772 tree block = BIND_EXPR_BLOCK (*tp);
773 /* Copy (and replace) the statement. */
774 copy_tree_r (tp, walk_subtrees, NULL);
775 if (block)
777 remap_block (&block, id);
778 BIND_EXPR_BLOCK (*tp) = block;
781 if (BIND_EXPR_VARS (*tp))
782 /* This will remap a lot of the same decls again, but this should be
783 harmless. */
784 BIND_EXPR_VARS (*tp) = remap_decls (BIND_EXPR_VARS (*tp), NULL, id);
788 /* Create a new gimple_seq by remapping all the statements in BODY
789 using the inlining information in ID. */
791 static gimple_seq
792 remap_gimple_seq (gimple_seq body, copy_body_data *id)
794 gimple_stmt_iterator si;
795 gimple_seq new_body = NULL;
797 for (si = gsi_start (body); !gsi_end_p (si); gsi_next (&si))
799 gimple_seq new_stmts = remap_gimple_stmt (gsi_stmt (si), id);
800 gimple_seq_add_seq (&new_body, new_stmts);
803 return new_body;
807 /* Copy a GIMPLE_BIND statement STMT, remapping all the symbols in its
808 block using the mapping information in ID. */
810 static gimple
811 copy_gimple_bind (gimple stmt, copy_body_data *id)
813 gimple new_bind;
814 tree new_block, new_vars;
815 gimple_seq body, new_body;
817 /* Copy the statement. Note that we purposely don't use copy_stmt
818 here because we need to remap statements as we copy. */
819 body = gimple_bind_body (stmt);
820 new_body = remap_gimple_seq (body, id);
822 new_block = gimple_bind_block (stmt);
823 if (new_block)
824 remap_block (&new_block, id);
826 /* This will remap a lot of the same decls again, but this should be
827 harmless. */
828 new_vars = gimple_bind_vars (stmt);
829 if (new_vars)
830 new_vars = remap_decls (new_vars, NULL, id);
832 new_bind = gimple_build_bind (new_vars, new_body, new_block);
834 return new_bind;
837 /* Return true if DECL is a parameter or a SSA_NAME for a parameter. */
839 static bool
840 is_parm (tree decl)
842 if (TREE_CODE (decl) == SSA_NAME)
844 decl = SSA_NAME_VAR (decl);
845 if (!decl)
846 return false;
849 return (TREE_CODE (decl) == PARM_DECL);
852 /* Remap the GIMPLE operand pointed to by *TP. DATA is really a
853 'struct walk_stmt_info *'. DATA->INFO is a 'copy_body_data *'.
854 WALK_SUBTREES is used to indicate walk_gimple_op whether to keep
855 recursing into the children nodes of *TP. */
857 static tree
858 remap_gimple_op_r (tree *tp, int *walk_subtrees, void *data)
860 struct walk_stmt_info *wi_p = (struct walk_stmt_info *) data;
861 copy_body_data *id = (copy_body_data *) wi_p->info;
862 tree fn = id->src_fn;
864 if (TREE_CODE (*tp) == SSA_NAME)
866 *tp = remap_ssa_name (*tp, id);
867 *walk_subtrees = 0;
868 return NULL;
870 else if (auto_var_in_fn_p (*tp, fn))
872 /* Local variables and labels need to be replaced by equivalent
873 variables. We don't want to copy static variables; there's
874 only one of those, no matter how many times we inline the
875 containing function. Similarly for globals from an outer
876 function. */
877 tree new_decl;
879 /* Remap the declaration. */
880 new_decl = remap_decl (*tp, id);
881 gcc_assert (new_decl);
882 /* Replace this variable with the copy. */
883 STRIP_TYPE_NOPS (new_decl);
884 /* ??? The C++ frontend uses void * pointer zero to initialize
885 any other type. This confuses the middle-end type verification.
886 As cloned bodies do not go through gimplification again the fixup
887 there doesn't trigger. */
888 if (TREE_CODE (new_decl) == INTEGER_CST
889 && !useless_type_conversion_p (TREE_TYPE (*tp), TREE_TYPE (new_decl)))
890 new_decl = fold_convert (TREE_TYPE (*tp), new_decl);
891 *tp = new_decl;
892 *walk_subtrees = 0;
894 else if (TREE_CODE (*tp) == STATEMENT_LIST)
895 gcc_unreachable ();
896 else if (TREE_CODE (*tp) == SAVE_EXPR)
897 gcc_unreachable ();
898 else if (TREE_CODE (*tp) == LABEL_DECL
899 && (!DECL_CONTEXT (*tp)
900 || decl_function_context (*tp) == id->src_fn))
901 /* These may need to be remapped for EH handling. */
902 *tp = remap_decl (*tp, id);
903 else if (TREE_CODE (*tp) == FIELD_DECL)
905 /* If the enclosing record type is variably_modified_type_p, the field
906 has already been remapped. Otherwise, it need not be. */
907 tree *n = id->decl_map->get (*tp);
908 if (n)
909 *tp = *n;
910 *walk_subtrees = 0;
912 else if (TYPE_P (*tp))
913 /* Types may need remapping as well. */
914 *tp = remap_type (*tp, id);
915 else if (CONSTANT_CLASS_P (*tp))
917 /* If this is a constant, we have to copy the node iff the type
918 will be remapped. copy_tree_r will not copy a constant. */
919 tree new_type = remap_type (TREE_TYPE (*tp), id);
921 if (new_type == TREE_TYPE (*tp))
922 *walk_subtrees = 0;
924 else if (TREE_CODE (*tp) == INTEGER_CST)
925 *tp = wide_int_to_tree (new_type, *tp);
926 else
928 *tp = copy_node (*tp);
929 TREE_TYPE (*tp) = new_type;
932 else
934 /* Otherwise, just copy the node. Note that copy_tree_r already
935 knows not to copy VAR_DECLs, etc., so this is safe. */
937 if (TREE_CODE (*tp) == MEM_REF)
939 /* We need to re-canonicalize MEM_REFs from inline substitutions
940 that can happen when a pointer argument is an ADDR_EXPR.
941 Recurse here manually to allow that. */
942 tree ptr = TREE_OPERAND (*tp, 0);
943 tree type = remap_type (TREE_TYPE (*tp), id);
944 tree old = *tp;
945 walk_tree (&ptr, remap_gimple_op_r, data, NULL);
946 *tp = fold_build2 (MEM_REF, type, ptr, TREE_OPERAND (*tp, 1));
947 TREE_THIS_VOLATILE (*tp) = TREE_THIS_VOLATILE (old);
948 TREE_SIDE_EFFECTS (*tp) = TREE_SIDE_EFFECTS (old);
949 TREE_NO_WARNING (*tp) = TREE_NO_WARNING (old);
950 /* We cannot propagate the TREE_THIS_NOTRAP flag if we have
951 remapped a parameter as the property might be valid only
952 for the parameter itself. */
953 if (TREE_THIS_NOTRAP (old)
954 && (!is_parm (TREE_OPERAND (old, 0))
955 || (!id->transform_parameter && is_parm (ptr))))
956 TREE_THIS_NOTRAP (*tp) = 1;
957 *walk_subtrees = 0;
958 return NULL;
961 /* Here is the "usual case". Copy this tree node, and then
962 tweak some special cases. */
963 copy_tree_r (tp, walk_subtrees, NULL);
965 if (TREE_CODE (*tp) != OMP_CLAUSE)
966 TREE_TYPE (*tp) = remap_type (TREE_TYPE (*tp), id);
968 if (TREE_CODE (*tp) == TARGET_EXPR && TREE_OPERAND (*tp, 3))
970 /* The copied TARGET_EXPR has never been expanded, even if the
971 original node was expanded already. */
972 TREE_OPERAND (*tp, 1) = TREE_OPERAND (*tp, 3);
973 TREE_OPERAND (*tp, 3) = NULL_TREE;
975 else if (TREE_CODE (*tp) == ADDR_EXPR)
977 /* Variable substitution need not be simple. In particular,
978 the MEM_REF substitution above. Make sure that
979 TREE_CONSTANT and friends are up-to-date. */
980 int invariant = is_gimple_min_invariant (*tp);
981 walk_tree (&TREE_OPERAND (*tp, 0), remap_gimple_op_r, data, NULL);
982 recompute_tree_invariant_for_addr_expr (*tp);
984 /* If this used to be invariant, but is not any longer,
985 then regimplification is probably needed. */
986 if (invariant && !is_gimple_min_invariant (*tp))
987 id->regimplify = true;
989 *walk_subtrees = 0;
993 /* Update the TREE_BLOCK for the cloned expr. */
994 if (EXPR_P (*tp))
996 tree new_block = id->remapping_type_depth == 0 ? id->block : NULL;
997 tree old_block = TREE_BLOCK (*tp);
998 if (old_block)
1000 tree *n;
1001 n = id->decl_map->get (TREE_BLOCK (*tp));
1002 if (n)
1003 new_block = *n;
1005 TREE_SET_BLOCK (*tp, new_block);
1008 /* Keep iterating. */
1009 return NULL_TREE;
1013 /* Called from copy_body_id via walk_tree. DATA is really a
1014 `copy_body_data *'. */
1016 tree
1017 copy_tree_body_r (tree *tp, int *walk_subtrees, void *data)
1019 copy_body_data *id = (copy_body_data *) data;
1020 tree fn = id->src_fn;
1021 tree new_block;
1023 /* Begin by recognizing trees that we'll completely rewrite for the
1024 inlining context. Our output for these trees is completely
1025 different from out input (e.g. RETURN_EXPR is deleted, and morphs
1026 into an edge). Further down, we'll handle trees that get
1027 duplicated and/or tweaked. */
1029 /* When requested, RETURN_EXPRs should be transformed to just the
1030 contained MODIFY_EXPR. The branch semantics of the return will
1031 be handled elsewhere by manipulating the CFG rather than a statement. */
1032 if (TREE_CODE (*tp) == RETURN_EXPR && id->transform_return_to_modify)
1034 tree assignment = TREE_OPERAND (*tp, 0);
1036 /* If we're returning something, just turn that into an
1037 assignment into the equivalent of the original RESULT_DECL.
1038 If the "assignment" is just the result decl, the result
1039 decl has already been set (e.g. a recent "foo (&result_decl,
1040 ...)"); just toss the entire RETURN_EXPR. */
1041 if (assignment && TREE_CODE (assignment) == MODIFY_EXPR)
1043 /* Replace the RETURN_EXPR with (a copy of) the
1044 MODIFY_EXPR hanging underneath. */
1045 *tp = copy_node (assignment);
1047 else /* Else the RETURN_EXPR returns no value. */
1049 *tp = NULL;
1050 return (tree) (void *)1;
1053 else if (TREE_CODE (*tp) == SSA_NAME)
1055 *tp = remap_ssa_name (*tp, id);
1056 *walk_subtrees = 0;
1057 return NULL;
1060 /* Local variables and labels need to be replaced by equivalent
1061 variables. We don't want to copy static variables; there's only
1062 one of those, no matter how many times we inline the containing
1063 function. Similarly for globals from an outer function. */
1064 else if (auto_var_in_fn_p (*tp, fn))
1066 tree new_decl;
1068 /* Remap the declaration. */
1069 new_decl = remap_decl (*tp, id);
1070 gcc_assert (new_decl);
1071 /* Replace this variable with the copy. */
1072 STRIP_TYPE_NOPS (new_decl);
1073 *tp = new_decl;
1074 *walk_subtrees = 0;
1076 else if (TREE_CODE (*tp) == STATEMENT_LIST)
1077 copy_statement_list (tp);
1078 else if (TREE_CODE (*tp) == SAVE_EXPR
1079 || TREE_CODE (*tp) == TARGET_EXPR)
1080 remap_save_expr (tp, id->decl_map, walk_subtrees);
1081 else if (TREE_CODE (*tp) == LABEL_DECL
1082 && (! DECL_CONTEXT (*tp)
1083 || decl_function_context (*tp) == id->src_fn))
1084 /* These may need to be remapped for EH handling. */
1085 *tp = remap_decl (*tp, id);
1086 else if (TREE_CODE (*tp) == BIND_EXPR)
1087 copy_bind_expr (tp, walk_subtrees, id);
1088 /* Types may need remapping as well. */
1089 else if (TYPE_P (*tp))
1090 *tp = remap_type (*tp, id);
1092 /* If this is a constant, we have to copy the node iff the type will be
1093 remapped. copy_tree_r will not copy a constant. */
1094 else if (CONSTANT_CLASS_P (*tp))
1096 tree new_type = remap_type (TREE_TYPE (*tp), id);
1098 if (new_type == TREE_TYPE (*tp))
1099 *walk_subtrees = 0;
1101 else if (TREE_CODE (*tp) == INTEGER_CST)
1102 *tp = wide_int_to_tree (new_type, *tp);
1103 else
1105 *tp = copy_node (*tp);
1106 TREE_TYPE (*tp) = new_type;
1110 /* Otherwise, just copy the node. Note that copy_tree_r already
1111 knows not to copy VAR_DECLs, etc., so this is safe. */
1112 else
1114 /* Here we handle trees that are not completely rewritten.
1115 First we detect some inlining-induced bogosities for
1116 discarding. */
1117 if (TREE_CODE (*tp) == MODIFY_EXPR
1118 && TREE_OPERAND (*tp, 0) == TREE_OPERAND (*tp, 1)
1119 && (auto_var_in_fn_p (TREE_OPERAND (*tp, 0), fn)))
1121 /* Some assignments VAR = VAR; don't generate any rtl code
1122 and thus don't count as variable modification. Avoid
1123 keeping bogosities like 0 = 0. */
1124 tree decl = TREE_OPERAND (*tp, 0), value;
1125 tree *n;
1127 n = id->decl_map->get (decl);
1128 if (n)
1130 value = *n;
1131 STRIP_TYPE_NOPS (value);
1132 if (TREE_CONSTANT (value) || TREE_READONLY (value))
1134 *tp = build_empty_stmt (EXPR_LOCATION (*tp));
1135 return copy_tree_body_r (tp, walk_subtrees, data);
1139 else if (TREE_CODE (*tp) == INDIRECT_REF)
1141 /* Get rid of *& from inline substitutions that can happen when a
1142 pointer argument is an ADDR_EXPR. */
1143 tree decl = TREE_OPERAND (*tp, 0);
1144 tree *n = id->decl_map->get (decl);
1145 if (n)
1147 /* If we happen to get an ADDR_EXPR in n->value, strip
1148 it manually here as we'll eventually get ADDR_EXPRs
1149 which lie about their types pointed to. In this case
1150 build_fold_indirect_ref wouldn't strip the INDIRECT_REF,
1151 but we absolutely rely on that. As fold_indirect_ref
1152 does other useful transformations, try that first, though. */
1153 tree type = TREE_TYPE (*tp);
1154 tree ptr = id->do_not_unshare ? *n : unshare_expr (*n);
1155 tree old = *tp;
1156 *tp = gimple_fold_indirect_ref (ptr);
1157 if (! *tp)
1159 if (TREE_CODE (ptr) == ADDR_EXPR)
1162 = fold_indirect_ref_1 (EXPR_LOCATION (ptr), type, ptr);
1163 /* ??? We should either assert here or build
1164 a VIEW_CONVERT_EXPR instead of blindly leaking
1165 incompatible types to our IL. */
1166 if (! *tp)
1167 *tp = TREE_OPERAND (ptr, 0);
1169 else
1171 *tp = build1 (INDIRECT_REF, type, ptr);
1172 TREE_THIS_VOLATILE (*tp) = TREE_THIS_VOLATILE (old);
1173 TREE_SIDE_EFFECTS (*tp) = TREE_SIDE_EFFECTS (old);
1174 TREE_READONLY (*tp) = TREE_READONLY (old);
1175 /* We cannot propagate the TREE_THIS_NOTRAP flag if we
1176 have remapped a parameter as the property might be
1177 valid only for the parameter itself. */
1178 if (TREE_THIS_NOTRAP (old)
1179 && (!is_parm (TREE_OPERAND (old, 0))
1180 || (!id->transform_parameter && is_parm (ptr))))
1181 TREE_THIS_NOTRAP (*tp) = 1;
1184 *walk_subtrees = 0;
1185 return NULL;
1188 else if (TREE_CODE (*tp) == MEM_REF)
1190 /* We need to re-canonicalize MEM_REFs from inline substitutions
1191 that can happen when a pointer argument is an ADDR_EXPR.
1192 Recurse here manually to allow that. */
1193 tree ptr = TREE_OPERAND (*tp, 0);
1194 tree type = remap_type (TREE_TYPE (*tp), id);
1195 tree old = *tp;
1196 walk_tree (&ptr, copy_tree_body_r, data, NULL);
1197 *tp = fold_build2 (MEM_REF, type, ptr, TREE_OPERAND (*tp, 1));
1198 TREE_THIS_VOLATILE (*tp) = TREE_THIS_VOLATILE (old);
1199 TREE_SIDE_EFFECTS (*tp) = TREE_SIDE_EFFECTS (old);
1200 TREE_NO_WARNING (*tp) = TREE_NO_WARNING (old);
1201 /* We cannot propagate the TREE_THIS_NOTRAP flag if we have
1202 remapped a parameter as the property might be valid only
1203 for the parameter itself. */
1204 if (TREE_THIS_NOTRAP (old)
1205 && (!is_parm (TREE_OPERAND (old, 0))
1206 || (!id->transform_parameter && is_parm (ptr))))
1207 TREE_THIS_NOTRAP (*tp) = 1;
1208 *walk_subtrees = 0;
1209 return NULL;
1212 /* Here is the "usual case". Copy this tree node, and then
1213 tweak some special cases. */
1214 copy_tree_r (tp, walk_subtrees, NULL);
1216 /* If EXPR has block defined, map it to newly constructed block.
1217 When inlining we want EXPRs without block appear in the block
1218 of function call if we are not remapping a type. */
1219 if (EXPR_P (*tp))
1221 new_block = id->remapping_type_depth == 0 ? id->block : NULL;
1222 if (TREE_BLOCK (*tp))
1224 tree *n;
1225 n = id->decl_map->get (TREE_BLOCK (*tp));
1226 if (n)
1227 new_block = *n;
1229 TREE_SET_BLOCK (*tp, new_block);
1232 if (TREE_CODE (*tp) != OMP_CLAUSE)
1233 TREE_TYPE (*tp) = remap_type (TREE_TYPE (*tp), id);
1235 /* The copied TARGET_EXPR has never been expanded, even if the
1236 original node was expanded already. */
1237 if (TREE_CODE (*tp) == TARGET_EXPR && TREE_OPERAND (*tp, 3))
1239 TREE_OPERAND (*tp, 1) = TREE_OPERAND (*tp, 3);
1240 TREE_OPERAND (*tp, 3) = NULL_TREE;
1243 /* Variable substitution need not be simple. In particular, the
1244 INDIRECT_REF substitution above. Make sure that TREE_CONSTANT
1245 and friends are up-to-date. */
1246 else if (TREE_CODE (*tp) == ADDR_EXPR)
1248 int invariant = is_gimple_min_invariant (*tp);
1249 walk_tree (&TREE_OPERAND (*tp, 0), copy_tree_body_r, id, NULL);
1251 /* Handle the case where we substituted an INDIRECT_REF
1252 into the operand of the ADDR_EXPR. */
1253 if (TREE_CODE (TREE_OPERAND (*tp, 0)) == INDIRECT_REF)
1254 *tp = TREE_OPERAND (TREE_OPERAND (*tp, 0), 0);
1255 else
1256 recompute_tree_invariant_for_addr_expr (*tp);
1258 /* If this used to be invariant, but is not any longer,
1259 then regimplification is probably needed. */
1260 if (invariant && !is_gimple_min_invariant (*tp))
1261 id->regimplify = true;
1263 *walk_subtrees = 0;
1267 /* Keep iterating. */
1268 return NULL_TREE;
1271 /* Helper for remap_gimple_stmt. Given an EH region number for the
1272 source function, map that to the duplicate EH region number in
1273 the destination function. */
1275 static int
1276 remap_eh_region_nr (int old_nr, copy_body_data *id)
1278 eh_region old_r, new_r;
1280 old_r = get_eh_region_from_number_fn (id->src_cfun, old_nr);
1281 new_r = static_cast<eh_region> (*id->eh_map->get (old_r));
1283 return new_r->index;
1286 /* Similar, but operate on INTEGER_CSTs. */
1288 static tree
1289 remap_eh_region_tree_nr (tree old_t_nr, copy_body_data *id)
1291 int old_nr, new_nr;
1293 old_nr = tree_to_shwi (old_t_nr);
1294 new_nr = remap_eh_region_nr (old_nr, id);
1296 return build_int_cst (integer_type_node, new_nr);
1299 /* Helper for copy_bb. Remap statement STMT using the inlining
1300 information in ID. Return the new statement copy. */
1302 static gimple_seq
1303 remap_gimple_stmt (gimple stmt, copy_body_data *id)
1305 gimple copy = NULL;
1306 struct walk_stmt_info wi;
1307 bool skip_first = false;
1308 gimple_seq stmts = NULL;
1310 /* Begin by recognizing trees that we'll completely rewrite for the
1311 inlining context. Our output for these trees is completely
1312 different from out input (e.g. RETURN_EXPR is deleted, and morphs
1313 into an edge). Further down, we'll handle trees that get
1314 duplicated and/or tweaked. */
1316 /* When requested, GIMPLE_RETURNs should be transformed to just the
1317 contained GIMPLE_ASSIGN. The branch semantics of the return will
1318 be handled elsewhere by manipulating the CFG rather than the
1319 statement. */
1320 if (gimple_code (stmt) == GIMPLE_RETURN && id->transform_return_to_modify)
1322 tree retval = gimple_return_retval (stmt);
1323 tree retbnd = gimple_return_retbnd (stmt);
1324 tree bndslot = id->retbnd;
1326 if (retbnd && bndslot)
1328 gimple bndcopy = gimple_build_assign (bndslot, retbnd);
1329 memset (&wi, 0, sizeof (wi));
1330 wi.info = id;
1331 walk_gimple_op (bndcopy, remap_gimple_op_r, &wi);
1332 gimple_seq_add_stmt (&stmts, bndcopy);
1335 /* If we're returning something, just turn that into an
1336 assignment into the equivalent of the original RESULT_DECL.
1337 If RETVAL is just the result decl, the result decl has
1338 already been set (e.g. a recent "foo (&result_decl, ...)");
1339 just toss the entire GIMPLE_RETURN. */
1340 if (retval
1341 && (TREE_CODE (retval) != RESULT_DECL
1342 && (TREE_CODE (retval) != SSA_NAME
1343 || ! SSA_NAME_VAR (retval)
1344 || TREE_CODE (SSA_NAME_VAR (retval)) != RESULT_DECL)))
1346 copy = gimple_build_assign (id->do_not_unshare
1347 ? id->retvar : unshare_expr (id->retvar),
1348 retval);
1349 /* id->retvar is already substituted. Skip it on later remapping. */
1350 skip_first = true;
1352 /* We need to copy bounds if return structure with pointers into
1353 instrumented function. */
1354 if (chkp_function_instrumented_p (id->dst_fn)
1355 && !bndslot
1356 && !BOUNDED_P (id->retvar)
1357 && chkp_type_has_pointer (TREE_TYPE (id->retvar)))
1358 id->assign_stmts.safe_push (copy);
1361 else
1362 return stmts;
1364 else if (gimple_has_substatements (stmt))
1366 gimple_seq s1, s2;
1368 /* When cloning bodies from the C++ front end, we will be handed bodies
1369 in High GIMPLE form. Handle here all the High GIMPLE statements that
1370 have embedded statements. */
1371 switch (gimple_code (stmt))
1373 case GIMPLE_BIND:
1374 copy = copy_gimple_bind (stmt, id);
1375 break;
1377 case GIMPLE_CATCH:
1378 s1 = remap_gimple_seq (gimple_catch_handler (stmt), id);
1379 copy = gimple_build_catch (gimple_catch_types (stmt), s1);
1380 break;
1382 case GIMPLE_EH_FILTER:
1383 s1 = remap_gimple_seq (gimple_eh_filter_failure (stmt), id);
1384 copy = gimple_build_eh_filter (gimple_eh_filter_types (stmt), s1);
1385 break;
1387 case GIMPLE_TRY:
1388 s1 = remap_gimple_seq (gimple_try_eval (stmt), id);
1389 s2 = remap_gimple_seq (gimple_try_cleanup (stmt), id);
1390 copy = gimple_build_try (s1, s2, gimple_try_kind (stmt));
1391 break;
1393 case GIMPLE_WITH_CLEANUP_EXPR:
1394 s1 = remap_gimple_seq (gimple_wce_cleanup (stmt), id);
1395 copy = gimple_build_wce (s1);
1396 break;
1398 case GIMPLE_OMP_PARALLEL:
1399 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1400 copy = gimple_build_omp_parallel
1401 (s1,
1402 gimple_omp_parallel_clauses (stmt),
1403 gimple_omp_parallel_child_fn (stmt),
1404 gimple_omp_parallel_data_arg (stmt));
1405 break;
1407 case GIMPLE_OMP_TASK:
1408 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1409 copy = gimple_build_omp_task
1410 (s1,
1411 gimple_omp_task_clauses (stmt),
1412 gimple_omp_task_child_fn (stmt),
1413 gimple_omp_task_data_arg (stmt),
1414 gimple_omp_task_copy_fn (stmt),
1415 gimple_omp_task_arg_size (stmt),
1416 gimple_omp_task_arg_align (stmt));
1417 break;
1419 case GIMPLE_OMP_FOR:
1420 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1421 s2 = remap_gimple_seq (gimple_omp_for_pre_body (stmt), id);
1422 copy = gimple_build_omp_for (s1, gimple_omp_for_kind (stmt),
1423 gimple_omp_for_clauses (stmt),
1424 gimple_omp_for_collapse (stmt), s2);
1426 size_t i;
1427 for (i = 0; i < gimple_omp_for_collapse (stmt); i++)
1429 gimple_omp_for_set_index (copy, i,
1430 gimple_omp_for_index (stmt, i));
1431 gimple_omp_for_set_initial (copy, i,
1432 gimple_omp_for_initial (stmt, i));
1433 gimple_omp_for_set_final (copy, i,
1434 gimple_omp_for_final (stmt, i));
1435 gimple_omp_for_set_incr (copy, i,
1436 gimple_omp_for_incr (stmt, i));
1437 gimple_omp_for_set_cond (copy, i,
1438 gimple_omp_for_cond (stmt, i));
1441 break;
1443 case GIMPLE_OMP_MASTER:
1444 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1445 copy = gimple_build_omp_master (s1);
1446 break;
1448 case GIMPLE_OMP_TASKGROUP:
1449 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1450 copy = gimple_build_omp_taskgroup (s1);
1451 break;
1453 case GIMPLE_OMP_ORDERED:
1454 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1455 copy = gimple_build_omp_ordered (s1);
1456 break;
1458 case GIMPLE_OMP_SECTION:
1459 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1460 copy = gimple_build_omp_section (s1);
1461 break;
1463 case GIMPLE_OMP_SECTIONS:
1464 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1465 copy = gimple_build_omp_sections
1466 (s1, gimple_omp_sections_clauses (stmt));
1467 break;
1469 case GIMPLE_OMP_SINGLE:
1470 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1471 copy = gimple_build_omp_single
1472 (s1, gimple_omp_single_clauses (stmt));
1473 break;
1475 case GIMPLE_OMP_TARGET:
1476 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1477 copy = gimple_build_omp_target
1478 (s1, gimple_omp_target_kind (stmt),
1479 gimple_omp_target_clauses (stmt));
1480 break;
1482 case GIMPLE_OMP_TEAMS:
1483 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1484 copy = gimple_build_omp_teams
1485 (s1, gimple_omp_teams_clauses (stmt));
1486 break;
1488 case GIMPLE_OMP_CRITICAL:
1489 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1490 copy
1491 = gimple_build_omp_critical (s1, gimple_omp_critical_name (stmt));
1492 break;
1494 case GIMPLE_TRANSACTION:
1495 s1 = remap_gimple_seq (gimple_transaction_body (stmt), id);
1496 copy = gimple_build_transaction (s1, gimple_transaction_label (stmt));
1497 gimple_transaction_set_subcode (copy, gimple_transaction_subcode (stmt));
1498 break;
1500 default:
1501 gcc_unreachable ();
1504 else
1506 if (gimple_assign_copy_p (stmt)
1507 && gimple_assign_lhs (stmt) == gimple_assign_rhs1 (stmt)
1508 && auto_var_in_fn_p (gimple_assign_lhs (stmt), id->src_fn))
1510 /* Here we handle statements that are not completely rewritten.
1511 First we detect some inlining-induced bogosities for
1512 discarding. */
1514 /* Some assignments VAR = VAR; don't generate any rtl code
1515 and thus don't count as variable modification. Avoid
1516 keeping bogosities like 0 = 0. */
1517 tree decl = gimple_assign_lhs (stmt), value;
1518 tree *n;
1520 n = id->decl_map->get (decl);
1521 if (n)
1523 value = *n;
1524 STRIP_TYPE_NOPS (value);
1525 if (TREE_CONSTANT (value) || TREE_READONLY (value))
1526 return NULL;
1530 /* For *ptr_N ={v} {CLOBBER}, if ptr_N is SSA_NAME defined
1531 in a block that we aren't copying during tree_function_versioning,
1532 just drop the clobber stmt. */
1533 if (id->blocks_to_copy && gimple_clobber_p (stmt))
1535 tree lhs = gimple_assign_lhs (stmt);
1536 if (TREE_CODE (lhs) == MEM_REF
1537 && TREE_CODE (TREE_OPERAND (lhs, 0)) == SSA_NAME)
1539 gimple def_stmt = SSA_NAME_DEF_STMT (TREE_OPERAND (lhs, 0));
1540 if (gimple_bb (def_stmt)
1541 && !bitmap_bit_p (id->blocks_to_copy,
1542 gimple_bb (def_stmt)->index))
1543 return NULL;
1547 if (gimple_debug_bind_p (stmt))
1549 copy = gimple_build_debug_bind (gimple_debug_bind_get_var (stmt),
1550 gimple_debug_bind_get_value (stmt),
1551 stmt);
1552 id->debug_stmts.safe_push (copy);
1553 gimple_seq_add_stmt (&stmts, copy);
1554 return stmts;
1556 if (gimple_debug_source_bind_p (stmt))
1558 copy = gimple_build_debug_source_bind
1559 (gimple_debug_source_bind_get_var (stmt),
1560 gimple_debug_source_bind_get_value (stmt), stmt);
1561 id->debug_stmts.safe_push (copy);
1562 gimple_seq_add_stmt (&stmts, copy);
1563 return stmts;
1566 /* Create a new deep copy of the statement. */
1567 copy = gimple_copy (stmt);
1569 /* Clear flags that need revisiting. */
1570 if (is_gimple_call (copy)
1571 && gimple_call_tail_p (copy))
1572 gimple_call_set_tail (copy, false);
1574 /* Remap the region numbers for __builtin_eh_{pointer,filter},
1575 RESX and EH_DISPATCH. */
1576 if (id->eh_map)
1577 switch (gimple_code (copy))
1579 case GIMPLE_CALL:
1581 tree r, fndecl = gimple_call_fndecl (copy);
1582 if (fndecl && DECL_BUILT_IN_CLASS (fndecl) == BUILT_IN_NORMAL)
1583 switch (DECL_FUNCTION_CODE (fndecl))
1585 case BUILT_IN_EH_COPY_VALUES:
1586 r = gimple_call_arg (copy, 1);
1587 r = remap_eh_region_tree_nr (r, id);
1588 gimple_call_set_arg (copy, 1, r);
1589 /* FALLTHRU */
1591 case BUILT_IN_EH_POINTER:
1592 case BUILT_IN_EH_FILTER:
1593 r = gimple_call_arg (copy, 0);
1594 r = remap_eh_region_tree_nr (r, id);
1595 gimple_call_set_arg (copy, 0, r);
1596 break;
1598 default:
1599 break;
1602 /* Reset alias info if we didn't apply measures to
1603 keep it valid over inlining by setting DECL_PT_UID. */
1604 if (!id->src_cfun->gimple_df
1605 || !id->src_cfun->gimple_df->ipa_pta)
1606 gimple_call_reset_alias_info (copy);
1608 break;
1610 case GIMPLE_RESX:
1612 int r = gimple_resx_region (copy);
1613 r = remap_eh_region_nr (r, id);
1614 gimple_resx_set_region (copy, r);
1616 break;
1618 case GIMPLE_EH_DISPATCH:
1620 int r = gimple_eh_dispatch_region (copy);
1621 r = remap_eh_region_nr (r, id);
1622 gimple_eh_dispatch_set_region (copy, r);
1624 break;
1626 default:
1627 break;
1631 /* If STMT has a block defined, map it to the newly constructed
1632 block. */
1633 if (gimple_block (copy))
1635 tree *n;
1636 n = id->decl_map->get (gimple_block (copy));
1637 gcc_assert (n);
1638 gimple_set_block (copy, *n);
1641 if (gimple_debug_bind_p (copy) || gimple_debug_source_bind_p (copy))
1643 gimple_seq_add_stmt (&stmts, copy);
1644 return stmts;
1647 /* Remap all the operands in COPY. */
1648 memset (&wi, 0, sizeof (wi));
1649 wi.info = id;
1650 if (skip_first)
1651 walk_tree (gimple_op_ptr (copy, 1), remap_gimple_op_r, &wi, NULL);
1652 else
1653 walk_gimple_op (copy, remap_gimple_op_r, &wi);
1655 /* Clear the copied virtual operands. We are not remapping them here
1656 but are going to recreate them from scratch. */
1657 if (gimple_has_mem_ops (copy))
1659 gimple_set_vdef (copy, NULL_TREE);
1660 gimple_set_vuse (copy, NULL_TREE);
1663 gimple_seq_add_stmt (&stmts, copy);
1664 return stmts;
1668 /* Copy basic block, scale profile accordingly. Edges will be taken care of
1669 later */
1671 static basic_block
1672 copy_bb (copy_body_data *id, basic_block bb, int frequency_scale,
1673 gcov_type count_scale)
1675 gimple_stmt_iterator gsi, copy_gsi, seq_gsi;
1676 basic_block copy_basic_block;
1677 tree decl;
1678 gcov_type freq;
1679 basic_block prev;
1681 /* Search for previous copied basic block. */
1682 prev = bb->prev_bb;
1683 while (!prev->aux)
1684 prev = prev->prev_bb;
1686 /* create_basic_block() will append every new block to
1687 basic_block_info automatically. */
1688 copy_basic_block = create_basic_block (NULL, (void *) 0,
1689 (basic_block) prev->aux);
1690 copy_basic_block->count = apply_scale (bb->count, count_scale);
1692 /* We are going to rebuild frequencies from scratch. These values
1693 have just small importance to drive canonicalize_loop_headers. */
1694 freq = apply_scale ((gcov_type)bb->frequency, frequency_scale);
1696 /* We recompute frequencies after inlining, so this is quite safe. */
1697 if (freq > BB_FREQ_MAX)
1698 freq = BB_FREQ_MAX;
1699 copy_basic_block->frequency = freq;
1701 copy_gsi = gsi_start_bb (copy_basic_block);
1703 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
1705 gimple_seq stmts;
1706 gimple stmt = gsi_stmt (gsi);
1707 gimple orig_stmt = stmt;
1708 gimple_stmt_iterator stmts_gsi;
1709 bool stmt_added = false;
1711 id->regimplify = false;
1712 stmts = remap_gimple_stmt (stmt, id);
1714 if (gimple_seq_empty_p (stmts))
1715 continue;
1717 seq_gsi = copy_gsi;
1719 for (stmts_gsi = gsi_start (stmts);
1720 !gsi_end_p (stmts_gsi); )
1722 stmt = gsi_stmt (stmts_gsi);
1724 /* Advance iterator now before stmt is moved to seq_gsi. */
1725 gsi_next (&stmts_gsi);
1727 if (gimple_nop_p (stmt))
1728 continue;
1730 gimple_duplicate_stmt_histograms (cfun, stmt, id->src_cfun,
1731 orig_stmt);
1733 /* With return slot optimization we can end up with
1734 non-gimple (foo *)&this->m, fix that here. */
1735 if (is_gimple_assign (stmt)
1736 && CONVERT_EXPR_CODE_P (gimple_assign_rhs_code (stmt))
1737 && !is_gimple_val (gimple_assign_rhs1 (stmt)))
1739 tree new_rhs;
1740 new_rhs = force_gimple_operand_gsi (&seq_gsi,
1741 gimple_assign_rhs1 (stmt),
1742 true, NULL, false,
1743 GSI_CONTINUE_LINKING);
1744 gimple_assign_set_rhs1 (stmt, new_rhs);
1745 id->regimplify = false;
1748 gsi_insert_after (&seq_gsi, stmt, GSI_NEW_STMT);
1750 if (id->regimplify)
1751 gimple_regimplify_operands (stmt, &seq_gsi);
1753 stmt_added = true;
1756 if (!stmt_added)
1757 continue;
1759 /* If copy_basic_block has been empty at the start of this iteration,
1760 call gsi_start_bb again to get at the newly added statements. */
1761 if (gsi_end_p (copy_gsi))
1762 copy_gsi = gsi_start_bb (copy_basic_block);
1763 else
1764 gsi_next (&copy_gsi);
1766 /* Process the new statement. The call to gimple_regimplify_operands
1767 possibly turned the statement into multiple statements, we
1768 need to process all of them. */
1771 tree fn;
1773 stmt = gsi_stmt (copy_gsi);
1774 if (is_gimple_call (stmt)
1775 && gimple_call_va_arg_pack_p (stmt)
1776 && id->gimple_call)
1778 /* __builtin_va_arg_pack () should be replaced by
1779 all arguments corresponding to ... in the caller. */
1780 tree p;
1781 gimple new_call;
1782 vec<tree> argarray;
1783 size_t nargs = gimple_call_num_args (id->gimple_call);
1784 size_t n, i, nargs_to_copy;
1785 bool remove_bounds = false;
1787 for (p = DECL_ARGUMENTS (id->src_fn); p; p = DECL_CHAIN (p))
1788 nargs--;
1790 /* Bounds should be removed from arg pack in case
1791 we handle not instrumented call in instrumented
1792 function. */
1793 nargs_to_copy = nargs;
1794 if (gimple_call_with_bounds_p (id->gimple_call)
1795 && !gimple_call_with_bounds_p (stmt))
1797 for (i = gimple_call_num_args (id->gimple_call) - nargs;
1798 i < gimple_call_num_args (id->gimple_call);
1799 i++)
1800 if (POINTER_BOUNDS_P (gimple_call_arg (id->gimple_call, i)))
1801 nargs_to_copy--;
1802 remove_bounds = true;
1805 /* Create the new array of arguments. */
1806 n = nargs_to_copy + gimple_call_num_args (stmt);
1807 argarray.create (n);
1808 argarray.safe_grow_cleared (n);
1810 /* Copy all the arguments before '...' */
1811 memcpy (argarray.address (),
1812 gimple_call_arg_ptr (stmt, 0),
1813 gimple_call_num_args (stmt) * sizeof (tree));
1815 if (remove_bounds)
1817 /* Append the rest of arguments removing bounds. */
1818 unsigned cur = gimple_call_num_args (stmt);
1819 i = gimple_call_num_args (id->gimple_call) - nargs;
1820 for (i = gimple_call_num_args (id->gimple_call) - nargs;
1821 i < gimple_call_num_args (id->gimple_call);
1822 i++)
1823 if (!POINTER_BOUNDS_P (gimple_call_arg (id->gimple_call, i)))
1824 argarray[cur++] = gimple_call_arg (id->gimple_call, i);
1825 gcc_assert (cur == n);
1827 else
1829 /* Append the arguments passed in '...' */
1830 memcpy (argarray.address () + gimple_call_num_args (stmt),
1831 gimple_call_arg_ptr (id->gimple_call, 0)
1832 + (gimple_call_num_args (id->gimple_call) - nargs),
1833 nargs * sizeof (tree));
1836 new_call = gimple_build_call_vec (gimple_call_fn (stmt),
1837 argarray);
1839 argarray.release ();
1841 /* Copy all GIMPLE_CALL flags, location and block, except
1842 GF_CALL_VA_ARG_PACK. */
1843 gimple_call_copy_flags (new_call, stmt);
1844 gimple_call_set_va_arg_pack (new_call, false);
1845 gimple_set_location (new_call, gimple_location (stmt));
1846 gimple_set_block (new_call, gimple_block (stmt));
1847 gimple_call_set_lhs (new_call, gimple_call_lhs (stmt));
1849 gsi_replace (&copy_gsi, new_call, false);
1850 stmt = new_call;
1852 else if (is_gimple_call (stmt)
1853 && id->gimple_call
1854 && (decl = gimple_call_fndecl (stmt))
1855 && DECL_BUILT_IN_CLASS (decl) == BUILT_IN_NORMAL
1856 && DECL_FUNCTION_CODE (decl) == BUILT_IN_VA_ARG_PACK_LEN)
1858 /* __builtin_va_arg_pack_len () should be replaced by
1859 the number of anonymous arguments. */
1860 size_t nargs = gimple_call_num_args (id->gimple_call), i;
1861 tree count, p;
1862 gimple new_stmt;
1864 for (p = DECL_ARGUMENTS (id->src_fn); p; p = DECL_CHAIN (p))
1865 nargs--;
1867 /* For instrumented calls we should ignore bounds. */
1868 for (i = gimple_call_num_args (id->gimple_call) - nargs;
1869 i < gimple_call_num_args (id->gimple_call);
1870 i++)
1871 if (POINTER_BOUNDS_P (gimple_call_arg (id->gimple_call, i)))
1872 nargs--;
1874 count = build_int_cst (integer_type_node, nargs);
1875 new_stmt = gimple_build_assign (gimple_call_lhs (stmt), count);
1876 gsi_replace (&copy_gsi, new_stmt, false);
1877 stmt = new_stmt;
1880 /* Statements produced by inlining can be unfolded, especially
1881 when we constant propagated some operands. We can't fold
1882 them right now for two reasons:
1883 1) folding require SSA_NAME_DEF_STMTs to be correct
1884 2) we can't change function calls to builtins.
1885 So we just mark statement for later folding. We mark
1886 all new statements, instead just statements that has changed
1887 by some nontrivial substitution so even statements made
1888 foldable indirectly are updated. If this turns out to be
1889 expensive, copy_body can be told to watch for nontrivial
1890 changes. */
1891 if (id->statements_to_fold)
1892 id->statements_to_fold->add (stmt);
1894 /* We're duplicating a CALL_EXPR. Find any corresponding
1895 callgraph edges and update or duplicate them. */
1896 if (is_gimple_call (stmt))
1898 struct cgraph_edge *edge;
1900 switch (id->transform_call_graph_edges)
1902 case CB_CGE_DUPLICATE:
1903 edge = id->src_node->get_edge (orig_stmt);
1904 if (edge)
1906 int edge_freq = edge->frequency;
1907 int new_freq;
1908 struct cgraph_edge *old_edge = edge;
1909 edge = edge->clone (id->dst_node, stmt,
1910 gimple_uid (stmt),
1911 REG_BR_PROB_BASE, CGRAPH_FREQ_BASE,
1912 true);
1913 /* We could also just rescale the frequency, but
1914 doing so would introduce roundoff errors and make
1915 verifier unhappy. */
1916 new_freq = compute_call_stmt_bb_frequency (id->dst_node->decl,
1917 copy_basic_block);
1919 /* Speculative calls consist of two edges - direct and indirect.
1920 Duplicate the whole thing and distribute frequencies accordingly. */
1921 if (edge->speculative)
1923 struct cgraph_edge *direct, *indirect;
1924 struct ipa_ref *ref;
1926 gcc_assert (!edge->indirect_unknown_callee);
1927 old_edge->speculative_call_info (direct, indirect, ref);
1928 indirect = indirect->clone (id->dst_node, stmt,
1929 gimple_uid (stmt),
1930 REG_BR_PROB_BASE, CGRAPH_FREQ_BASE,
1931 true);
1932 if (old_edge->frequency + indirect->frequency)
1934 edge->frequency = MIN (RDIV ((gcov_type)new_freq * old_edge->frequency,
1935 (old_edge->frequency + indirect->frequency)),
1936 CGRAPH_FREQ_MAX);
1937 indirect->frequency = MIN (RDIV ((gcov_type)new_freq * indirect->frequency,
1938 (old_edge->frequency + indirect->frequency)),
1939 CGRAPH_FREQ_MAX);
1941 id->dst_node->clone_reference (ref, stmt);
1943 else
1945 edge->frequency = new_freq;
1946 if (dump_file
1947 && profile_status_for_fn (cfun) != PROFILE_ABSENT
1948 && (edge_freq > edge->frequency + 10
1949 || edge_freq < edge->frequency - 10))
1951 fprintf (dump_file, "Edge frequency estimated by "
1952 "cgraph %i diverge from inliner's estimate %i\n",
1953 edge_freq,
1954 edge->frequency);
1955 fprintf (dump_file,
1956 "Orig bb: %i, orig bb freq %i, new bb freq %i\n",
1957 bb->index,
1958 bb->frequency,
1959 copy_basic_block->frequency);
1963 break;
1965 case CB_CGE_MOVE_CLONES:
1966 id->dst_node->set_call_stmt_including_clones (orig_stmt,
1967 stmt);
1968 edge = id->dst_node->get_edge (stmt);
1969 break;
1971 case CB_CGE_MOVE:
1972 edge = id->dst_node->get_edge (orig_stmt);
1973 if (edge)
1974 edge->set_call_stmt (stmt);
1975 break;
1977 default:
1978 gcc_unreachable ();
1981 /* Constant propagation on argument done during inlining
1982 may create new direct call. Produce an edge for it. */
1983 if ((!edge
1984 || (edge->indirect_inlining_edge
1985 && id->transform_call_graph_edges == CB_CGE_MOVE_CLONES))
1986 && id->dst_node->definition
1987 && (fn = gimple_call_fndecl (stmt)) != NULL)
1989 struct cgraph_node *dest = cgraph_node::get (fn);
1991 /* We have missing edge in the callgraph. This can happen
1992 when previous inlining turned an indirect call into a
1993 direct call by constant propagating arguments or we are
1994 producing dead clone (for further cloning). In all
1995 other cases we hit a bug (incorrect node sharing is the
1996 most common reason for missing edges). */
1997 gcc_assert (!dest->definition
1998 || dest->address_taken
1999 || !id->src_node->definition
2000 || !id->dst_node->definition);
2001 if (id->transform_call_graph_edges == CB_CGE_MOVE_CLONES)
2002 id->dst_node->create_edge_including_clones
2003 (dest, orig_stmt, stmt, bb->count,
2004 compute_call_stmt_bb_frequency (id->dst_node->decl,
2005 copy_basic_block),
2006 CIF_ORIGINALLY_INDIRECT_CALL);
2007 else
2008 id->dst_node->create_edge (dest, stmt,
2009 bb->count,
2010 compute_call_stmt_bb_frequency
2011 (id->dst_node->decl,
2012 copy_basic_block))->inline_failed
2013 = CIF_ORIGINALLY_INDIRECT_CALL;
2014 if (dump_file)
2016 fprintf (dump_file, "Created new direct edge to %s\n",
2017 dest->name ());
2021 notice_special_calls (stmt);
2024 maybe_duplicate_eh_stmt_fn (cfun, stmt, id->src_cfun, orig_stmt,
2025 id->eh_map, id->eh_lp_nr);
2027 if (gimple_in_ssa_p (cfun) && !is_gimple_debug (stmt))
2029 ssa_op_iter i;
2030 tree def;
2032 FOR_EACH_SSA_TREE_OPERAND (def, stmt, i, SSA_OP_DEF)
2033 if (TREE_CODE (def) == SSA_NAME)
2034 SSA_NAME_DEF_STMT (def) = stmt;
2037 gsi_next (&copy_gsi);
2039 while (!gsi_end_p (copy_gsi));
2041 copy_gsi = gsi_last_bb (copy_basic_block);
2044 return copy_basic_block;
2047 /* Inserting Single Entry Multiple Exit region in SSA form into code in SSA
2048 form is quite easy, since dominator relationship for old basic blocks does
2049 not change.
2051 There is however exception where inlining might change dominator relation
2052 across EH edges from basic block within inlined functions destinating
2053 to landing pads in function we inline into.
2055 The function fills in PHI_RESULTs of such PHI nodes if they refer
2056 to gimple regs. Otherwise, the function mark PHI_RESULT of such
2057 PHI nodes for renaming. For non-gimple regs, renaming is safe: the
2058 EH edges are abnormal and SSA_NAME_OCCURS_IN_ABNORMAL_PHI must be
2059 set, and this means that there will be no overlapping live ranges
2060 for the underlying symbol.
2062 This might change in future if we allow redirecting of EH edges and
2063 we might want to change way build CFG pre-inlining to include
2064 all the possible edges then. */
2065 static void
2066 update_ssa_across_abnormal_edges (basic_block bb, basic_block ret_bb,
2067 bool can_throw, bool nonlocal_goto)
2069 edge e;
2070 edge_iterator ei;
2072 FOR_EACH_EDGE (e, ei, bb->succs)
2073 if (!e->dest->aux
2074 || ((basic_block)e->dest->aux)->index == ENTRY_BLOCK)
2076 gimple phi;
2077 gimple_stmt_iterator si;
2079 if (!nonlocal_goto)
2080 gcc_assert (e->flags & EDGE_EH);
2082 if (!can_throw)
2083 gcc_assert (!(e->flags & EDGE_EH));
2085 for (si = gsi_start_phis (e->dest); !gsi_end_p (si); gsi_next (&si))
2087 edge re;
2089 phi = gsi_stmt (si);
2091 /* For abnormal goto/call edges the receiver can be the
2092 ENTRY_BLOCK. Do not assert this cannot happen. */
2094 gcc_assert ((e->flags & EDGE_EH)
2095 || SSA_NAME_OCCURS_IN_ABNORMAL_PHI (PHI_RESULT (phi)));
2097 re = find_edge (ret_bb, e->dest);
2098 gcc_checking_assert (re);
2099 gcc_assert ((re->flags & (EDGE_EH | EDGE_ABNORMAL))
2100 == (e->flags & (EDGE_EH | EDGE_ABNORMAL)));
2102 SET_USE (PHI_ARG_DEF_PTR_FROM_EDGE (phi, e),
2103 USE_FROM_PTR (PHI_ARG_DEF_PTR_FROM_EDGE (phi, re)));
2109 /* Copy edges from BB into its copy constructed earlier, scale profile
2110 accordingly. Edges will be taken care of later. Assume aux
2111 pointers to point to the copies of each BB. Return true if any
2112 debug stmts are left after a statement that must end the basic block. */
/* BB is the original block; its copy is BB->aux.  COUNT_SCALE is applied
   to the count of every copied edge.  RET_BB is forwarded to
   update_ssa_across_abnormal_edges.  ABNORMAL_GOTO_DEST is the block new
   EDGE_ABNORMAL edges are pointed at; when it is NULL no such edges are
   added.  */
2114 static bool
2115 copy_edges_for_bb (basic_block bb, gcov_type count_scale, basic_block ret_bb,
2116 basic_block abnormal_goto_dest)
2118 basic_block new_bb = (basic_block) bb->aux;
2119 edge_iterator ei;
2120 edge old_edge;
2121 gimple_stmt_iterator si;
2122 int flags;
2123 bool need_debug_cleanup = false;
2125 /* Use the indices from the original blocks to create edges for the
2126 new ones. */
/* EH edges are skipped in this loop; EH edges for the copy are created
   further down by make_eh_edges / make_eh_dispatch_edges.  */
2127 FOR_EACH_EDGE (old_edge, ei, bb->succs)
2128 if (!(old_edge->flags & EDGE_EH))
2130 edge new_edge;
2132 flags = old_edge->flags;
2134 /* Return edges do get a FALLTHRU flag when they get inlined. */
2135 if (old_edge->dest->index == EXIT_BLOCK
2136 && !(old_edge->flags & (EDGE_TRUE_VALUE|EDGE_FALSE_VALUE|EDGE_FAKE))
2137 && old_edge->dest->aux != EXIT_BLOCK_PTR_FOR_FN (cfun))
2138 flags |= EDGE_FALLTHRU;
/* The new edge targets the copy (aux) of the old destination; its count
   is scaled and its probability is taken over unchanged.  */
2139 new_edge = make_edge (new_bb, (basic_block) old_edge->dest->aux, flags);
2140 new_edge->count = apply_scale (old_edge->count, count_scale);
2141 new_edge->probability = old_edge->probability;
/* No statement processing is done for the entry and exit blocks.  */
2144 if (bb->index == ENTRY_BLOCK || bb->index == EXIT_BLOCK)
2145 return false;
/* Walk the statements of the copy.  The iterator is advanced inside the
   loop body, before any block split.  */
2147 for (si = gsi_start_bb (new_bb); !gsi_end_p (si);)
2149 gimple copy_stmt;
2150 bool can_throw, nonlocal_goto;
2152 copy_stmt = gsi_stmt (si);
2153 if (!is_gimple_debug (copy_stmt))
2154 update_stmt (copy_stmt);
2156 /* Do this before the possible split_block. */
2157 gsi_next (&si);
2159 /* If this tree could throw an exception, there are two
2160 cases where we need to add abnormal edge(s): the
2161 tree wasn't in a region and there is a "current
2162 region" in the caller; or the original tree had
2163 EH edges. In both cases split the block after the tree,
2164 and add abnormal edge(s) as needed; we need both
2165 those from the callee and the caller.
2166 We check whether the copy can throw, because the const
2167 propagation can change an INDIRECT_REF which throws
2168 into a COMPONENT_REF which doesn't. If the copy
2169 can throw, the original could also throw. */
2170 can_throw = stmt_can_throw_internal (copy_stmt);
2171 nonlocal_goto
2172 = (stmt_can_make_abnormal_goto (copy_stmt)
2173 && !computed_goto_p (copy_stmt));
2175 if (can_throw || nonlocal_goto)
/* Skip debug stmts that follow COPY_STMT.  If only debug stmts follow,
   the block is not split and the caller is told that debug cleanup is
   needed.  */
2177 if (!gsi_end_p (si))
2179 while (!gsi_end_p (si) && is_gimple_debug (gsi_stmt (si)))
2180 gsi_next (&si);
2181 if (gsi_end_p (si))
2182 need_debug_cleanup = true;
2184 if (!gsi_end_p (si))
2185 /* Note that bb's predecessor edges aren't necessarily
2186 right at this point; split_block doesn't care. */
2188 edge e = split_block (new_bb, copy_stmt);
/* Continue in the block created by the split; it takes over the aux
   pointer of the block it was split from.  */
2190 new_bb = e->dest;
2191 new_bb->aux = e->src->aux;
2192 si = gsi_start_bb (new_bb);
2196 if (gimple_code (copy_stmt) == GIMPLE_EH_DISPATCH)
2197 make_eh_dispatch_edges (copy_stmt);
2198 else if (can_throw)
2199 make_eh_edges (copy_stmt);
2201 /* If the call we inline cannot make abnormal goto do not add
2202 additional abnormal edges but only retain those already present
2203 in the original function body. */
2204 if (abnormal_goto_dest == NULL)
2205 nonlocal_goto = false;
2206 if (nonlocal_goto)
2208 basic_block copy_stmt_bb = gimple_bb (copy_stmt);
/* A block that already has an abnormal successor dispatcher gets no
   additional abnormal edge.  */
2210 if (get_abnormal_succ_dispatcher (copy_stmt_bb))
2211 nonlocal_goto = false;
2212 /* ABNORMAL_DISPATCHER (1) is for longjmp/setjmp or nonlocal gotos
2213 in OpenMP regions which aren't allowed to be left abnormally.
2214 So, no need to add abnormal edge in that case. */
2215 else if (is_gimple_call (copy_stmt)
2216 && gimple_call_internal_p (copy_stmt)
2217 && (gimple_call_internal_fn (copy_stmt)
2218 == IFN_ABNORMAL_DISPATCHER)
2219 && gimple_call_arg (copy_stmt, 0) == boolean_true_node)
2220 nonlocal_goto = false;
2221 else
2222 make_edge (copy_stmt_bb, abnormal_goto_dest, EDGE_ABNORMAL);
/* In SSA form, fix up the PHI arguments on the EH/abnormal edges leaving
   the block of COPY_STMT.  */
2225 if ((can_throw || nonlocal_goto)
2226 && gimple_in_ssa_p (cfun))
2227 update_ssa_across_abnormal_edges (gimple_bb (copy_stmt), ret_bb,
2228 can_throw, nonlocal_goto);
2230 return need_debug_cleanup;
2233 /* Copy the PHIs. All blocks and edges are copied, some blocks
2234 were possibly split and new outgoing EH edges inserted.
2235 BB points to the block of original function and AUX pointers links
2236 the original and newly copied blocks. */
/* ID is the copy context used to remap PHI results, PHI arguments and
   the lexical blocks attached to argument locations.  The new PHI nodes
   are created in BB->aux.  */
2238 static void
2239 copy_phis_for_bb (basic_block bb, copy_body_data *id)
2241 basic_block const new_bb = (basic_block) bb->aux;
2242 edge_iterator ei;
2243 gimple phi;
2244 gimple_stmt_iterator si;
2245 edge new_edge;
2246 bool inserted = false;
2248 for (si = gsi_start_phis (bb); !gsi_end_p (si); gsi_next (&si))
2250 tree res, new_res;
2251 gimple new_phi;
2253 phi = gsi_stmt (si);
2254 res = PHI_RESULT (phi);
2255 new_res = res;
/* PHIs whose result is a virtual operand are not copied.  */
2256 if (!virtual_operand_p (res))
2258 walk_tree (&new_res, copy_tree_body_r, id, NULL);
2259 new_phi = create_phi_node (new_res, new_bb);
/* Add one argument per predecessor edge of the copied block.  */
2260 FOR_EACH_EDGE (new_edge, ei, new_bb->preds)
/* Map the new predecessor edge back to the matching edge of the
   original block through the aux pointer of its source.  */
2262 edge old_edge = find_edge ((basic_block) new_edge->src->aux, bb);
2263 tree arg;
2264 tree new_arg;
2265 edge_iterator ei2;
2266 location_t locus;
2268 /* When doing partial cloning, we allow PHIs on the entry block
2269 as long as all the arguments are the same. Find any input
2270 edge to see argument to copy. */
/* NOTE(review): OLD_EDGE is used below without a check; presumably a
   predecessor whose source has no aux block always exists here --
   confirm.  */
2271 if (!old_edge)
2272 FOR_EACH_EDGE (old_edge, ei2, bb->preds)
2273 if (!old_edge->src->aux)
2274 break;
2276 arg = PHI_ARG_DEF_FROM_EDGE (phi, old_edge);
2277 new_arg = arg;
2278 walk_tree (&new_arg, copy_tree_body_r, id, NULL);
2279 gcc_assert (new_arg);
2280 /* With return slot optimization we can end up with
2281 non-gimple (foo *)&this->m, fix that here. */
2282 if (TREE_CODE (new_arg) != SSA_NAME
2283 && TREE_CODE (new_arg) != FUNCTION_DECL
2284 && !is_gimple_val (new_arg))
2286 gimple_seq stmts = NULL;
2287 new_arg = force_gimple_operand (new_arg, &stmts, true, NULL);
/* The statements are only queued on the edge here; they are committed
   after all PHIs have been processed.  */
2288 gsi_insert_seq_on_edge (new_edge, stmts);
2289 inserted = true;
/* Remap the lexical block of the argument location through the decl
   map.  The block is dropped when it maps to NULL or when the location
   carries none.  */
2291 locus = gimple_phi_arg_location_from_edge (phi, old_edge);
2292 if (LOCATION_BLOCK (locus))
2294 tree *n;
2295 n = id->decl_map->get (LOCATION_BLOCK (locus));
2296 gcc_assert (n);
2297 if (*n)
2298 locus = COMBINE_LOCATION_DATA (line_table, locus, *n);
2299 else
2300 locus = LOCATION_LOCUS (locus);
2302 else
2303 locus = LOCATION_LOCUS (locus);
2305 add_phi_arg (new_phi, new_arg, new_edge, locus);
2310 /* Commit the delayed edge insertions. */
2311 if (inserted)
2312 FOR_EACH_EDGE (new_edge, ei, new_bb->preds)
2313 gsi_commit_one_edge_insert (new_edge, NULL);
2317 /* Wrapper for remap_decl so it can be used as a callback. */
2319 static tree
2320 remap_decl_1 (tree decl, void *data)
2322 return remap_decl (decl, (copy_body_data *) data);
2325 /* Build struct function and associated datastructures for the new clone
2326 NEW_FNDECL to be build. CALLEE_FNDECL is the original. Function changes
2327 the cfun to the function of new_fndecl (and current_function_decl too). */
2329 static void
2330 initialize_cfun (tree new_fndecl, tree callee_fndecl, gcov_type count)
2332 struct function *src_cfun = DECL_STRUCT_FUNCTION (callee_fndecl);
2333 gcov_type count_scale;
2335 if (!DECL_ARGUMENTS (new_fndecl))
2336 DECL_ARGUMENTS (new_fndecl) = DECL_ARGUMENTS (callee_fndecl);
2337 if (!DECL_RESULT (new_fndecl))
2338 DECL_RESULT (new_fndecl) = DECL_RESULT (callee_fndecl);
2340 if (ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->count)
2341 count_scale
2342 = GCOV_COMPUTE_SCALE (count,
2343 ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->count);
2344 else
2345 count_scale = REG_BR_PROB_BASE;
2347 /* Register specific tree functions. */
2348 gimple_register_cfg_hooks ();
2350 /* Get clean struct function. */
2351 push_struct_function (new_fndecl);
2353 /* We will rebuild these, so just sanity check that they are empty. */
2354 gcc_assert (VALUE_HISTOGRAMS (cfun) == NULL);
2355 gcc_assert (cfun->local_decls == NULL);
2356 gcc_assert (cfun->cfg == NULL);
2357 gcc_assert (cfun->decl == new_fndecl);
2359 /* Copy items we preserve during cloning. */
2360 cfun->static_chain_decl = src_cfun->static_chain_decl;
2361 cfun->nonlocal_goto_save_area = src_cfun->nonlocal_goto_save_area;
2362 cfun->function_end_locus = src_cfun->function_end_locus;
2363 cfun->curr_properties = src_cfun->curr_properties;
2364 cfun->last_verified = src_cfun->last_verified;
2365 cfun->va_list_gpr_size = src_cfun->va_list_gpr_size;
2366 cfun->va_list_fpr_size = src_cfun->va_list_fpr_size;
2367 cfun->has_nonlocal_label = src_cfun->has_nonlocal_label;
2368 cfun->stdarg = src_cfun->stdarg;
2369 cfun->after_inlining = src_cfun->after_inlining;
2370 cfun->can_throw_non_call_exceptions
2371 = src_cfun->can_throw_non_call_exceptions;
2372 cfun->can_delete_dead_exceptions = src_cfun->can_delete_dead_exceptions;
2373 cfun->returns_struct = src_cfun->returns_struct;
2374 cfun->returns_pcc_struct = src_cfun->returns_pcc_struct;
2376 init_empty_tree_cfg ();
2378 profile_status_for_fn (cfun) = profile_status_for_fn (src_cfun);
2379 ENTRY_BLOCK_PTR_FOR_FN (cfun)->count =
2380 (ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->count * count_scale /
2381 REG_BR_PROB_BASE);
2382 ENTRY_BLOCK_PTR_FOR_FN (cfun)->frequency
2383 = ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->frequency;
2384 EXIT_BLOCK_PTR_FOR_FN (cfun)->count =
2385 (EXIT_BLOCK_PTR_FOR_FN (src_cfun)->count * count_scale /
2386 REG_BR_PROB_BASE);
2387 EXIT_BLOCK_PTR_FOR_FN (cfun)->frequency =
2388 EXIT_BLOCK_PTR_FOR_FN (src_cfun)->frequency;
2389 if (src_cfun->eh)
2390 init_eh_for_function ();
2392 if (src_cfun->gimple_df)
2394 init_tree_ssa (cfun);
2395 cfun->gimple_df->in_ssa_p = true;
2396 init_ssa_operands (cfun);
2400 /* Helper function for copy_cfg_body. Move debug stmts from the end
2401 of NEW_BB to the beginning of successor basic blocks when needed. If the
2402 successor has multiple predecessors, reset them, otherwise keep
2403 their value. */
/* ID is the copy context; copies of debug stmts made here are pushed
   onto ID->debug_stmts.  */
2405 static void
2406 maybe_move_debug_stmts_to_successors (copy_body_data *id, basic_block new_bb)
2408 edge e;
2409 edge_iterator ei;
2410 gimple_stmt_iterator si = gsi_last_nondebug_bb (new_bb);
/* Nothing to do when the block has no non-debug stmt, when its last
   non-debug stmt is also its last stmt, or when that stmt can neither
   throw internally nor make an abnormal goto.  */
2412 if (gsi_end_p (si)
2413 || gsi_one_before_end_p (si)
2414 || !(stmt_can_throw_internal (gsi_stmt (si))
2415 || stmt_can_make_abnormal_goto (gsi_stmt (si))))
2416 return;
2418 FOR_EACH_EDGE (e, ei, new_bb->succs)
/* SSI walks the trailing debug stmts of NEW_BB backwards; DSI is the
   insertion point after the labels of the successor.  */
2420 gimple_stmt_iterator ssi = gsi_last_bb (new_bb);
2421 gimple_stmt_iterator dsi = gsi_after_labels (e->dest);
2422 while (is_gimple_debug (gsi_stmt (ssi)))
2424 gimple stmt = gsi_stmt (ssi), new_stmt;
2425 tree var;
2426 tree value;
2428 /* For the last edge move the debug stmts instead of copying
2429 them. */
2430 if (ei_one_before_end_p (ei))
/* Step SSI back first: the stmt is removed through SI, which still
   points at it.  */
2432 si = ssi;
2433 gsi_prev (&ssi);
2434 if (!single_pred_p (e->dest) && gimple_debug_bind_p (stmt))
2435 gimple_debug_bind_reset_value (stmt);
2436 gsi_remove (&si, false);
2437 gsi_insert_before (&dsi, stmt, GSI_SAME_STMT);
2438 continue;
/* For every other edge build a copy.  A debug bind keeps its value only
   when the destination has a single predecessor.  */
2441 if (gimple_debug_bind_p (stmt))
2443 var = gimple_debug_bind_get_var (stmt);
2444 if (single_pred_p (e->dest))
2446 value = gimple_debug_bind_get_value (stmt);
2447 value = unshare_expr (value);
2449 else
2450 value = NULL_TREE;
2451 new_stmt = gimple_build_debug_bind (var, value, stmt);
2453 else if (gimple_debug_source_bind_p (stmt))
2455 var = gimple_debug_source_bind_get_var (stmt);
2456 value = gimple_debug_source_bind_get_value (stmt);
2457 new_stmt = gimple_build_debug_source_bind (var, value, stmt);
2459 else
2460 gcc_unreachable ();
2461 gsi_insert_before (&dsi, new_stmt, GSI_SAME_STMT);
2462 id->debug_stmts.safe_push (new_stmt);
2463 gsi_prev (&ssi);
2468 /* Make a copy of the sub-loops of SRC_PARENT and place them
2469 as siblings of DEST_PARENT. */
2471 static void
2472 copy_loops (copy_body_data *id,
2473 struct loop *dest_parent, struct loop *src_parent)
2475 struct loop *src_loop = src_parent->inner;
2476 while (src_loop)
2478 if (!id->blocks_to_copy
2479 || bitmap_bit_p (id->blocks_to_copy, src_loop->header->index))
2481 struct loop *dest_loop = alloc_loop ();
2483 /* Assign the new loop its header and latch and associate
2484 those with the new loop. */
2485 dest_loop->header = (basic_block)src_loop->header->aux;
2486 dest_loop->header->loop_father = dest_loop;
2487 if (src_loop->latch != NULL)
2489 dest_loop->latch = (basic_block)src_loop->latch->aux;
2490 dest_loop->latch->loop_father = dest_loop;
2493 /* Copy loop meta-data. */
2494 copy_loop_info (src_loop, dest_loop);
2496 /* Finally place it into the loop array and the loop tree. */
2497 place_new_loop (cfun, dest_loop);
2498 flow_loop_tree_node_add (dest_parent, dest_loop);
2500 dest_loop->safelen = src_loop->safelen;
2501 dest_loop->dont_vectorize = src_loop->dont_vectorize;
2502 if (src_loop->force_vectorize)
2504 dest_loop->force_vectorize = true;
2505 cfun->has_force_vectorize_loops = true;
2507 if (src_loop->simduid)
2509 dest_loop->simduid = remap_decl (src_loop->simduid, id);
2510 cfun->has_simduid_loops = true;
2513 /* Recurse. */
2514 copy_loops (id, dest_loop, src_loop);
2516 src_loop = src_loop->next;
2520 /* Call cgraph_redirect_edge_call_stmt_to_callee on all calls in BB */
2522 void
2523 redirect_all_calls (copy_body_data * id, basic_block bb)
2525 gimple_stmt_iterator si;
2526 for (si = gsi_start_bb (bb); !gsi_end_p (si); gsi_next (&si))
2528 if (is_gimple_call (gsi_stmt (si)))
2530 struct cgraph_edge *edge = id->dst_node->get_edge (gsi_stmt (si));
2531 if (edge)
2532 edge->redirect_call_stmt_to_callee ();
2537 /* Convert estimated frequencies into counts for NODE, scaling COUNT
2538 with each bb's frequency. Used when NODE has a 0-weight entry
2539 but we are about to inline it into a non-zero count call bb.
2540 See the comments for handle_missing_profiles() in predict.c for
2541 when this can happen for COMDATs. */
2543 void
2544 freqs_to_counts (struct cgraph_node *node, gcov_type count)
2546 basic_block bb;
2547 edge_iterator ei;
2548 edge e;
2549 struct function *fn = DECL_STRUCT_FUNCTION (node->decl);
2551 FOR_ALL_BB_FN(bb, fn)
2553 bb->count = apply_scale (count,
2554 GCOV_COMPUTE_SCALE (bb->frequency, BB_FREQ_MAX));
2555 FOR_EACH_EDGE (e, ei, bb->succs)
2556 e->count = apply_probability (e->src->count, e->probability);
2560 /* Make a copy of the body of FN so that it can be inserted inline in
2561 another function. Walks FN via CFG, returns new fndecl. */
/* ID is the copy context (source function, call statement, blocks to
   copy, maps).  COUNT is the profile count the copy is scaled to and
   FREQUENCY_SCALE the scale handed to copy_bb.  ENTRY_BLOCK_MAP and
   EXIT_BLOCK_MAP are the blocks the source ENTRY and EXIT blocks are
   mapped to.  NEW_ENTRY, when non-NULL, is the source block whose copy
   gets a fallthru edge from ENTRY_BLOCK_MAP.
   NOTE(review): NEW_FNDECL is initialized to NULL and never assigned in
   this function, so the value returned is always NULL.  */
2563 static tree
2564 copy_cfg_body (copy_body_data * id, gcov_type count, int frequency_scale,
2565 basic_block entry_block_map, basic_block exit_block_map,
2566 basic_block new_entry)
2568 tree callee_fndecl = id->src_fn;
2569 /* Original cfun for the callee, doesn't change. */
2570 struct function *src_cfun = DECL_STRUCT_FUNCTION (callee_fndecl);
2571 struct function *cfun_to_copy;
2572 basic_block bb;
2573 tree new_fndecl = NULL;
2574 bool need_debug_cleanup = false;
2575 gcov_type count_scale;
2576 int last;
2577 int incoming_frequency = 0;
2578 gcov_type incoming_count = 0;
2580 /* This can happen for COMDAT routines that end up with 0 counts
2581 despite being called (see the comments for handle_missing_profiles()
2582 in predict.c as to why). Apply counts to the blocks in the callee
2583 before inlining, using the guessed edge frequencies, so that we don't
2584 end up with a 0-count inline body which can confuse downstream
2585 optimizations such as function splitting. */
2586 if (!ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->count && count)
2588 /* Apply the larger of the call bb count and the total incoming
2589 call edge count to the callee. */
2590 gcov_type in_count = 0;
2591 struct cgraph_edge *in_edge;
2592 for (in_edge = id->src_node->callers; in_edge;
2593 in_edge = in_edge->next_caller)
2594 in_count += in_edge->count;
2595 freqs_to_counts (id->src_node, count > in_count ? count : in_count);
/* Scale factor from source counts to counts in the copy; the neutral
   scale is used when the source entry count is zero.  */
2598 if (ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->count)
2599 count_scale
2600 = GCOV_COMPUTE_SCALE (count,
2601 ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->count);
2602 else
2603 count_scale = REG_BR_PROB_BASE;
2605 /* Register specific tree functions. */
2606 gimple_register_cfg_hooks ();
2608 /* If we are inlining just region of the function, make sure to connect
2609 new entry to ENTRY_BLOCK_PTR_FOR_FN (cfun). Since new entry can be
2610 part of loop, we must compute frequency and probability of
2611 ENTRY_BLOCK_PTR_FOR_FN (cfun) based on the frequencies and
2612 probabilities of edges incoming from nonduplicated region. */
2613 if (new_entry)
2615 edge e;
2616 edge_iterator ei;
/* Only edges whose source has no aux block contribute to the incoming
   frequency and count.  */
2618 FOR_EACH_EDGE (e, ei, new_entry->preds)
2619 if (!e->src->aux)
2621 incoming_frequency += EDGE_FREQUENCY (e);
2622 incoming_count += e->count;
2624 incoming_count = apply_scale (incoming_count, count_scale);
2625 incoming_frequency
2626 = apply_scale ((gcov_type)incoming_frequency, frequency_scale);
2627 ENTRY_BLOCK_PTR_FOR_FN (cfun)->count = incoming_count;
2628 ENTRY_BLOCK_PTR_FOR_FN (cfun)->frequency = incoming_frequency;
2631 /* Must have a CFG here at this point. */
2632 gcc_assert (ENTRY_BLOCK_PTR_FOR_FN
2633 (DECL_STRUCT_FUNCTION (callee_fndecl)));
2635 cfun_to_copy = id->src_cfun = DECL_STRUCT_FUNCTION (callee_fndecl);
/* Link the source ENTRY/EXIT blocks and their mapped blocks to each
   other through the aux pointers.  */
2637 ENTRY_BLOCK_PTR_FOR_FN (cfun_to_copy)->aux = entry_block_map;
2638 EXIT_BLOCK_PTR_FOR_FN (cfun_to_copy)->aux = exit_block_map;
2639 entry_block_map->aux = ENTRY_BLOCK_PTR_FOR_FN (cfun_to_copy);
2640 exit_block_map->aux = EXIT_BLOCK_PTR_FOR_FN (cfun_to_copy);
2642 /* Duplicate any exception-handling regions. */
2643 if (cfun->eh)
2644 id->eh_map = duplicate_eh_regions (cfun_to_copy, NULL, id->eh_lp_nr,
2645 remap_decl_1, id);
2647 /* Use aux pointers to map the original blocks to copy. */
2648 FOR_EACH_BB_FN (bb, cfun_to_copy)
2649 if (!id->blocks_to_copy || bitmap_bit_p (id->blocks_to_copy, bb->index))
2651 basic_block new_bb = copy_bb (id, bb, frequency_scale, count_scale);
2652 bb->aux = new_bb;
2653 new_bb->aux = bb;
2654 new_bb->loop_father = entry_block_map->loop_father;
/* Remember the block count before edges are copied; blocks with a
   higher index are handled by the loop near the end of this
   function.  */
2657 last = last_basic_block_for_fn (cfun);
2659 /* Now that we've duplicated the blocks, duplicate their edges. */
2660 basic_block abnormal_goto_dest = NULL;
/* An abnormal-goto destination is only looked up when the inlined call
   can make an abnormal goto and is the last statement of its block.  */
2661 if (id->gimple_call
2662 && stmt_can_make_abnormal_goto (id->gimple_call))
2664 gimple_stmt_iterator gsi = gsi_for_stmt (id->gimple_call);
2666 bb = gimple_bb (id->gimple_call);
2667 gsi_next (&gsi);
2668 if (gsi_end_p (gsi))
2669 abnormal_goto_dest = get_abnormal_succ_dispatcher (bb);
2671 FOR_ALL_BB_FN (bb, cfun_to_copy)
2672 if (!id->blocks_to_copy
2673 || (bb->index > 0 && bitmap_bit_p (id->blocks_to_copy, bb->index)))
2674 need_debug_cleanup |= copy_edges_for_bb (bb, count_scale, exit_block_map,
2675 abnormal_goto_dest);
/* When only a region is copied, connect the mapped entry block to the
   copy of NEW_ENTRY.  */
2677 if (new_entry)
2679 edge e = make_edge (entry_block_map, (basic_block)new_entry->aux, EDGE_FALLTHRU);
2680 e->probability = REG_BR_PROB_BASE;
2681 e->count = incoming_count;
2684 /* Duplicate the loop tree, if available and wanted. */
2685 if (loops_for_fn (src_cfun) != NULL
2686 && current_loops != NULL)
2688 copy_loops (id, entry_block_map->loop_father,
2689 get_loop (src_cfun, 0));
2690 /* Defer to cfgcleanup to update loop-father fields of basic-blocks. */
2691 loops_state_set (LOOPS_NEED_FIXUP);
2694 /* If the loop tree in the source function needed fixup, mark the
2695 destination loop tree for fixup, too. */
/* NOTE(review): unlike the test just above, loops_for_fn (src_cfun) is
   dereferenced here without a NULL check -- confirm it cannot be NULL
   at this point.  */
2696 if (loops_for_fn (src_cfun)->state & LOOPS_NEED_FIXUP)
2697 loops_state_set (LOOPS_NEED_FIXUP);
/* PHI nodes are copied only in SSA form, and only after all blocks and
   edges exist.  */
2699 if (gimple_in_ssa_p (cfun))
2700 FOR_ALL_BB_FN (bb, cfun_to_copy)
2701 if (!id->blocks_to_copy
2702 || (bb->index > 0 && bitmap_bit_p (id->blocks_to_copy, bb->index)))
2703 copy_phis_for_bb (bb, id);
/* Final pass over the source blocks that were mapped: do the debug stmt
   cleanup, redirect call edges, and clear both aux pointers.  */
2705 FOR_ALL_BB_FN (bb, cfun_to_copy)
2706 if (bb->aux)
2708 if (need_debug_cleanup
2709 && bb->index != ENTRY_BLOCK
2710 && bb->index != EXIT_BLOCK)
2711 maybe_move_debug_stmts_to_successors (id, (basic_block) bb->aux);
2712 /* Update call edge destinations. This can not be done before loop
2713 info is updated, because we may split basic blocks. */
2714 if (id->transform_call_graph_edges == CB_CGE_DUPLICATE)
2715 redirect_all_calls (id, (basic_block)bb->aux);
2716 ((basic_block)bb->aux)->aux = NULL;
2717 bb->aux = NULL;
2720 /* Zero out AUX fields of newly created block during EH edge
2721 insertion. */
2722 for (; last < last_basic_block_for_fn (cfun); last++)
2724 if (need_debug_cleanup)
2725 maybe_move_debug_stmts_to_successors (id,
2726 BASIC_BLOCK_FOR_FN (cfun, last));
2727 BASIC_BLOCK_FOR_FN (cfun, last)->aux = NULL;
2728 /* Update call edge destinations. This can not be done before loop
2729 info is updated, because we may split basic blocks. */
2730 if (id->transform_call_graph_edges == CB_CGE_DUPLICATE)
2731 redirect_all_calls (id, BASIC_BLOCK_FOR_FN (cfun, last));
2733 entry_block_map->aux = NULL;
2734 exit_block_map->aux = NULL;
/* The EH map is only needed while copying; release it.  */
2736 if (id->eh_map)
2738 delete id->eh_map;
2739 id->eh_map = NULL;
2742 return new_fndecl;
2745 /* Copy the debug STMT using ID. We deal with these statements in a
2746 special way: if any variable in their VALUE expression wasn't
2747 remapped yet, we won't remap it, because that would get decl uids
2748 out of sync, causing codegen differences between -g and -g0. If
2749 this arises, we drop the VALUE expression altogether. */
/* STMT is modified in place: its block, bound variable and value are
   remapped through ID, and update_stmt is called on it at the end.  */
2751 static void
2752 copy_debug_stmt (gimple stmt, copy_body_data *id)
2754 tree t, *n;
2755 struct walk_stmt_info wi;
/* Remap the lexical block, falling back to ID->block when the decl map
   has no entry for it.  */
2757 if (gimple_block (stmt))
2759 n = id->decl_map->get (gimple_block (stmt));
2760 gimple_set_block (stmt, n ? *n : id->block);
2763 /* Remap all the operands in COPY. */
2764 memset (&wi, 0, sizeof (wi));
2765 wi.info = id;
/* PROCESSING_DEBUG_STMT is set for the duration of the remapping; a
   negative value afterwards means some decl could not be remapped (see
   the check below).  */
2767 processing_debug_stmt = 1;
2769 if (gimple_debug_source_bind_p (stmt))
2770 t = gimple_debug_source_bind_get_var (stmt);
2771 else
2772 t = gimple_debug_bind_get_var (stmt);
/* A PARM_DECL found in the debug map is replaced by the VAR_DECL
   recorded there.  */
2774 if (TREE_CODE (t) == PARM_DECL && id->debug_map
2775 && (n = id->debug_map->get (t)))
2777 gcc_assert (TREE_CODE (*n) == VAR_DECL);
2778 t = *n;
2780 else if (TREE_CODE (t) == VAR_DECL
2781 && !is_global_var (t)
2782 && !id->decl_map->get (t))
2783 /* T is a non-localized variable. */;
2784 else
2785 walk_tree (&t, remap_gimple_op_r, &wi, NULL);
2787 if (gimple_debug_bind_p (stmt))
2789 gimple_debug_bind_set_var (stmt, t);
2791 if (gimple_debug_bind_has_value_p (stmt))
2792 walk_tree (gimple_debug_bind_get_value_ptr (stmt),
2793 remap_gimple_op_r, &wi, NULL);
2795 /* Punt if any decl couldn't be remapped. */
2796 if (processing_debug_stmt < 0)
2797 gimple_debug_bind_reset_value (stmt);
2799 else if (gimple_debug_source_bind_p (stmt))
2801 gimple_debug_source_bind_set_var (stmt, t);
2802 walk_tree (gimple_debug_source_bind_get_value_ptr (stmt),
2803 remap_gimple_op_r, &wi, NULL);
2804 /* When inlining and source bind refers to one of the optimized
2805 away parameters, change the source bind into normal debug bind
2806 referring to the corresponding DEBUG_EXPR_DECL that should have
2807 been bound before the call stmt. */
2808 t = gimple_debug_source_bind_get_value (stmt);
2809 if (t != NULL_TREE
2810 && TREE_CODE (t) == PARM_DECL
2811 && id->gimple_call)
2813 vec<tree, va_gc> **debug_args = decl_debug_args_lookup (id->src_fn);
2814 unsigned int i;
2815 if (debug_args != NULL)
/* The vector is scanned in pairs: element I is compared against the
   origin of the parameter and element I + 1 is the candidate
   DEBUG_EXPR_DECL.  */
2817 for (i = 0; i < vec_safe_length (*debug_args); i += 2)
2818 if ((**debug_args)[i] == DECL_ORIGIN (t)
2819 && TREE_CODE ((**debug_args)[i + 1]) == DEBUG_EXPR_DECL)
2821 t = (**debug_args)[i + 1];
2822 stmt->subcode = GIMPLE_DEBUG_BIND;
2823 gimple_debug_bind_set_value (stmt, t);
2824 break;
2830 processing_debug_stmt = 0;
2832 update_stmt (stmt);
2835 /* Process deferred debug stmts. In order to give values better odds
2836 of being successfully remapped, we delay the processing of debug
2837 stmts until all other stmts that might require remapping are
2838 processed. */
2840 static void
2841 copy_debug_stmts (copy_body_data *id)
2843 size_t i;
2844 gimple stmt;
2846 if (!id->debug_stmts.exists ())
2847 return;
2849 FOR_EACH_VEC_ELT (id->debug_stmts, i, stmt)
2850 copy_debug_stmt (stmt, id);
2852 id->debug_stmts.release ();
2855 /* Make a copy of the body of SRC_FN so that it can be inserted inline in
2856 another function. */
2858 static tree
2859 copy_tree_body (copy_body_data *id)
2861 tree fndecl = id->src_fn;
2862 tree body = DECL_SAVED_TREE (fndecl);
2864 walk_tree (&body, copy_tree_body_r, id, NULL);
2866 return body;
2869 /* Make a copy of the body of FN so that it can be inserted inline in
2870 another function. */
2872 static tree
2873 copy_body (copy_body_data *id, gcov_type count, int frequency_scale,
2874 basic_block entry_block_map, basic_block exit_block_map,
2875 basic_block new_entry)
2877 tree fndecl = id->src_fn;
2878 tree body;
2880 /* If this body has a CFG, walk CFG and copy. */
2881 gcc_assert (ENTRY_BLOCK_PTR_FOR_FN (DECL_STRUCT_FUNCTION (fndecl)));
2882 body = copy_cfg_body (id, count, frequency_scale, entry_block_map, exit_block_map,
2883 new_entry);
2884 copy_debug_stmts (id);
2886 return body;
2889 /* Return true if VALUE is an ADDR_EXPR of an automatic variable
2890 defined in function FN, or of a data member thereof. */
2892 static bool
2893 self_inlining_addr_expr (tree value, tree fn)
2895 tree var;
2897 if (TREE_CODE (value) != ADDR_EXPR)
2898 return false;
2900 var = get_base_address (TREE_OPERAND (value, 0));
2902 return var && auto_var_in_fn_p (var, fn);
2905 /* Append to BB a debug annotation that binds VAR to VALUE, inheriting
2906 lexical block and line number information from base_stmt, if given,
2907 or from the last stmt of the block otherwise. */
2909 static gimple
2910 insert_init_debug_bind (copy_body_data *id,
2911 basic_block bb, tree var, tree value,
2912 gimple base_stmt)
2914 gimple note;
2915 gimple_stmt_iterator gsi;
2916 tree tracked_var;
2918 if (!gimple_in_ssa_p (id->src_cfun))
2919 return NULL;
2921 if (!MAY_HAVE_DEBUG_STMTS)
2922 return NULL;
2924 tracked_var = target_for_debug_bind (var);
2925 if (!tracked_var)
2926 return NULL;
2928 if (bb)
2930 gsi = gsi_last_bb (bb);
2931 if (!base_stmt && !gsi_end_p (gsi))
2932 base_stmt = gsi_stmt (gsi);
2935 note = gimple_build_debug_bind (tracked_var, value, base_stmt);
2937 if (bb)
2939 if (!gsi_end_p (gsi))
2940 gsi_insert_after (&gsi, note, GSI_SAME_STMT);
2941 else
2942 gsi_insert_before (&gsi, note, GSI_SAME_STMT);
2945 return note;
2948 static void
2949 insert_init_stmt (copy_body_data *id, basic_block bb, gimple init_stmt)
2951 /* If VAR represents a zero-sized variable, it's possible that the
2952 assignment statement may result in no gimple statements. */
2953 if (init_stmt)
2955 gimple_stmt_iterator si = gsi_last_bb (bb);
2957 /* We can end up with init statements that store to a non-register
2958 from a rhs with a conversion. Handle that here by forcing the
2959 rhs into a temporary. gimple_regimplify_operands is not
2960 prepared to do this for us. */
2961 if (!is_gimple_debug (init_stmt)
2962 && !is_gimple_reg (gimple_assign_lhs (init_stmt))
2963 && is_gimple_reg_type (TREE_TYPE (gimple_assign_lhs (init_stmt)))
2964 && gimple_assign_rhs_class (init_stmt) == GIMPLE_UNARY_RHS)
2966 tree rhs = build1 (gimple_assign_rhs_code (init_stmt),
2967 gimple_expr_type (init_stmt),
2968 gimple_assign_rhs1 (init_stmt));
2969 rhs = force_gimple_operand_gsi (&si, rhs, true, NULL_TREE, false,
2970 GSI_NEW_STMT);
2971 gimple_assign_set_rhs_code (init_stmt, TREE_CODE (rhs));
2972 gimple_assign_set_rhs1 (init_stmt, rhs);
2974 gsi_insert_after (&si, init_stmt, GSI_NEW_STMT);
2975 gimple_regimplify_operands (init_stmt, &si);
2977 if (!is_gimple_debug (init_stmt) && MAY_HAVE_DEBUG_STMTS)
2979 tree def = gimple_assign_lhs (init_stmt);
2980 insert_init_debug_bind (id, bb, def, def, init_stmt);
2985 /* Initialize parameter P with VALUE. If needed, produce init statement
2986 at the end of BB. When BB is NULL, we return init statement to be
2987 output later. */
2988 static gimple
2989 setup_one_parameter (copy_body_data *id, tree p, tree value, tree fn,
2990 basic_block bb, tree *vars)
2992 gimple init_stmt = NULL;
2993 tree var;
2994 tree rhs = value;
2995 tree def = (gimple_in_ssa_p (cfun)
2996 ? ssa_default_def (id->src_cfun, p) : NULL);
2998 if (value
2999 && value != error_mark_node
3000 && !useless_type_conversion_p (TREE_TYPE (p), TREE_TYPE (value)))
3002 /* If we can match up types by promotion/demotion do so. */
3003 if (fold_convertible_p (TREE_TYPE (p), value))
3004 rhs = fold_convert (TREE_TYPE (p), value);
3005 else
3007 /* ??? For valid programs we should not end up here.
3008 Still if we end up with truly mismatched types here, fall back
3009 to using a VIEW_CONVERT_EXPR or a literal zero to not leak invalid
3010 GIMPLE to the following passes. */
3011 if (!is_gimple_reg_type (TREE_TYPE (value))
3012 || TYPE_SIZE (TREE_TYPE (p)) == TYPE_SIZE (TREE_TYPE (value)))
3013 rhs = fold_build1 (VIEW_CONVERT_EXPR, TREE_TYPE (p), value);
3014 else
3015 rhs = build_zero_cst (TREE_TYPE (p));
3019 /* Make an equivalent VAR_DECL. Note that we must NOT remap the type
3020 here since the type of this decl must be visible to the calling
3021 function. */
3022 var = copy_decl_to_var (p, id);
3024 /* Declare this new variable. */
3025 DECL_CHAIN (var) = *vars;
3026 *vars = var;
3028 /* Make gimplifier happy about this variable. */
3029 DECL_SEEN_IN_BIND_EXPR_P (var) = 1;
3031 /* If the parameter is never assigned to, has no SSA_NAMEs created,
3032 we would not need to create a new variable here at all, if it
3033 weren't for debug info. Still, we can just use the argument
3034 value. */
3035 if (TREE_READONLY (p)
3036 && !TREE_ADDRESSABLE (p)
3037 && value && !TREE_SIDE_EFFECTS (value)
3038 && !def)
3040 /* We may produce non-gimple trees by adding NOPs or introduce
3041 invalid sharing when operand is not really constant.
3042 It is not big deal to prohibit constant propagation here as
3043 we will constant propagate in DOM1 pass anyway. */
3044 if (is_gimple_min_invariant (value)
3045 && useless_type_conversion_p (TREE_TYPE (p),
3046 TREE_TYPE (value))
3047 /* We have to be very careful about ADDR_EXPR. Make sure
3048 the base variable isn't a local variable of the inlined
3049 function, e.g., when doing recursive inlining, direct or
3050 mutually-recursive or whatever, which is why we don't
3051 just test whether fn == current_function_decl. */
3052 && ! self_inlining_addr_expr (value, fn))
3054 insert_decl_map (id, p, value);
3055 insert_debug_decl_map (id, p, var);
3056 return insert_init_debug_bind (id, bb, var, value, NULL);
3060 /* Register the VAR_DECL as the equivalent for the PARM_DECL;
3061 that way, when the PARM_DECL is encountered, it will be
3062 automatically replaced by the VAR_DECL. */
3063 insert_decl_map (id, p, var);
3065 /* Even if P was TREE_READONLY, the new VAR should not be.
3066 In the original code, we would have constructed a
3067 temporary, and then the function body would have never
3068 changed the value of P. However, now, we will be
3069 constructing VAR directly. The constructor body may
3070 change its value multiple times as it is being
3071 constructed. Therefore, it must not be TREE_READONLY;
3072 the back-end assumes that TREE_READONLY variable is
3073 assigned to only once. */
3074 if (TYPE_NEEDS_CONSTRUCTING (TREE_TYPE (p)))
3075 TREE_READONLY (var) = 0;
3077 /* If there is no setup required and we are in SSA, take the easy route
3078 replacing all SSA names representing the function parameter by the
3079 SSA name passed to function.
3081 We need to construct map for the variable anyway as it might be used
3082 in different SSA names when parameter is set in function.
3084 Do replacement at -O0 for const arguments replaced by constant.
3085 This is important for builtin_constant_p and other construct requiring
3086 constant argument to be visible in inlined function body. */
3087 if (gimple_in_ssa_p (cfun) && rhs && def && is_gimple_reg (p)
3088 && (optimize
3089 || (TREE_READONLY (p)
3090 && is_gimple_min_invariant (rhs)))
3091 && (TREE_CODE (rhs) == SSA_NAME
3092 || is_gimple_min_invariant (rhs))
3093 && !SSA_NAME_OCCURS_IN_ABNORMAL_PHI (def))
3095 insert_decl_map (id, def, rhs);
3096 return insert_init_debug_bind (id, bb, var, rhs, NULL);
3099 /* If the value of argument is never used, don't care about initializing
3100 it. */
3101 if (optimize && gimple_in_ssa_p (cfun) && !def && is_gimple_reg (p))
3103 gcc_assert (!value || !TREE_SIDE_EFFECTS (value));
3104 return insert_init_debug_bind (id, bb, var, rhs, NULL);
3107 /* Initialize this VAR_DECL from the equivalent argument. Convert
3108 the argument to the proper type in case it was promoted. */
3109 if (value)
3111 if (rhs == error_mark_node)
3113 insert_decl_map (id, p, var);
3114 return insert_init_debug_bind (id, bb, var, rhs, NULL);
3117 STRIP_USELESS_TYPE_CONVERSION (rhs);
3119 /* If we are in SSA form properly remap the default definition
3120 or assign to a dummy SSA name if the parameter is unused and
3121 we are not optimizing. */
3122 if (gimple_in_ssa_p (cfun) && is_gimple_reg (p))
3124 if (def)
3126 def = remap_ssa_name (def, id);
3127 init_stmt = gimple_build_assign (def, rhs);
3128 SSA_NAME_IS_DEFAULT_DEF (def) = 0;
3129 set_ssa_default_def (cfun, var, NULL);
3131 else if (!optimize)
3133 def = make_ssa_name (var, NULL);
3134 init_stmt = gimple_build_assign (def, rhs);
3137 else
3138 init_stmt = gimple_build_assign (var, rhs);
3140 if (bb && init_stmt)
3141 insert_init_stmt (id, bb, init_stmt);
3143 return init_stmt;
3146 /* Generate code to initialize the parameters of the function at the
3147 top of the stack in ID from the GIMPLE_CALL STMT. */
3149 static void
3150 initialize_inlined_parameters (copy_body_data *id, gimple stmt,
3151 tree fn, basic_block bb)
3153 tree parms;
3154 size_t i;
3155 tree p;
3156 tree vars = NULL_TREE;
3157 tree static_chain = gimple_call_chain (stmt);
3159 /* Figure out what the parameters are. */
3160 parms = DECL_ARGUMENTS (fn);
3162 /* Loop through the parameter declarations, replacing each with an
3163 equivalent VAR_DECL, appropriately initialized. */
3164 for (p = parms, i = 0; p; p = DECL_CHAIN (p), i++)
3166 tree val;
3167 val = i < gimple_call_num_args (stmt) ? gimple_call_arg (stmt, i) : NULL;
3168 setup_one_parameter (id, p, val, fn, bb, &vars);
3170 /* After remapping parameters remap their types. This has to be done
3171 in a second loop over all parameters to appropriately remap
3172 variable sized arrays when the size is specified in a
3173 parameter following the array. */
3174 for (p = parms, i = 0; p; p = DECL_CHAIN (p), i++)
3176 tree *varp = id->decl_map->get (p);
3177 if (varp
3178 && TREE_CODE (*varp) == VAR_DECL)
3180 tree def = (gimple_in_ssa_p (cfun) && is_gimple_reg (p)
3181 ? ssa_default_def (id->src_cfun, p) : NULL);
3182 tree var = *varp;
3183 TREE_TYPE (var) = remap_type (TREE_TYPE (var), id);
3184 /* Also remap the default definition if it was remapped
3185 to the default definition of the parameter replacement
3186 by the parameter setup. */
3187 if (def)
3189 tree *defp = id->decl_map->get (def);
3190 if (defp
3191 && TREE_CODE (*defp) == SSA_NAME
3192 && SSA_NAME_VAR (*defp) == var)
3193 TREE_TYPE (*defp) = TREE_TYPE (var);
3198 /* Initialize the static chain. */
3199 p = DECL_STRUCT_FUNCTION (fn)->static_chain_decl;
3200 gcc_assert (fn != current_function_decl);
3201 if (p)
3203 /* No static chain? Seems like a bug in tree-nested.c. */
3204 gcc_assert (static_chain);
3206 setup_one_parameter (id, p, static_chain, fn, bb, &vars);
3209 declare_inline_vars (id->block, vars);
3213 /* Declare a return variable to replace the RESULT_DECL of the
3214 function we are calling (ID->src_fn). The replacement is entered
3215 into ID's decl map for the RESULT_DECL and remembered in ID->retvar;
3216 nothing is done for callees whose result type is void.
3218 RETURN_SLOT, if non-null, is the place where to store the result. It
3219 is set only for CALL_EXPR_RETURN_SLOT_OPT. MODIFY_DEST, if non-null,
3220 was the LHS of the MODIFY_EXPR to which this call is the RHS.
3222 RETURN_BOUNDS, if non-null, requests a "retbnd" temporary that is
recorded in ID->retbnd; its initialization from the zero bounds
variable is inserted through insert_init_stmt for ENTRY_BB.
3224 The return value is a (possibly null) value that holds the result
3225 as seen by the caller. It is null when the callee returns void and
when RETURN_SLOT or MODIFY_DEST is used directly as the variable. */
3227 static tree
3228 declare_return_variable (copy_body_data *id, tree return_slot, tree modify_dest,
3229 tree return_bounds, basic_block entry_bb)
3231 tree callee = id->src_fn;
3232 tree result = DECL_RESULT (callee);
3233 tree callee_type = TREE_TYPE (result);
3234 tree caller_type;
3235 tree var, use;
3237 /* Handle type-mismatches in the function declaration return type
3238 vs. the call expression. */
3239 if (modify_dest)
3240 caller_type = TREE_TYPE (modify_dest);
3241 else
3242 caller_type = TREE_TYPE (TREE_TYPE (callee));
3244 /* We don't need to do anything for functions that don't return anything. */
3245 if (VOID_TYPE_P (callee_type))
3246 return NULL_TREE;
3248 /* If there was a return slot, then the return value is the
3249 dereferenced address of that object. */
3250 if (return_slot)
3252 /* The front end shouldn't have used both return_slot and
3253 a modify expression. */
3254 gcc_assert (!modify_dest);
3255 if (DECL_BY_REFERENCE (result))
3257 tree return_slot_addr = build_fold_addr_expr (return_slot);
3258 STRIP_USELESS_TYPE_CONVERSION (return_slot_addr);
3260 /* We are going to construct *&return_slot and we can't do that
3261 for variables believed to be not addressable.
3263 FIXME: This check possibly can match, because values returned
3264 via return slot optimization are not believed to have address
3265 taken by alias analysis. */
3266 gcc_assert (TREE_CODE (return_slot) != SSA_NAME);
3267 var = return_slot_addr;
3269 else
3271 var = return_slot;
3272 gcc_assert (TREE_CODE (var) != SSA_NAME);
3273 if (TREE_ADDRESSABLE (result))
3274 mark_addressable (var);
/* A complex or vector RESULT_DECL that is not a gimple register must
not be replaced by a decl that is still marked as one. */
3276 if ((TREE_CODE (TREE_TYPE (result)) == COMPLEX_TYPE
3277 || TREE_CODE (TREE_TYPE (result)) == VECTOR_TYPE)
3278 && !DECL_GIMPLE_REG_P (result)
3279 && DECL_P (var))
3280 DECL_GIMPLE_REG_P (var) = 0;
3281 use = NULL;
3282 goto done;
3285 /* All types requiring non-trivial constructors should have been handled. */
3286 gcc_assert (!TREE_ADDRESSABLE (callee_type));
3288 /* Attempt to avoid creating a new temporary variable. */
3289 if (modify_dest
3290 && TREE_CODE (modify_dest) != SSA_NAME)
3292 bool use_it = false;
3294 /* We can't use MODIFY_DEST if there's type promotion involved. */
3295 if (!useless_type_conversion_p (callee_type, caller_type))
3296 use_it = false;
3298 /* ??? If we're assigning to a variable sized type, then we must
3299 reuse the destination variable, because we've no good way to
3300 create variable sized temporaries at this point. */
3301 else if (TREE_CODE (TYPE_SIZE_UNIT (caller_type)) != INTEGER_CST)
3302 use_it = true;
3304 /* If the callee cannot possibly modify MODIFY_DEST, then we can
3305 reuse it as the result of the call directly. Don't do this if
3306 it would promote MODIFY_DEST to addressable. */
3307 else if (TREE_ADDRESSABLE (result))
3308 use_it = false;
3309 else
3311 tree base_m = get_base_address (modify_dest);
3313 /* If the base isn't a decl, then it's a pointer, and we don't
3314 know where that's going to go. */
3315 if (!DECL_P (base_m))
3316 use_it = false;
3317 else if (is_global_var (base_m))
3318 use_it = false;
3319 else if ((TREE_CODE (TREE_TYPE (result)) == COMPLEX_TYPE
3320 || TREE_CODE (TREE_TYPE (result)) == VECTOR_TYPE)
3321 && !DECL_GIMPLE_REG_P (result)
3322 && DECL_GIMPLE_REG_P (base_m))
3323 use_it = false;
3324 else if (!TREE_ADDRESSABLE (base_m))
3325 use_it = true;
3328 if (use_it)
3330 var = modify_dest;
3331 use = NULL;
3332 goto done;
/* From here on a fresh temporary is created, which requires a
constant-sized callee result type. */
3336 gcc_assert (TREE_CODE (TYPE_SIZE_UNIT (callee_type)) == INTEGER_CST);
3338 var = copy_result_decl_to_var (result, id);
3339 DECL_SEEN_IN_BIND_EXPR_P (var) = 1;
3341 /* Do not have the rest of GCC warn about this variable as it should
3342 not be visible to the user. */
3343 TREE_NO_WARNING (var) = 1;
3345 declare_inline_vars (id->block, var);
3347 /* Build the use expr. If the return type of the function was
3348 promoted, convert it back to the expected type. */
3349 use = var;
3350 if (!useless_type_conversion_p (caller_type, TREE_TYPE (var)))
3352 /* If we can match up types by promotion/demotion do so. */
3353 if (fold_convertible_p (caller_type, var))
3354 use = fold_convert (caller_type, var);
3355 else
3357 /* ??? For valid programs we should not end up here.
3358 Still if we end up with truly mismatched types here, fall back
3359 to using a MEM_REF to not leak invalid GIMPLE to the following
3360 passes. */
3361 /* Prevent var from being written into SSA form. */
3362 if (TREE_CODE (TREE_TYPE (var)) == VECTOR_TYPE
3363 || TREE_CODE (TREE_TYPE (var)) == COMPLEX_TYPE)
3364 DECL_GIMPLE_REG_P (var) = false;
3365 else if (is_gimple_reg_type (TREE_TYPE (var)))
3366 TREE_ADDRESSABLE (var) = true;
3367 use = fold_build2 (MEM_REF, caller_type,
3368 build_fold_addr_expr (var),
3369 build_int_cst (ptr_type_node, 0));
3373 STRIP_USELESS_TYPE_CONVERSION (use);
/* When the result is returned by reference, the RESULT_DECL stands for
the address of the temporary, so map it to &VAR. */
3375 if (DECL_BY_REFERENCE (result))
3377 TREE_ADDRESSABLE (var) = 1;
3378 var = build_fold_addr_expr (var);
3381 done:
3382 /* Register the VAR_DECL as the equivalent for the RESULT_DECL; that
3383 way, when the RESULT_DECL is encountered, it will be
3384 automatically replaced by the VAR_DECL.
3386 When returning by reference, ensure that RESULT_DECL remaps to
3387 gimple_val. */
3388 if (DECL_BY_REFERENCE (result)
3389 && !is_gimple_val (var))
3391 tree temp = create_tmp_var (TREE_TYPE (result), "retvalptr");
3392 insert_decl_map (id, result, temp);
3393 /* When RESULT_DECL is in SSA form, we need to remap and initialize
3394 its default_def SSA_NAME. */
3395 if (gimple_in_ssa_p (id->src_cfun)
3396 && is_gimple_reg (result))
3398 temp = make_ssa_name (temp, NULL);
3399 insert_decl_map (id, ssa_default_def (id->src_cfun, result), temp);
3401 insert_init_stmt (id, entry_bb, gimple_build_assign (temp, var));
3403 else
3404 insert_decl_map (id, result, var);
3406 /* Remember this so we can ignore it in remap_decls. */
3407 id->retvar = var;
3409 /* If returned bounds are used, then make var for them. */
3410 if (return_bounds)
3412 tree bndtemp = create_tmp_var (pointer_bounds_type_node, "retbnd");
3413 DECL_SEEN_IN_BIND_EXPR_P (bndtemp) = 1;
3414 TREE_NO_WARNING (bndtemp) = 1;
3415 declare_inline_vars (id->block, bndtemp);
3417 id->retbnd = bndtemp;
3418 insert_init_stmt (id, entry_bb,
3419 gimple_build_assign (bndtemp, chkp_get_zero_bounds_var ()));
3422 return use;
3425 /* Callback through walk_tree. Determine if a DECL_INITIAL makes reference
3426 to a local label. */
3428 static tree
3429 has_label_address_in_static_1 (tree *nodep, int *walk_subtrees, void *fnp)
3431 tree node = *nodep;
3432 tree fn = (tree) fnp;
3434 if (TREE_CODE (node) == LABEL_DECL && DECL_CONTEXT (node) == fn)
3435 return node;
3437 if (TYPE_P (node))
3438 *walk_subtrees = 0;
3440 return NULL_TREE;
3443 /* Determine if the function can be copied. If so return NULL. If
3444 not return a string describng the reason for failure. */
3446 static const char *
3447 copy_forbidden (struct function *fun, tree fndecl)
3449 const char *reason = fun->cannot_be_copied_reason;
3450 tree decl;
3451 unsigned ix;
3453 /* Only examine the function once. */
3454 if (fun->cannot_be_copied_set)
3455 return reason;
3457 /* We cannot copy a function that receives a non-local goto
3458 because we cannot remap the destination label used in the
3459 function that is performing the non-local goto. */
3460 /* ??? Actually, this should be possible, if we work at it.
3461 No doubt there's just a handful of places that simply
3462 assume it doesn't happen and don't substitute properly. */
3463 if (fun->has_nonlocal_label)
3465 reason = G_("function %q+F can never be copied "
3466 "because it receives a non-local goto");
3467 goto fail;
3470 FOR_EACH_LOCAL_DECL (fun, ix, decl)
3471 if (TREE_CODE (decl) == VAR_DECL
3472 && TREE_STATIC (decl)
3473 && !DECL_EXTERNAL (decl)
3474 && DECL_INITIAL (decl)
3475 && walk_tree_without_duplicates (&DECL_INITIAL (decl),
3476 has_label_address_in_static_1,
3477 fndecl))
3479 reason = G_("function %q+F can never be copied because it saves "
3480 "address of local label in a static variable");
3481 goto fail;
3484 fail:
3485 fun->cannot_be_copied_reason = reason;
3486 fun->cannot_be_copied_set = true;
3487 return reason;
/* Diagnostic format string explaining why the function most recently
examined by inline_forbidden_p cannot be inlined. It is set by
inline_forbidden_p and inline_forbidden_p_stmt and passed, together
with the function, to error/warning by tree_inlinable_function_p. */
3491 static const char *inline_forbidden_reason;
3493 /* A callback for walk_gimple_seq to handle statements. Returns non-null
3494 iff a function can not be inlined. Also sets the reason why.
WIP->info carries the FUNCTION_DECL being examined. When a blocking
construct is found, inline_forbidden_reason is set and *HANDLED_OPS_P is
set to true before returning; otherwise *HANDLED_OPS_P is set to false
and NULL_TREE is returned. */
3496 static tree
3497 inline_forbidden_p_stmt (gimple_stmt_iterator *gsi, bool *handled_ops_p,
3498 struct walk_stmt_info *wip)
3500 tree fn = (tree) wip->info;
3501 tree t;
3502 gimple stmt = gsi_stmt (*gsi);
3504 switch (gimple_code (stmt))
3506 case GIMPLE_CALL:
3507 /* Refuse to inline alloca call unless user explicitly forced so as
3508 this may change program's memory overhead drastically when the
3509 function using alloca is called in loop. In GCC present in
3510 SPEC2000 inlining into schedule_block cause it to require 2GB of
3511 RAM instead of 256MB. Don't do so for alloca calls emitted for
3512 VLA objects as those can't cause unbounded growth (they're always
3513 wrapped inside stack_save/stack_restore regions). */
3514 if (gimple_alloca_call_p (stmt)
3515 && !gimple_call_alloca_for_var_p (stmt)
3516 && !lookup_attribute ("always_inline", DECL_ATTRIBUTES (fn)))
3518 inline_forbidden_reason
3519 = G_("function %q+F can never be inlined because it uses "
3520 "alloca (override using the always_inline attribute)");
3521 *handled_ops_p = true;
3522 return fn;
/* The remaining checks need the called function's declaration; calls
without one are not examined further. */
3525 t = gimple_call_fndecl (stmt);
3526 if (t == NULL_TREE)
3527 break;
3529 /* We cannot inline functions that call setjmp. */
3530 if (setjmp_call_p (t))
3532 inline_forbidden_reason
3533 = G_("function %q+F can never be inlined because it uses setjmp");
3534 *handled_ops_p = true;
3535 return t;
3538 if (DECL_BUILT_IN_CLASS (t) == BUILT_IN_NORMAL)
3539 switch (DECL_FUNCTION_CODE (t))
3541 /* We cannot inline functions that take a variable number of
3542 arguments. */
3543 case BUILT_IN_VA_START:
3544 case BUILT_IN_NEXT_ARG:
3545 case BUILT_IN_VA_END:
3546 inline_forbidden_reason
3547 = G_("function %q+F can never be inlined because it "
3548 "uses variable argument lists");
3549 *handled_ops_p = true;
3550 return t;
3552 case BUILT_IN_LONGJMP:
3553 /* We can't inline functions that call __builtin_longjmp at
3554 all. The non-local goto machinery really requires the
3555 destination be in a different function. If we allow the
3556 function calling __builtin_longjmp to be inlined into the
3557 function calling __builtin_setjmp, Things will Go Awry. */
3558 inline_forbidden_reason
3559 = G_("function %q+F can never be inlined because "
3560 "it uses setjmp-longjmp exception handling");
3561 *handled_ops_p = true;
3562 return t;
3564 case BUILT_IN_NONLOCAL_GOTO:
3565 /* Similarly. */
3566 inline_forbidden_reason
3567 = G_("function %q+F can never be inlined because "
3568 "it uses non-local goto");
3569 *handled_ops_p = true;
3570 return t;
3572 case BUILT_IN_RETURN:
3573 case BUILT_IN_APPLY_ARGS:
3574 /* If a __builtin_apply_args caller would be inlined,
3575 it would be saving arguments of the function it has
3576 been inlined into. Similarly __builtin_return would
3577 return from the function the inline has been inlined into. */
3578 inline_forbidden_reason
3579 = G_("function %q+F can never be inlined because "
3580 "it uses __builtin_return or __builtin_apply_args");
3581 *handled_ops_p = true;
3582 return t;
3584 default:
3585 break;
3587 break;
3589 case GIMPLE_GOTO:
3590 t = gimple_goto_dest (stmt);
3592 /* We will not inline a function which uses computed goto. The
3593 addresses of its local labels, which may be tucked into
3594 global storage, are of course not constant across
3595 instantiations, which causes unexpected behavior. */
3596 if (TREE_CODE (t) != LABEL_DECL)
3598 inline_forbidden_reason
3599 = G_("function %q+F can never be inlined "
3600 "because it contains a computed goto");
3601 *handled_ops_p = true;
3602 return t;
3604 break;
3606 default:
3607 break;
/* Nothing objectionable in this statement. */
3610 *handled_ops_p = false;
3611 return NULL_TREE;
3614 /* Return true if FNDECL is a function that cannot be inlined into
3615 another one. */
3617 static bool
3618 inline_forbidden_p (tree fndecl)
3620 struct function *fun = DECL_STRUCT_FUNCTION (fndecl);
3621 struct walk_stmt_info wi;
3622 basic_block bb;
3623 bool forbidden_p = false;
3625 /* First check for shared reasons not to copy the code. */
3626 inline_forbidden_reason = copy_forbidden (fun, fndecl);
3627 if (inline_forbidden_reason != NULL)
3628 return true;
3630 /* Next, walk the statements of the function looking for
3631 constraucts we can't handle, or are non-optimal for inlining. */
3632 hash_set<tree> visited_nodes;
3633 memset (&wi, 0, sizeof (wi));
3634 wi.info = (void *) fndecl;
3635 wi.pset = &visited_nodes;
3637 FOR_EACH_BB_FN (bb, fun)
3639 gimple ret;
3640 gimple_seq seq = bb_seq (bb);
3641 ret = walk_gimple_seq (seq, inline_forbidden_p_stmt, NULL, &wi);
3642 forbidden_p = (ret != NULL);
3643 if (forbidden_p)
3644 break;
3647 return forbidden_p;
3650 /* Return false if the function FNDECL cannot be inlined on account of its
3651 attributes, true otherwise. */
3652 static bool
3653 function_attribute_inlinable_p (const_tree fndecl)
3655 if (targetm.attribute_table)
3657 const_tree a;
3659 for (a = DECL_ATTRIBUTES (fndecl); a; a = TREE_CHAIN (a))
3661 const_tree name = TREE_PURPOSE (a);
3662 int i;
3664 for (i = 0; targetm.attribute_table[i].name != NULL; i++)
3665 if (is_attribute_p (targetm.attribute_table[i].name, name))
3666 return targetm.function_attribute_inlinable_p (fndecl);
3670 return true;
3673 /* Returns nonzero if FN is a function that does not have any
3674 fundamental inline blocking properties. */
3676 bool
3677 tree_inlinable_function_p (tree fn)
3679 bool inlinable = true;
3680 bool do_warning;
3681 tree always_inline;
3683 /* If we've already decided this function shouldn't be inlined,
3684 there's no need to check again. */
3685 if (DECL_UNINLINABLE (fn))
3686 return false;
3688 /* We only warn for functions declared `inline' by the user. */
3689 do_warning = (warn_inline
3690 && DECL_DECLARED_INLINE_P (fn)
3691 && !DECL_NO_INLINE_WARNING_P (fn)
3692 && !DECL_IN_SYSTEM_HEADER (fn));
3694 always_inline = lookup_attribute ("always_inline", DECL_ATTRIBUTES (fn));
3696 if (flag_no_inline
3697 && always_inline == NULL)
3699 if (do_warning)
3700 warning (OPT_Winline, "function %q+F can never be inlined because it "
3701 "is suppressed using -fno-inline", fn);
3702 inlinable = false;
3705 else if (!function_attribute_inlinable_p (fn))
3707 if (do_warning)
3708 warning (OPT_Winline, "function %q+F can never be inlined because it "
3709 "uses attributes conflicting with inlining", fn);
3710 inlinable = false;
3713 else if (inline_forbidden_p (fn))
3715 /* See if we should warn about uninlinable functions. Previously,
3716 some of these warnings would be issued while trying to expand
3717 the function inline, but that would cause multiple warnings
3718 about functions that would for example call alloca. But since
3719 this a property of the function, just one warning is enough.
3720 As a bonus we can now give more details about the reason why a
3721 function is not inlinable. */
3722 if (always_inline)
3723 error (inline_forbidden_reason, fn);
3724 else if (do_warning)
3725 warning (OPT_Winline, inline_forbidden_reason, fn);
3727 inlinable = false;
3730 /* Squirrel away the result so that we don't have to check again. */
3731 DECL_UNINLINABLE (fn) = !inlinable;
3733 return inlinable;
3736 /* Estimate the cost of a memory move of type TYPE. Use machine dependent
3737 word size and take possible memcpy call into account and return
3738 cost based on whether optimizing for size or speed according to SPEED_P. */
3741 estimate_move_cost (tree type, bool ARG_UNUSED (speed_p))
3743 HOST_WIDE_INT size;
3745 gcc_assert (!VOID_TYPE_P (type));
3747 if (TREE_CODE (type) == VECTOR_TYPE)
3749 machine_mode inner = TYPE_MODE (TREE_TYPE (type));
3750 machine_mode simd
3751 = targetm.vectorize.preferred_simd_mode (inner);
3752 int simd_mode_size = GET_MODE_SIZE (simd);
3753 return ((GET_MODE_SIZE (TYPE_MODE (type)) + simd_mode_size - 1)
3754 / simd_mode_size);
3757 size = int_size_in_bytes (type);
3759 if (size < 0 || size > MOVE_MAX_PIECES * MOVE_RATIO (speed_p))
3760 /* Cost of a memcpy call, 3 arguments and the call. */
3761 return 4;
3762 else
3763 return ((size + MOVE_MAX_PIECES - 1) / MOVE_MAX_PIECES);
3766 /* Returns cost of operation CODE, according to WEIGHTS.
OP1 is unused. OP2 is only inspected for the division and modulo
codes: these cost WEIGHTS->div_mod_cost unless OP2 is an INTEGER_CST,
in which case they cost 1 like the usual operations. Conversions and
the other codes in the first group are free. Any code not listed must
be a GIMPLE_SINGLE_RHS (asserted) and costs 0. */
3768 static int
3769 estimate_operator_cost (enum tree_code code, eni_weights *weights,
3770 tree op1 ATTRIBUTE_UNUSED, tree op2)
3772 switch (code)
3774 /* These are "free" conversions, or their presumed cost
3775 is folded into other operations. */
3776 case RANGE_EXPR:
3777 CASE_CONVERT:
3778 case COMPLEX_EXPR:
3779 case PAREN_EXPR:
3780 case VIEW_CONVERT_EXPR:
3781 return 0;
3783 /* Assign cost of 1 to usual operations.
3784 ??? We may consider mapping RTL costs to this. */
3785 case COND_EXPR:
3786 case VEC_COND_EXPR:
3787 case VEC_PERM_EXPR:
3789 case PLUS_EXPR:
3790 case POINTER_PLUS_EXPR:
3791 case MINUS_EXPR:
3792 case MULT_EXPR:
3793 case MULT_HIGHPART_EXPR:
3794 case FMA_EXPR:
3796 case ADDR_SPACE_CONVERT_EXPR:
3797 case FIXED_CONVERT_EXPR:
3798 case FIX_TRUNC_EXPR:
3800 case NEGATE_EXPR:
3801 case FLOAT_EXPR:
3802 case MIN_EXPR:
3803 case MAX_EXPR:
3804 case ABS_EXPR:
3806 case LSHIFT_EXPR:
3807 case RSHIFT_EXPR:
3808 case LROTATE_EXPR:
3809 case RROTATE_EXPR:
3811 case BIT_IOR_EXPR:
3812 case BIT_XOR_EXPR:
3813 case BIT_AND_EXPR:
3814 case BIT_NOT_EXPR:
3816 case TRUTH_ANDIF_EXPR:
3817 case TRUTH_ORIF_EXPR:
3818 case TRUTH_AND_EXPR:
3819 case TRUTH_OR_EXPR:
3820 case TRUTH_XOR_EXPR:
3821 case TRUTH_NOT_EXPR:
3823 case LT_EXPR:
3824 case LE_EXPR:
3825 case GT_EXPR:
3826 case GE_EXPR:
3827 case EQ_EXPR:
3828 case NE_EXPR:
3829 case ORDERED_EXPR:
3830 case UNORDERED_EXPR:
3832 case UNLT_EXPR:
3833 case UNLE_EXPR:
3834 case UNGT_EXPR:
3835 case UNGE_EXPR:
3836 case UNEQ_EXPR:
3837 case LTGT_EXPR:
3839 case CONJ_EXPR:
3841 case PREDECREMENT_EXPR:
3842 case PREINCREMENT_EXPR:
3843 case POSTDECREMENT_EXPR:
3844 case POSTINCREMENT_EXPR:
3846 case REALIGN_LOAD_EXPR:
3848 case REDUC_MAX_EXPR:
3849 case REDUC_MIN_EXPR:
3850 case REDUC_PLUS_EXPR:
3851 case WIDEN_SUM_EXPR:
3852 case WIDEN_MULT_EXPR:
3853 case DOT_PROD_EXPR:
3854 case SAD_EXPR:
3855 case WIDEN_MULT_PLUS_EXPR:
3856 case WIDEN_MULT_MINUS_EXPR:
3857 case WIDEN_LSHIFT_EXPR:
3859 case VEC_WIDEN_MULT_HI_EXPR:
3860 case VEC_WIDEN_MULT_LO_EXPR:
3861 case VEC_WIDEN_MULT_EVEN_EXPR:
3862 case VEC_WIDEN_MULT_ODD_EXPR:
3863 case VEC_UNPACK_HI_EXPR:
3864 case VEC_UNPACK_LO_EXPR:
3865 case VEC_UNPACK_FLOAT_HI_EXPR:
3866 case VEC_UNPACK_FLOAT_LO_EXPR:
3867 case VEC_PACK_TRUNC_EXPR:
3868 case VEC_PACK_SAT_EXPR:
3869 case VEC_PACK_FIX_TRUNC_EXPR:
3870 case VEC_WIDEN_LSHIFT_HI_EXPR:
3871 case VEC_WIDEN_LSHIFT_LO_EXPR:
3873 return 1;
3875 /* Few special cases of expensive operations. This is useful
3876 to avoid inlining on functions having too many of these.
Division or modulo by an INTEGER_CST is costed like a usual
operation. */
3877 case TRUNC_DIV_EXPR:
3878 case CEIL_DIV_EXPR:
3879 case FLOOR_DIV_EXPR:
3880 case ROUND_DIV_EXPR:
3881 case EXACT_DIV_EXPR:
3882 case TRUNC_MOD_EXPR:
3883 case CEIL_MOD_EXPR:
3884 case FLOOR_MOD_EXPR:
3885 case ROUND_MOD_EXPR:
3886 case RDIV_EXPR:
3887 if (TREE_CODE (op2) != INTEGER_CST)
3888 return weights->div_mod_cost;
3889 return 1;
3891 default:
3892 /* We expect a copy assignment with no operator. */
3893 gcc_assert (get_gimple_rhs_class (code) == GIMPLE_SINGLE_RHS);
3894 return 0;
3899 /* Estimate number of instructions that will be created by expanding
3900 the statements in the statement sequence STMTS.
3901 WEIGHTS contains weights attributed to various constructs. */
3903 static
3904 int estimate_num_insns_seq (gimple_seq stmts, eni_weights *weights)
3906 int cost;
3907 gimple_stmt_iterator gsi;
3909 cost = 0;
3910 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
3911 cost += estimate_num_insns (gsi_stmt (gsi), weights);
3913 return cost;
3917 /* Estimate number of instructions that will be created by expanding STMT.
3918 WEIGHTS contains weights attributed to various constructs. */
3921 estimate_num_insns (gimple stmt, eni_weights *weights)
3923 unsigned cost, i;
3924 enum gimple_code code = gimple_code (stmt);
3925 tree lhs;
3926 tree rhs;
3928 switch (code)
3930 case GIMPLE_ASSIGN:
3931 /* Try to estimate the cost of assignments. We have three cases to
3932 deal with:
3933 1) Simple assignments to registers;
3934 2) Stores to things that must live in memory. This includes
3935 "normal" stores to scalars, but also assignments of large
3936 structures, or constructors of big arrays;
3938 Let us look at the first two cases, assuming we have "a = b + C":
3939 <GIMPLE_ASSIGN <var_decl "a">
3940 <plus_expr <var_decl "b"> <constant C>>
3941 If "a" is a GIMPLE register, the assignment to it is free on almost
3942 any target, because "a" usually ends up in a real register. Hence
3943 the only cost of this expression comes from the PLUS_EXPR, and we
3944 can ignore the GIMPLE_ASSIGN.
3945 If "a" is not a GIMPLE register, the assignment to "a" will most
3946 likely be a real store, so the cost of the GIMPLE_ASSIGN is the cost
3947 of moving something into "a", which we compute using the function
3948 estimate_move_cost. */
3949 if (gimple_clobber_p (stmt))
3950 return 0; /* ={v} {CLOBBER} stmt expands to nothing. */
3952 lhs = gimple_assign_lhs (stmt);
3953 rhs = gimple_assign_rhs1 (stmt);
3955 cost = 0;
3957 /* Account for the cost of moving to / from memory. */
3958 if (gimple_store_p (stmt))
3959 cost += estimate_move_cost (TREE_TYPE (lhs), weights->time_based);
3960 if (gimple_assign_load_p (stmt))
3961 cost += estimate_move_cost (TREE_TYPE (rhs), weights->time_based);
3963 cost += estimate_operator_cost (gimple_assign_rhs_code (stmt), weights,
3964 gimple_assign_rhs1 (stmt),
3965 get_gimple_rhs_class (gimple_assign_rhs_code (stmt))
3966 == GIMPLE_BINARY_RHS
3967 ? gimple_assign_rhs2 (stmt) : NULL);
3968 break;
3970 case GIMPLE_COND:
3971 cost = 1 + estimate_operator_cost (gimple_cond_code (stmt), weights,
3972 gimple_op (stmt, 0),
3973 gimple_op (stmt, 1));
3974 break;
3976 case GIMPLE_SWITCH:
3977 /* Take into account cost of the switch + guess 2 conditional jumps for
3978 each case label.
3980 TODO: once the switch expansion logic is sufficiently separated, we can
3981 do better job on estimating cost of the switch. */
3982 if (weights->time_based)
3983 cost = floor_log2 (gimple_switch_num_labels (stmt)) * 2;
3984 else
3985 cost = gimple_switch_num_labels (stmt) * 2;
3986 break;
3988 case GIMPLE_CALL:
3990 tree decl;
3992 if (gimple_call_internal_p (stmt))
3993 return 0;
3994 else if ((decl = gimple_call_fndecl (stmt))
3995 && DECL_BUILT_IN (decl))
3997 /* Do not special case builtins where we see the body.
3998 This just confuse inliner. */
3999 struct cgraph_node *node;
4000 if (!(node = cgraph_node::get (decl))
4001 || node->definition)
4003 /* For buitins that are likely expanded to nothing or
4004 inlined do not account operand costs. */
4005 else if (is_simple_builtin (decl))
4006 return 0;
4007 else if (is_inexpensive_builtin (decl))
4008 return weights->target_builtin_call_cost;
4009 else if (DECL_BUILT_IN_CLASS (decl) == BUILT_IN_NORMAL)
4011 /* We canonicalize x * x to pow (x, 2.0) with -ffast-math, so
4012 specialize the cheap expansion we do here.
4013 ??? This asks for a more general solution. */
4014 switch (DECL_FUNCTION_CODE (decl))
4016 case BUILT_IN_POW:
4017 case BUILT_IN_POWF:
4018 case BUILT_IN_POWL:
4019 if (TREE_CODE (gimple_call_arg (stmt, 1)) == REAL_CST
4020 && REAL_VALUES_EQUAL
4021 (TREE_REAL_CST (gimple_call_arg (stmt, 1)), dconst2))
4022 return estimate_operator_cost
4023 (MULT_EXPR, weights, gimple_call_arg (stmt, 0),
4024 gimple_call_arg (stmt, 0));
4025 break;
4027 default:
4028 break;
4033 cost = decl ? weights->call_cost : weights->indirect_call_cost;
4034 if (gimple_call_lhs (stmt))
4035 cost += estimate_move_cost (TREE_TYPE (gimple_call_lhs (stmt)),
4036 weights->time_based);
4037 for (i = 0; i < gimple_call_num_args (stmt); i++)
4039 tree arg = gimple_call_arg (stmt, i);
4040 cost += estimate_move_cost (TREE_TYPE (arg),
4041 weights->time_based);
4043 break;
4046 case GIMPLE_RETURN:
4047 return weights->return_cost;
4049 case GIMPLE_GOTO:
4050 case GIMPLE_LABEL:
4051 case GIMPLE_NOP:
4052 case GIMPLE_PHI:
4053 case GIMPLE_PREDICT:
4054 case GIMPLE_DEBUG:
4055 return 0;
4057 case GIMPLE_ASM:
4059 int count = asm_str_count (gimple_asm_string (stmt));
4060 /* 1000 means infinity. This avoids overflows later
4061 with very long asm statements. */
4062 if (count > 1000)
4063 count = 1000;
4064 return count;
4067 case GIMPLE_RESX:
4068 /* This is either going to be an external function call with one
4069 argument, or two register copy statements plus a goto. */
4070 return 2;
4072 case GIMPLE_EH_DISPATCH:
4073 /* ??? This is going to turn into a switch statement. Ideally
4074 we'd have a look at the eh region and estimate the number of
4075 edges involved. */
4076 return 10;
4078 case GIMPLE_BIND:
4079 return estimate_num_insns_seq (gimple_bind_body (stmt), weights);
4081 case GIMPLE_EH_FILTER:
4082 return estimate_num_insns_seq (gimple_eh_filter_failure (stmt), weights);
4084 case GIMPLE_CATCH:
4085 return estimate_num_insns_seq (gimple_catch_handler (stmt), weights);
4087 case GIMPLE_TRY:
4088 return (estimate_num_insns_seq (gimple_try_eval (stmt), weights)
4089 + estimate_num_insns_seq (gimple_try_cleanup (stmt), weights));
4091 /* OpenMP directives are generally very expensive. */
4093 case GIMPLE_OMP_RETURN:
4094 case GIMPLE_OMP_SECTIONS_SWITCH:
4095 case GIMPLE_OMP_ATOMIC_STORE:
4096 case GIMPLE_OMP_CONTINUE:
4097 /* ...except these, which are cheap. */
4098 return 0;
4100 case GIMPLE_OMP_ATOMIC_LOAD:
4101 return weights->omp_cost;
4103 case GIMPLE_OMP_FOR:
4104 return (weights->omp_cost
4105 + estimate_num_insns_seq (gimple_omp_body (stmt), weights)
4106 + estimate_num_insns_seq (gimple_omp_for_pre_body (stmt), weights));
4108 case GIMPLE_OMP_PARALLEL:
4109 case GIMPLE_OMP_TASK:
4110 case GIMPLE_OMP_CRITICAL:
4111 case GIMPLE_OMP_MASTER:
4112 case GIMPLE_OMP_TASKGROUP:
4113 case GIMPLE_OMP_ORDERED:
4114 case GIMPLE_OMP_SECTION:
4115 case GIMPLE_OMP_SECTIONS:
4116 case GIMPLE_OMP_SINGLE:
4117 case GIMPLE_OMP_TARGET:
4118 case GIMPLE_OMP_TEAMS:
4119 return (weights->omp_cost
4120 + estimate_num_insns_seq (gimple_omp_body (stmt), weights));
4122 case GIMPLE_TRANSACTION:
4123 return (weights->tm_cost
4124 + estimate_num_insns_seq (gimple_transaction_body (stmt),
4125 weights));
4127 default:
4128 gcc_unreachable ();
4131 return cost;
4134 /* Estimate number of instructions that will be created by expanding
4135 function FNDECL. WEIGHTS contains weights attributed to various
4136 constructs. */
4139 estimate_num_insns_fn (tree fndecl, eni_weights *weights)
4141 struct function *my_function = DECL_STRUCT_FUNCTION (fndecl);
4142 gimple_stmt_iterator bsi;
4143 basic_block bb;
4144 int n = 0;
4146 gcc_assert (my_function && my_function->cfg);
4147 FOR_EACH_BB_FN (bb, my_function)
4149 for (bsi = gsi_start_bb (bb); !gsi_end_p (bsi); gsi_next (&bsi))
4150 n += estimate_num_insns (gsi_stmt (bsi), weights);
4153 return n;
4157 /* Initializes weights used by estimate_num_insns. */
4159 void
4160 init_inline_once (void)
4162 eni_size_weights.call_cost = 1;
4163 eni_size_weights.indirect_call_cost = 3;
4164 eni_size_weights.target_builtin_call_cost = 1;
4165 eni_size_weights.div_mod_cost = 1;
4166 eni_size_weights.omp_cost = 40;
4167 eni_size_weights.tm_cost = 10;
4168 eni_size_weights.time_based = false;
4169 eni_size_weights.return_cost = 1;
4171 /* Estimating time for call is difficult, since we have no idea what the
4172 called function does. In the current uses of eni_time_weights,
4173 underestimating the cost does less harm than overestimating it, so
4174 we choose a rather small value here. */
4175 eni_time_weights.call_cost = 10;
4176 eni_time_weights.indirect_call_cost = 15;
4177 eni_time_weights.target_builtin_call_cost = 1;
4178 eni_time_weights.div_mod_cost = 10;
4179 eni_time_weights.omp_cost = 40;
4180 eni_time_weights.tm_cost = 40;
4181 eni_time_weights.time_based = true;
4182 eni_time_weights.return_cost = 2;
4185 /* Estimate the number of instructions in a gimple_seq. */
4188 count_insns_seq (gimple_seq seq, eni_weights *weights)
4190 gimple_stmt_iterator gsi;
4191 int n = 0;
4192 for (gsi = gsi_start (seq); !gsi_end_p (gsi); gsi_next (&gsi))
4193 n += estimate_num_insns (gsi_stmt (gsi), weights);
4195 return n;
4199 /* Install new lexical TREE_BLOCK underneath 'current_block'. */
4201 static void
4202 prepend_lexical_block (tree current_block, tree new_block)
4204 BLOCK_CHAIN (new_block) = BLOCK_SUBBLOCKS (current_block);
4205 BLOCK_SUBBLOCKS (current_block) = new_block;
4206 BLOCK_SUPERCONTEXT (new_block) = current_block;
4209 /* Add local variables from CALLEE to CALLER. */
4211 static inline void
4212 add_local_variables (struct function *callee, struct function *caller,
4213 copy_body_data *id)
4215 tree var;
4216 unsigned ix;
4218 FOR_EACH_LOCAL_DECL (callee, ix, var)
4219 if (!can_be_nonlocal (var, id))
4221 tree new_var = remap_decl (var, id);
4223 /* Remap debug-expressions. */
4224 if (TREE_CODE (new_var) == VAR_DECL
4225 && DECL_HAS_DEBUG_EXPR_P (var)
4226 && new_var != var)
4228 tree tem = DECL_DEBUG_EXPR (var);
4229 bool old_regimplify = id->regimplify;
4230 id->remapping_type_depth++;
4231 walk_tree (&tem, copy_tree_body_r, id, NULL);
4232 id->remapping_type_depth--;
4233 id->regimplify = old_regimplify;
4234 SET_DECL_DEBUG_EXPR (new_var, tem);
4235 DECL_HAS_DEBUG_EXPR_P (new_var) = 1;
4237 add_local_decl (caller, new_var);
4241 /* If STMT is a GIMPLE_CALL, replace it with its inline expansion.
   BB is the basic block holding STMT; ID carries the inlining state and
   supplies the destination call-graph node used to look up the edge for
   STMT.  Returns true only when the callee body was actually copied in;
   every early exit goes through the egress label, which restores
   input_location and returns false.  */
4243 static bool
4244 expand_call_inline (basic_block bb, gimple stmt, copy_body_data *id)
4246 tree use_retvar;
4247 tree fn;
4248 hash_map<tree, tree> *dst;
4249 hash_map<tree, tree> *st = NULL;
4250 tree return_slot;
4251 tree modify_dest;
4252 tree return_bounds = NULL;
4253 location_t saved_location;
4254 struct cgraph_edge *cg_edge;
4255 cgraph_inline_failed_t reason;
4256 basic_block return_block;
4257 edge e;
4258 gimple_stmt_iterator gsi, stmt_gsi;
4259 bool successfully_inlined = FALSE;
4260 bool purge_dead_abnormal_edges;
4261 unsigned int i;
4263 /* Set input_location here so we get the right instantiation context
4264 if we call instantiate_decl from inlinable_function_p. */
4265 /* FIXME: instantiate_decl isn't called by inlinable_function_p. */
4266 saved_location = input_location;
4267 input_location = gimple_location (stmt);
4269 /* From here on, we're only interested in CALL_EXPRs. */
4270 if (gimple_code (stmt) != GIMPLE_CALL)
4271 goto egress;
4273 cg_edge = id->dst_node->get_edge (stmt);
4274 gcc_checking_assert (cg_edge);
4275 /* First, see if we can figure out what function is being called.
4276 If we cannot, then there is no hope of inlining the function. */
4277 if (cg_edge->indirect_unknown_callee)
4278 goto egress;
4279 fn = cg_edge->callee->decl;
4280 gcc_checking_assert (fn);
4282 /* If FN is a declaration of a function in a nested scope that was
4283 globally declared inline, we don't set its DECL_INITIAL.
4284 However, we can't blindly follow DECL_ABSTRACT_ORIGIN because the
4285 C++ front-end uses it for cdtors to refer to their internal
4286 declarations, that are not real functions. Fortunately those
4287 don't have trees to be saved, so we can tell by checking their
4288 gimple_body. */
4289 if (!DECL_INITIAL (fn)
4290 && DECL_ABSTRACT_ORIGIN (fn)
4291 && gimple_has_body_p (DECL_ABSTRACT_ORIGIN (fn)))
4292 fn = DECL_ABSTRACT_ORIGIN (fn);
4294 /* Don't try to inline functions that are not well-suited to inlining. */
4295 if (cg_edge->inline_failed)
4297 reason = cg_edge->inline_failed;
4298 /* If this call was originally indirect, we do not want to emit any
4299 inlining related warnings or sorry messages because there are no
4300 guarantees regarding those. */
4301 if (cg_edge->indirect_inlining_edge)
4302 goto egress;
4304 if (lookup_attribute ("always_inline", DECL_ATTRIBUTES (fn))
4305 /* For extern inline functions that get redefined we always
4306 silently ignored always_inline flag. Better behaviour would
4307 be to be able to keep both bodies and use extern inline body
4308 for inlining, but we can't do that because frontends overwrite
4309 the body. */
4310 && !cg_edge->callee->local.redefined_extern_inline
4311 /* During early inline pass, report only when optimization is
4312 not turned on. */
4313 && (symtab->global_info_ready
4314 || !optimize
4315 || cgraph_inline_failed_type (reason) == CIF_FINAL_ERROR)
4316 /* PR 20090218-1_0.c. Body can be provided by another module. */
4317 && (reason != CIF_BODY_NOT_AVAILABLE || !flag_generate_lto))
/* NOTE(review): the failure string is passed to error () as-is here but
   wrapped in _() for the warning below; and "called from here" is
   emitted as a second error/warning rather than a note -- confirm both
   are intended.  */
4319 error ("inlining failed in call to always_inline %q+F: %s", fn,
4320 cgraph_inline_failed_string (reason));
4321 error ("called from here");
4323 else if (warn_inline
4324 && DECL_DECLARED_INLINE_P (fn)
4325 && !DECL_NO_INLINE_WARNING_P (fn)
4326 && !DECL_IN_SYSTEM_HEADER (fn)
4327 && reason != CIF_UNSPECIFIED
4328 && !lookup_attribute ("noinline", DECL_ATTRIBUTES (fn))
4329 /* Do not warn about not inlined recursive calls. */
4330 && !cg_edge->recursive_p ()
4331 /* Avoid warnings during early inline pass. */
4332 && symtab->global_info_ready)
4334 warning (OPT_Winline, "inlining failed in call to %q+F: %s",
4335 fn, _(cgraph_inline_failed_string (reason)));
4336 warning (OPT_Winline, "called from here");
4338 goto egress;
/* NOTE(review): FN is reset to the callee decl here, so the
   DECL_ABSTRACT_ORIGIN substitution made earlier only affects the
   diagnostics in the inline_failed path above.  */
4340 fn = cg_edge->callee->decl;
4341 cg_edge->callee->get_untransformed_body ();
4343 #ifdef ENABLE_CHECKING
4344 if (cg_edge->callee->decl != id->dst_node->decl)
4345 cg_edge->callee->verify ();
4346 #endif
4348 /* We will be inlining this callee. */
4349 id->eh_lp_nr = lookup_stmt_eh_lp (stmt);
4350 id->assign_stmts.create (0);
4352 /* Update the callers EH personality. */
4353 if (DECL_FUNCTION_PERSONALITY (cg_edge->callee->decl))
4354 DECL_FUNCTION_PERSONALITY (cg_edge->caller->decl)
4355 = DECL_FUNCTION_PERSONALITY (cg_edge->callee->decl);
4357 /* Split the block holding the GIMPLE_CALL. */
4358 e = split_block (bb, stmt);
4359 bb = e->src;
4360 return_block = e->dest;
4361 remove_edge (e);
4363 /* split_block splits after the statement; work around this by
4364 moving the call into the second block manually. Not pretty,
4365 but seems easier than doing the CFG manipulation by hand
4366 when the GIMPLE_CALL is in the last statement of BB. */
4367 stmt_gsi = gsi_last_bb (bb);
4368 gsi_remove (&stmt_gsi, false);
4370 /* If the GIMPLE_CALL was in the last statement of BB, it may have
4371 been the source of abnormal edges. In this case, schedule
4372 the removal of dead abnormal edges. */
4373 gsi = gsi_start_bb (return_block);
4374 if (gsi_end_p (gsi))
4376 gsi_insert_after (&gsi, stmt, GSI_NEW_STMT);
4377 purge_dead_abnormal_edges = true;
4379 else
4381 gsi_insert_before (&gsi, stmt, GSI_NEW_STMT);
4382 purge_dead_abnormal_edges = false;
4385 stmt_gsi = gsi_start_bb (return_block);
4387 /* Build a block containing code to initialize the arguments, the
4388 actual inline expansion of the body, and a label for the return
4389 statements within the function to jump to. The type of the
4390 statement expression is the return type of the function call.
4391 ??? If the call does not have an associated block then we will
4392 remap all callee blocks to NULL, effectively dropping most of
4393 its debug information. This should only happen for calls to
4394 artificial decls inserted by the compiler itself. We need to
4395 either link the inlined blocks into the caller block tree or
4396 not refer to them in any way to not break GC for locations. */
4397 if (gimple_block (stmt))
4399 id->block = make_node (BLOCK);
4400 BLOCK_ABSTRACT_ORIGIN (id->block) = fn;
4401 BLOCK_SOURCE_LOCATION (id->block) = LOCATION_LOCUS (input_location);
4402 prepend_lexical_block (gimple_block (stmt), id->block);
4405 /* Local declarations will be replaced by their equivalents in this
4406 map. */
/* ST and DST hold the maps that were installed in ID on entry; they are
   put back in the clean-up section after copy_body.  */
4407 st = id->decl_map;
4408 id->decl_map = new hash_map<tree, tree>;
4409 dst = id->debug_map;
4410 id->debug_map = NULL;
4412 /* Record the function we are about to inline. */
4413 id->src_fn = fn;
4414 id->src_node = cg_edge->callee;
4415 id->src_cfun = DECL_STRUCT_FUNCTION (fn);
4416 id->gimple_call = stmt;
4418 gcc_assert (!id->src_cfun->after_inlining);
4420 id->entry_bb = bb;
4421 if (lookup_attribute ("cold", DECL_ATTRIBUTES (fn)))
4423 gimple_stmt_iterator si = gsi_last_bb (bb);
4424 gsi_insert_after (&si, gimple_build_predict (PRED_COLD_FUNCTION,
4425 NOT_TAKEN),
4426 GSI_NEW_STMT);
4428 initialize_inlined_parameters (id, stmt, fn, bb);
4430 if (DECL_INITIAL (fn))
4432 if (gimple_block (stmt))
4434 tree *var;
4436 prepend_lexical_block (id->block,
4437 remap_blocks (DECL_INITIAL (fn), id));
4438 gcc_checking_assert (BLOCK_SUBBLOCKS (id->block)
4439 && (BLOCK_CHAIN (BLOCK_SUBBLOCKS (id->block))
4440 == NULL_TREE));
4441 /* Move vars for PARM_DECLs from DECL_INITIAL block to id->block,
4442 otherwise for DWARF DW_TAG_formal_parameter will not be children of
4443 DW_TAG_inlined_subroutine, but of a DW_TAG_lexical_block
4444 under it. The parameters can be then evaluated in the debugger,
4445 but don't show in backtraces. */
4446 for (var = &BLOCK_VARS (BLOCK_SUBBLOCKS (id->block)); *var; )
4447 if (TREE_CODE (DECL_ORIGIN (*var)) == PARM_DECL)
4449 tree v = *var;
4450 *var = TREE_CHAIN (v);
4451 TREE_CHAIN (v) = BLOCK_VARS (id->block);
4452 BLOCK_VARS (id->block) = v;
4454 else
4455 var = &TREE_CHAIN (*var);
4457 else
4458 remap_blocks_to_null (DECL_INITIAL (fn), id);
4461 /* Return statements in the function body will be replaced by jumps
4462 to the RET_LABEL. */
/* NOTE(review): DECL_INITIAL (fn) is asserted unconditionally here even
   though the code just above tests it with an if.  */
4463 gcc_assert (DECL_INITIAL (fn));
4464 gcc_assert (TREE_CODE (DECL_INITIAL (fn)) == BLOCK);
4466 /* Find the LHS to which the result of this call is assigned. */
4467 return_slot = NULL;
4468 if (gimple_call_lhs (stmt))
4470 modify_dest = gimple_call_lhs (stmt);
4472 /* Remember where to copy returned bounds. */
4473 if (gimple_call_with_bounds_p (stmt)
4474 && TREE_CODE (modify_dest) == SSA_NAME)
4476 gimple retbnd = chkp_retbnd_call_by_val (modify_dest);
4477 if (retbnd)
4479 return_bounds = gimple_call_lhs (retbnd);
4480 /* If returned bounds are not used then just
4481 remove unused call. */
4482 if (!return_bounds)
4484 gimple_stmt_iterator iter = gsi_for_stmt (retbnd);
4485 gsi_remove (&iter, true);
4490 /* The function which we are inlining might not return a value,
4491 in which case we should issue a warning that the function
4492 does not return a value. In that case the optimizers will
4493 see that the variable to which the value is assigned was not
4494 initialized. We do not want to issue a warning about that
4495 uninitialized variable. */
4496 if (DECL_P (modify_dest))
4497 TREE_NO_WARNING (modify_dest) = 1;
4499 if (gimple_call_return_slot_opt_p (stmt))
4501 return_slot = modify_dest;
4502 modify_dest = NULL;
4505 else
4506 modify_dest = NULL;
4508 /* If we are inlining a call to the C++ operator new, we don't want
4509 to use type based alias analysis on the return value. Otherwise
4510 we may get confused if the compiler sees that the inlined new
4511 function returns a pointer which was just deleted. See bug
4512 33407. */
4513 if (DECL_IS_OPERATOR_NEW (fn))
4515 return_slot = NULL;
4516 modify_dest = NULL;
4519 /* Declare the return variable for the function. */
4520 use_retvar = declare_return_variable (id, return_slot, modify_dest,
4521 return_bounds, bb);
4523 /* Add local vars in this inlined callee to caller. */
4524 add_local_variables (id->src_cfun, cfun, id);
4526 if (dump_file && (dump_flags & TDF_DETAILS))
4528 fprintf (dump_file, "Inlining ");
4529 print_generic_expr (dump_file, id->src_fn, 0);
4530 fprintf (dump_file, " to ");
4531 print_generic_expr (dump_file, id->dst_fn, 0);
4532 fprintf (dump_file, " with frequency %i\n", cg_edge->frequency);
4535 /* This is it. Duplicate the callee body. Assume callee is
4536 pre-gimplified. Note that we must not alter the caller
4537 function in any way before this point, as this CALL_EXPR may be
4538 a self-referential call; if we're calling ourselves, we need to
4539 duplicate our body before altering anything. */
4540 copy_body (id, cg_edge->callee->count,
4541 GCOV_COMPUTE_SCALE (cg_edge->frequency, CGRAPH_FREQ_BASE),
4542 bb, return_block, NULL);
4544 /* Reset the escaped solution. */
4545 if (cfun->gimple_df)
4546 pt_solution_reset (&cfun->gimple_df->escaped);
4548 /* Clean up. */
4549 if (id->debug_map)
4551 delete id->debug_map;
4552 id->debug_map = dst;
4554 delete id->decl_map;
4555 id->decl_map = st;
4557 /* Unlink the calls virtual operands before replacing it. */
4558 unlink_stmt_vdef (stmt);
4559 if (gimple_vdef (stmt)
4560 && TREE_CODE (gimple_vdef (stmt)) == SSA_NAME)
4561 release_ssa_name (gimple_vdef (stmt));
4563 /* If the inlined function returns a result that we care about,
4564 substitute the GIMPLE_CALL with an assignment of the return
4565 variable to the LHS of the call. That is, if STMT was
4566 'a = foo (...)', substitute the call with 'a = USE_RETVAR'. */
4567 if (use_retvar && gimple_call_lhs (stmt))
4569 gimple old_stmt = stmt;
4570 stmt = gimple_build_assign (gimple_call_lhs (stmt), use_retvar);
4571 gsi_replace (&stmt_gsi, stmt, false);
4572 maybe_clean_or_replace_eh_stmt (old_stmt, stmt);
4574 /* Copy bounds if we copy structure with bounds. */
4575 if (chkp_function_instrumented_p (id->dst_fn)
4576 && !BOUNDED_P (use_retvar)
4577 && chkp_type_has_pointer (TREE_TYPE (use_retvar)))
4578 id->assign_stmts.safe_push (stmt);
4580 else
4582 /* Handle the case of inlining a function with no return
4583 statement, which causes the return value to become undefined. */
4584 if (gimple_call_lhs (stmt)
4585 && TREE_CODE (gimple_call_lhs (stmt)) == SSA_NAME)
4587 tree name = gimple_call_lhs (stmt);
4588 tree var = SSA_NAME_VAR (name);
4589 tree def = ssa_default_def (cfun, var);
4591 if (def)
4593 /* If the variable is used undefined, make this name
4594 undefined via a move. */
4595 stmt = gimple_build_assign (gimple_call_lhs (stmt), def);
4596 gsi_replace (&stmt_gsi, stmt, true);
4598 else
4600 /* Otherwise make this variable undefined. */
4601 gsi_remove (&stmt_gsi, true);
4602 set_ssa_default_def (cfun, var, name);
4603 SSA_NAME_DEF_STMT (name) = gimple_build_nop ();
4606 else
4607 gsi_remove (&stmt_gsi, true);
4610 /* Put returned bounds into the correct place if required. */
4611 if (return_bounds)
4613 gimple old_stmt = SSA_NAME_DEF_STMT (return_bounds);
4614 gimple new_stmt = gimple_build_assign (return_bounds, id->retbnd);
4615 gimple_stmt_iterator bnd_gsi = gsi_for_stmt (old_stmt);
4616 unlink_stmt_vdef (old_stmt);
4617 gsi_replace (&bnd_gsi, new_stmt, false);
4618 maybe_clean_or_replace_eh_stmt (old_stmt, new_stmt);
4619 cgraph_update_edges_for_call_stmt (old_stmt,
4620 gimple_call_fndecl (old_stmt),
4621 new_stmt);
4624 if (purge_dead_abnormal_edges)
4626 gimple_purge_dead_eh_edges (return_block);
4627 gimple_purge_dead_abnormal_call_edges (return_block);
4630 /* If the value of the new expression is ignored, that's OK. We
4631 don't warn about this for CALL_EXPRs, so we shouldn't warn about
4632 the equivalent inlined version either. */
4633 if (is_gimple_assign (stmt))
4635 gcc_assert (gimple_assign_single_p (stmt)
4636 || CONVERT_EXPR_CODE_P (gimple_assign_rhs_code (stmt)));
4637 TREE_USED (gimple_assign_rhs1 (stmt)) = 1;
4640 /* Copy bounds for all generated assigns that need it. */
4641 for (i = 0; i < id->assign_stmts.length (); i++)
4642 chkp_copy_bounds_for_assign (id->assign_stmts[i], cg_edge);
4643 id->assign_stmts.release ();
4645 /* Output the inlining info for this abstract function, since it has been
4646 inlined. If we don't do this now, we can lose the information about the
4647 variables in the function when the blocks get blown away as soon as we
4648 remove the cgraph node. */
4649 if (gimple_block (stmt))
4650 (*debug_hooks->outlining_inline_function) (cg_edge->callee->decl);
4652 /* Update callgraph if needed. */
4653 cg_edge->callee->remove ();
4655 id->block = NULL_TREE;
4656 successfully_inlined = TRUE;
4658 egress:
4659 input_location = saved_location;
4660 return successfully_inlined;
4663 /* Expand call statements reachable from STMT_P.
4664 We can only have CALL_EXPRs as the "toplevel" tree code or nested
4665 in a MODIFY_EXPR. */
4667 static bool
4668 gimple_expand_calls_inline (basic_block bb, copy_body_data *id)
4670 gimple_stmt_iterator gsi;
4672 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
4674 gimple stmt = gsi_stmt (gsi);
4676 if (is_gimple_call (stmt)
4677 && !gimple_call_internal_p (stmt)
4678 && expand_call_inline (bb, stmt, id))
4679 return true;
4682 return false;
4686 /* Walk all basic blocks created after FIRST and try to fold every statement
4687 in the STATEMENTS pointer set. */
4689 static void
4690 fold_marked_statements (int first, hash_set<gimple> *statements)
4692 for (; first < n_basic_blocks_for_fn (cfun); first++)
4693 if (BASIC_BLOCK_FOR_FN (cfun, first))
4695 gimple_stmt_iterator gsi;
4697 for (gsi = gsi_start_bb (BASIC_BLOCK_FOR_FN (cfun, first));
4698 !gsi_end_p (gsi);
4699 gsi_next (&gsi))
4700 if (statements->contains (gsi_stmt (gsi)))
4702 gimple old_stmt = gsi_stmt (gsi);
4703 tree old_decl = is_gimple_call (old_stmt) ? gimple_call_fndecl (old_stmt) : 0;
4705 if (old_decl && DECL_BUILT_IN (old_decl))
4707 /* Folding builtins can create multiple instructions,
4708 we need to look at all of them. */
4709 gimple_stmt_iterator i2 = gsi;
4710 gsi_prev (&i2);
4711 if (fold_stmt (&gsi))
4713 gimple new_stmt;
4714 /* If a builtin at the end of a bb folded into nothing,
4715 the following loop won't work. */
4716 if (gsi_end_p (gsi))
4718 cgraph_update_edges_for_call_stmt (old_stmt,
4719 old_decl, NULL);
4720 break;
4722 if (gsi_end_p (i2))
4723 i2 = gsi_start_bb (BASIC_BLOCK_FOR_FN (cfun, first));
4724 else
4725 gsi_next (&i2);
4726 while (1)
4728 new_stmt = gsi_stmt (i2);
4729 update_stmt (new_stmt);
4730 cgraph_update_edges_for_call_stmt (old_stmt, old_decl,
4731 new_stmt);
4733 if (new_stmt == gsi_stmt (gsi))
4735 /* It is okay to check only for the very last
4736 of these statements. If it is a throwing
4737 statement nothing will change. If it isn't
4738 this can remove EH edges. If that weren't
4739 correct then because some intermediate stmts
4740 throw, but not the last one. That would mean
4741 we'd have to split the block, which we can't
4742 here and we'd loose anyway. And as builtins
4743 probably never throw, this all
4744 is mood anyway. */
4745 if (maybe_clean_or_replace_eh_stmt (old_stmt,
4746 new_stmt))
4747 gimple_purge_dead_eh_edges (
4748 BASIC_BLOCK_FOR_FN (cfun, first));
4749 break;
4751 gsi_next (&i2);
4755 else if (fold_stmt (&gsi))
4757 /* Re-read the statement from GSI as fold_stmt() may
4758 have changed it. */
4759 gimple new_stmt = gsi_stmt (gsi);
4760 update_stmt (new_stmt);
4762 if (is_gimple_call (old_stmt)
4763 || is_gimple_call (new_stmt))
4764 cgraph_update_edges_for_call_stmt (old_stmt, old_decl,
4765 new_stmt);
4767 if (maybe_clean_or_replace_eh_stmt (old_stmt, new_stmt))
4768 gimple_purge_dead_eh_edges (BASIC_BLOCK_FOR_FN (cfun,
4769 first));
4775 /* Expand calls to inline functions in the body of FN. */
4777 unsigned int
4778 optimize_inline_calls (tree fn)
4780 copy_body_data id;
4781 basic_block bb;
4782 int last = n_basic_blocks_for_fn (cfun);
4783 bool inlined_p = false;
4785 /* Clear out ID. */
4786 memset (&id, 0, sizeof (id));
4788 id.src_node = id.dst_node = cgraph_node::get (fn);
4789 gcc_assert (id.dst_node->definition);
4790 id.dst_fn = fn;
4791 /* Or any functions that aren't finished yet. */
4792 if (current_function_decl)
4793 id.dst_fn = current_function_decl;
4795 id.copy_decl = copy_decl_maybe_to_var;
4796 id.transform_call_graph_edges = CB_CGE_DUPLICATE;
4797 id.transform_new_cfg = false;
4798 id.transform_return_to_modify = true;
4799 id.transform_parameter = true;
4800 id.transform_lang_insert_block = NULL;
4801 id.statements_to_fold = new hash_set<gimple>;
4803 push_gimplify_context ();
4805 /* We make no attempts to keep dominance info up-to-date. */
4806 free_dominance_info (CDI_DOMINATORS);
4807 free_dominance_info (CDI_POST_DOMINATORS);
4809 /* Register specific gimple functions. */
4810 gimple_register_cfg_hooks ();
4812 /* Reach the trees by walking over the CFG, and note the
4813 enclosing basic-blocks in the call edges. */
4814 /* We walk the blocks going forward, because inlined function bodies
4815 will split id->current_basic_block, and the new blocks will
4816 follow it; we'll trudge through them, processing their CALL_EXPRs
4817 along the way. */
4818 FOR_EACH_BB_FN (bb, cfun)
4819 inlined_p |= gimple_expand_calls_inline (bb, &id);
4821 pop_gimplify_context (NULL);
4823 #ifdef ENABLE_CHECKING
4825 struct cgraph_edge *e;
4827 id.dst_node->verify ();
4829 /* Double check that we inlined everything we are supposed to inline. */
4830 for (e = id.dst_node->callees; e; e = e->next_callee)
4831 gcc_assert (e->inline_failed);
4833 #endif
4835 /* Fold queued statements. */
4836 fold_marked_statements (last, id.statements_to_fold);
4837 delete id.statements_to_fold;
4839 gcc_assert (!id.debug_stmts.exists ());
4841 /* If we didn't inline into the function there is nothing to do. */
4842 if (!inlined_p)
4843 return 0;
4845 /* Renumber the lexical scoping (non-code) blocks consecutively. */
4846 number_blocks (fn);
4848 delete_unreachable_blocks_update_callgraph (&id);
4849 #ifdef ENABLE_CHECKING
4850 id.dst_node->verify ();
4851 #endif
4853 /* It would be nice to check SSA/CFG/statement consistency here, but it is
4854 not possible yet - the IPA passes might make various functions to not
4855 throw and they don't care to proactively update local EH info. This is
4856 done later in fixup_cfg pass that also execute the verification. */
4857 return (TODO_update_ssa
4858 | TODO_cleanup_cfg
4859 | (gimple_in_ssa_p (cfun) ? TODO_remove_unused_locals : 0)
4860 | (gimple_in_ssa_p (cfun) ? TODO_update_address_taken : 0)
4861 | (profile_status_for_fn (cfun) != PROFILE_ABSENT
4862 ? TODO_rebuild_frequencies : 0));
4865 /* Passed to walk_tree. Copies the node pointed to, if appropriate. */
4867 tree
4868 copy_tree_r (tree *tp, int *walk_subtrees, void *data ATTRIBUTE_UNUSED)
4870 enum tree_code code = TREE_CODE (*tp);
4871 enum tree_code_class cl = TREE_CODE_CLASS (code);
4873 /* We make copies of most nodes. */
4874 if (IS_EXPR_CODE_CLASS (cl)
4875 || code == TREE_LIST
4876 || code == TREE_VEC
4877 || code == TYPE_DECL
4878 || code == OMP_CLAUSE)
4880 /* Because the chain gets clobbered when we make a copy, we save it
4881 here. */
4882 tree chain = NULL_TREE, new_tree;
4884 if (CODE_CONTAINS_STRUCT (code, TS_COMMON))
4885 chain = TREE_CHAIN (*tp);
4887 /* Copy the node. */
4888 new_tree = copy_node (*tp);
4890 *tp = new_tree;
4892 /* Now, restore the chain, if appropriate. That will cause
4893 walk_tree to walk into the chain as well. */
4894 if (code == PARM_DECL
4895 || code == TREE_LIST
4896 || code == OMP_CLAUSE)
4897 TREE_CHAIN (*tp) = chain;
4899 /* For now, we don't update BLOCKs when we make copies. So, we
4900 have to nullify all BIND_EXPRs. */
4901 if (TREE_CODE (*tp) == BIND_EXPR)
4902 BIND_EXPR_BLOCK (*tp) = NULL_TREE;
4904 else if (code == CONSTRUCTOR)
4906 /* CONSTRUCTOR nodes need special handling because
4907 we need to duplicate the vector of elements. */
4908 tree new_tree;
4910 new_tree = copy_node (*tp);
4911 CONSTRUCTOR_ELTS (new_tree) = vec_safe_copy (CONSTRUCTOR_ELTS (*tp));
4912 *tp = new_tree;
4914 else if (code == STATEMENT_LIST)
4915 /* We used to just abort on STATEMENT_LIST, but we can run into them
4916 with statement-expressions (c++/40975). */
4917 copy_statement_list (tp);
4918 else if (TREE_CODE_CLASS (code) == tcc_type)
4919 *walk_subtrees = 0;
4920 else if (TREE_CODE_CLASS (code) == tcc_declaration)
4921 *walk_subtrees = 0;
4922 else if (TREE_CODE_CLASS (code) == tcc_constant)
4923 *walk_subtrees = 0;
4924 return NULL_TREE;
4927 /* The SAVE_EXPR pointed to by TP is being copied. If ST contains
4928 information indicating to what new SAVE_EXPR this one should be mapped,
4929 use that one. Otherwise, create a new node and enter it in ST. FN is
4930 the function into which the copy will be placed. */
4932 static void
4933 remap_save_expr (tree *tp, hash_map<tree, tree> *st, int *walk_subtrees)
4935 tree *n;
4936 tree t;
4938 /* See if we already encountered this SAVE_EXPR. */
4939 n = st->get (*tp);
4941 /* If we didn't already remap this SAVE_EXPR, do so now. */
4942 if (!n)
4944 t = copy_node (*tp);
4946 /* Remember this SAVE_EXPR. */
4947 st->put (*tp, t);
4948 /* Make sure we don't remap an already-remapped SAVE_EXPR. */
4949 st->put (t, t);
4951 else
4953 /* We've already walked into this SAVE_EXPR; don't do it again. */
4954 *walk_subtrees = 0;
4955 t = *n;
4958 /* Replace this SAVE_EXPR with the copy. */
4959 *tp = t;
4962 /* Called via walk_gimple_seq. If *GSIP points to a GIMPLE_LABEL for a local
4963 label, copies the declaration and enters it in the splay_tree in DATA (which
4964 is really a 'copy_body_data *'. */
4966 static tree
4967 mark_local_labels_stmt (gimple_stmt_iterator *gsip,
4968 bool *handled_ops_p ATTRIBUTE_UNUSED,
4969 struct walk_stmt_info *wi)
4971 copy_body_data *id = (copy_body_data *) wi->info;
4972 gimple stmt = gsi_stmt (*gsip);
4974 if (gimple_code (stmt) == GIMPLE_LABEL)
4976 tree decl = gimple_label_label (stmt);
4978 /* Copy the decl and remember the copy. */
4979 insert_decl_map (id, decl, id->copy_decl (decl, id));
4982 return NULL_TREE;
4986 /* Called via walk_gimple_seq by copy_gimple_seq_and_replace_local.
4987 Using the splay_tree pointed to by ST (which is really a `splay_tree'),
4988 remaps all local declarations to appropriate replacements in gimple
4989 operands. */
4991 static tree
4992 replace_locals_op (tree *tp, int *walk_subtrees, void *data)
4994 struct walk_stmt_info *wi = (struct walk_stmt_info*) data;
4995 copy_body_data *id = (copy_body_data *) wi->info;
4996 hash_map<tree, tree> *st = id->decl_map;
4997 tree *n;
4998 tree expr = *tp;
5000 /* Only a local declaration (variable or label). */
5001 if ((TREE_CODE (expr) == VAR_DECL
5002 && !TREE_STATIC (expr))
5003 || TREE_CODE (expr) == LABEL_DECL)
5005 /* Lookup the declaration. */
5006 n = st->get (expr);
5008 /* If it's there, remap it. */
5009 if (n)
5010 *tp = *n;
5011 *walk_subtrees = 0;
5013 else if (TREE_CODE (expr) == STATEMENT_LIST
5014 || TREE_CODE (expr) == BIND_EXPR
5015 || TREE_CODE (expr) == SAVE_EXPR)
5016 gcc_unreachable ();
5017 else if (TREE_CODE (expr) == TARGET_EXPR)
5019 /* Don't mess with a TARGET_EXPR that hasn't been expanded.
5020 It's OK for this to happen if it was part of a subtree that
5021 isn't immediately expanded, such as operand 2 of another
5022 TARGET_EXPR. */
5023 if (!TREE_OPERAND (expr, 1))
5025 TREE_OPERAND (expr, 1) = TREE_OPERAND (expr, 3);
5026 TREE_OPERAND (expr, 3) = NULL_TREE;
5030 /* Keep iterating. */
5031 return NULL_TREE;
5035 /* Called via walk_gimple_seq by copy_gimple_seq_and_replace_local.
5036 Using the splay_tree pointed to by ST (which is really a `splay_tree'),
5037 remaps all local declarations to appropriate replacements in gimple
5038 statements. */
5040 static tree
5041 replace_locals_stmt (gimple_stmt_iterator *gsip,
5042 bool *handled_ops_p ATTRIBUTE_UNUSED,
5043 struct walk_stmt_info *wi)
5045 copy_body_data *id = (copy_body_data *) wi->info;
5046 gimple stmt = gsi_stmt (*gsip);
5048 if (gimple_code (stmt) == GIMPLE_BIND)
5050 tree block = gimple_bind_block (stmt);
5052 if (block)
5054 remap_block (&block, id);
5055 gimple_bind_set_block (stmt, block);
5058 /* This will remap a lot of the same decls again, but this should be
5059 harmless. */
5060 if (gimple_bind_vars (stmt))
5061 gimple_bind_set_vars (stmt, remap_decls (gimple_bind_vars (stmt),
5062 NULL, id));
5065 /* Keep iterating. */
5066 return NULL_TREE;
5070 /* Copies everything in SEQ and replaces variables and labels local to
5071 current_function_decl. */
5073 gimple_seq
5074 copy_gimple_seq_and_replace_locals (gimple_seq seq)
5076 copy_body_data id;
5077 struct walk_stmt_info wi;
5078 gimple_seq copy;
5080 /* There's nothing to do for NULL_TREE. */
5081 if (seq == NULL)
5082 return seq;
5084 /* Set up ID. */
5085 memset (&id, 0, sizeof (id));
5086 id.src_fn = current_function_decl;
5087 id.dst_fn = current_function_decl;
5088 id.decl_map = new hash_map<tree, tree>;
5089 id.debug_map = NULL;
5091 id.copy_decl = copy_decl_no_change;
5092 id.transform_call_graph_edges = CB_CGE_DUPLICATE;
5093 id.transform_new_cfg = false;
5094 id.transform_return_to_modify = false;
5095 id.transform_parameter = false;
5096 id.transform_lang_insert_block = NULL;
5098 /* Walk the tree once to find local labels. */
5099 memset (&wi, 0, sizeof (wi));
5100 hash_set<tree> visited;
5101 wi.info = &id;
5102 wi.pset = &visited;
5103 walk_gimple_seq (seq, mark_local_labels_stmt, NULL, &wi);
5105 copy = gimple_seq_copy (seq);
5107 /* Walk the copy, remapping decls. */
5108 memset (&wi, 0, sizeof (wi));
5109 wi.info = &id;
5110 walk_gimple_seq (copy, replace_locals_stmt, replace_locals_op, &wi);
5112 /* Clean up. */
5113 delete id.decl_map;
5114 if (id.debug_map)
5115 delete id.debug_map;
5117 return copy;
5121 /* Allow someone to determine if SEARCH is a child of TOP from gdb. */
5123 static tree
5124 debug_find_tree_1 (tree *tp, int *walk_subtrees ATTRIBUTE_UNUSED, void *data)
5126 if (*tp == data)
5127 return (tree) data;
5128 else
5129 return NULL;
5132 DEBUG_FUNCTION bool
5133 debug_find_tree (tree top, tree search)
5135 return walk_tree_without_duplicates (&top, debug_find_tree_1, search) != 0;
5139 /* Declare the variables created by the inliner. Add all the variables in
5140 VARS to BIND_EXPR. */
5142 static void
5143 declare_inline_vars (tree block, tree vars)
5145 tree t;
5146 for (t = vars; t; t = DECL_CHAIN (t))
5148 DECL_SEEN_IN_BIND_EXPR_P (t) = 1;
5149 gcc_assert (!TREE_STATIC (t) && !TREE_ASM_WRITTEN (t));
5150 add_local_decl (cfun, t);
5153 if (block)
5154 BLOCK_VARS (block) = chainon (BLOCK_VARS (block), vars);
5157 /* Copy NODE (which must be a DECL). The DECL originally was in the FROM_FN,
5158 but now it will be in the TO_FN. PARM_TO_VAR means enable PARM_DECL to
5159 VAR_DECL translation. */
5161 static tree
5162 copy_decl_for_dup_finish (copy_body_data *id, tree decl, tree copy)
5164 /* Don't generate debug information for the copy if we wouldn't have
5165 generated it for the copy either. */
5166 DECL_ARTIFICIAL (copy) = DECL_ARTIFICIAL (decl);
5167 DECL_IGNORED_P (copy) = DECL_IGNORED_P (decl);
5169 /* Set the DECL_ABSTRACT_ORIGIN so the debugging routines know what
5170 declaration inspired this copy. */
5171 DECL_ABSTRACT_ORIGIN (copy) = DECL_ORIGIN (decl);
5173 /* The new variable/label has no RTL, yet. */
5174 if (CODE_CONTAINS_STRUCT (TREE_CODE (copy), TS_DECL_WRTL)
5175 && !TREE_STATIC (copy) && !DECL_EXTERNAL (copy))
5176 SET_DECL_RTL (copy, 0);
5178 /* These args would always appear unused, if not for this. */
5179 TREE_USED (copy) = 1;
5181 /* Set the context for the new declaration. */
5182 if (!DECL_CONTEXT (decl))
5183 /* Globals stay global. */
5185 else if (DECL_CONTEXT (decl) != id->src_fn)
5186 /* Things that weren't in the scope of the function we're inlining
5187 from aren't in the scope we're inlining to, either. */
5189 else if (TREE_STATIC (decl))
5190 /* Function-scoped static variables should stay in the original
5191 function. */
5193 else
5194 /* Ordinary automatic local variables are now in the scope of the
5195 new function. */
5196 DECL_CONTEXT (copy) = id->dst_fn;
5198 return copy;
5201 static tree
5202 copy_decl_to_var (tree decl, copy_body_data *id)
5204 tree copy, type;
5206 gcc_assert (TREE_CODE (decl) == PARM_DECL
5207 || TREE_CODE (decl) == RESULT_DECL);
5209 type = TREE_TYPE (decl);
5211 copy = build_decl (DECL_SOURCE_LOCATION (id->dst_fn),
5212 VAR_DECL, DECL_NAME (decl), type);
5213 if (DECL_PT_UID_SET_P (decl))
5214 SET_DECL_PT_UID (copy, DECL_PT_UID (decl));
5215 TREE_ADDRESSABLE (copy) = TREE_ADDRESSABLE (decl);
5216 TREE_READONLY (copy) = TREE_READONLY (decl);
5217 TREE_THIS_VOLATILE (copy) = TREE_THIS_VOLATILE (decl);
5218 DECL_GIMPLE_REG_P (copy) = DECL_GIMPLE_REG_P (decl);
5220 return copy_decl_for_dup_finish (id, decl, copy);
5223 /* Like copy_decl_to_var, but create a return slot object instead of a
5224 pointer variable for return by invisible reference. */
5226 static tree
5227 copy_result_decl_to_var (tree decl, copy_body_data *id)
5229 tree copy, type;
5231 gcc_assert (TREE_CODE (decl) == PARM_DECL
5232 || TREE_CODE (decl) == RESULT_DECL);
5234 type = TREE_TYPE (decl);
5235 if (DECL_BY_REFERENCE (decl))
5236 type = TREE_TYPE (type);
5238 copy = build_decl (DECL_SOURCE_LOCATION (id->dst_fn),
5239 VAR_DECL, DECL_NAME (decl), type);
5240 if (DECL_PT_UID_SET_P (decl))
5241 SET_DECL_PT_UID (copy, DECL_PT_UID (decl));
5242 TREE_READONLY (copy) = TREE_READONLY (decl);
5243 TREE_THIS_VOLATILE (copy) = TREE_THIS_VOLATILE (decl);
5244 if (!DECL_BY_REFERENCE (decl))
5246 TREE_ADDRESSABLE (copy) = TREE_ADDRESSABLE (decl);
5247 DECL_GIMPLE_REG_P (copy) = DECL_GIMPLE_REG_P (decl);
5250 return copy_decl_for_dup_finish (id, decl, copy);
5253 tree
5254 copy_decl_no_change (tree decl, copy_body_data *id)
5256 tree copy;
5258 copy = copy_node (decl);
5260 /* The COPY is not abstract; it will be generated in DST_FN. */
5261 DECL_ABSTRACT_P (copy) = false;
5262 lang_hooks.dup_lang_specific_decl (copy);
5264 /* TREE_ADDRESSABLE isn't used to indicate that a label's address has
5265 been taken; it's for internal bookkeeping in expand_goto_internal. */
5266 if (TREE_CODE (copy) == LABEL_DECL)
5268 TREE_ADDRESSABLE (copy) = 0;
5269 LABEL_DECL_UID (copy) = -1;
5272 return copy_decl_for_dup_finish (id, decl, copy);
5275 static tree
5276 copy_decl_maybe_to_var (tree decl, copy_body_data *id)
5278 if (TREE_CODE (decl) == PARM_DECL || TREE_CODE (decl) == RESULT_DECL)
5279 return copy_decl_to_var (decl, id);
5280 else
5281 return copy_decl_no_change (decl, id);
5284 /* Return a copy of the function's argument tree. */
5285 static tree
5286 copy_arguments_for_versioning (tree orig_parm, copy_body_data * id,
5287 bitmap args_to_skip, tree *vars)
5289 tree arg, *parg;
5290 tree new_parm = NULL;
5291 int i = 0;
5293 parg = &new_parm;
5295 for (arg = orig_parm; arg; arg = DECL_CHAIN (arg), i++)
5296 if (!args_to_skip || !bitmap_bit_p (args_to_skip, i))
5298 tree new_tree = remap_decl (arg, id);
5299 if (TREE_CODE (new_tree) != PARM_DECL)
5300 new_tree = id->copy_decl (arg, id);
5301 lang_hooks.dup_lang_specific_decl (new_tree);
5302 *parg = new_tree;
5303 parg = &DECL_CHAIN (new_tree);
5305 else if (!id->decl_map->get (arg))
5307 /* Make an equivalent VAR_DECL. If the argument was used
5308 as temporary variable later in function, the uses will be
5309 replaced by local variable. */
5310 tree var = copy_decl_to_var (arg, id);
5311 insert_decl_map (id, arg, var);
5312 /* Declare this new variable. */
5313 DECL_CHAIN (var) = *vars;
5314 *vars = var;
5316 return new_parm;
5319 /* Return a copy of the function's static chain. */
5320 static tree
5321 copy_static_chain (tree static_chain, copy_body_data * id)
5323 tree *chain_copy, *pvar;
5325 chain_copy = &static_chain;
5326 for (pvar = chain_copy; *pvar; pvar = &DECL_CHAIN (*pvar))
5328 tree new_tree = remap_decl (*pvar, id);
5329 lang_hooks.dup_lang_specific_decl (new_tree);
5330 DECL_CHAIN (new_tree) = DECL_CHAIN (*pvar);
5331 *pvar = new_tree;
5333 return static_chain;
5336 /* Return true if the function is allowed to be versioned.
5337 This is a guard for the versioning functionality. */
5339 bool
5340 tree_versionable_function_p (tree fndecl)
5342 return (!lookup_attribute ("noclone", DECL_ATTRIBUTES (fndecl))
5343 && copy_forbidden (DECL_STRUCT_FUNCTION (fndecl), fndecl) == NULL);
5346 /* Delete all unreachable basic blocks and update callgraph.
5347 Doing so is somewhat nontrivial because we need to update all clones and
5348 remove inline function that become unreachable. */
5350 static bool
5351 delete_unreachable_blocks_update_callgraph (copy_body_data *id)
5353 bool changed = false;
5354 basic_block b, next_bb;
5356 find_unreachable_blocks ();
5358 /* Delete all unreachable basic blocks. */
5360 for (b = ENTRY_BLOCK_PTR_FOR_FN (cfun)->next_bb; b
5361 != EXIT_BLOCK_PTR_FOR_FN (cfun); b = next_bb)
5363 next_bb = b->next_bb;
5365 if (!(b->flags & BB_REACHABLE))
5367 gimple_stmt_iterator bsi;
5369 for (bsi = gsi_start_bb (b); !gsi_end_p (bsi); gsi_next (&bsi))
5371 struct cgraph_edge *e;
5372 struct cgraph_node *node;
5374 id->dst_node->remove_stmt_references (gsi_stmt (bsi));
5376 if (gimple_code (gsi_stmt (bsi)) == GIMPLE_CALL
5377 &&(e = id->dst_node->get_edge (gsi_stmt (bsi))) != NULL)
5379 if (!e->inline_failed)
5380 e->callee->remove_symbol_and_inline_clones (id->dst_node);
5381 else
5382 e->remove ();
5384 if (id->transform_call_graph_edges == CB_CGE_MOVE_CLONES
5385 && id->dst_node->clones)
5386 for (node = id->dst_node->clones; node != id->dst_node;)
5388 node->remove_stmt_references (gsi_stmt (bsi));
5389 if (gimple_code (gsi_stmt (bsi)) == GIMPLE_CALL
5390 && (e = node->get_edge (gsi_stmt (bsi))) != NULL)
5392 if (!e->inline_failed)
5393 e->callee->remove_symbol_and_inline_clones (id->dst_node);
5394 else
5395 e->remove ();
5398 if (node->clones)
5399 node = node->clones;
5400 else if (node->next_sibling_clone)
5401 node = node->next_sibling_clone;
5402 else
5404 while (node != id->dst_node && !node->next_sibling_clone)
5405 node = node->clone_of;
5406 if (node != id->dst_node)
5407 node = node->next_sibling_clone;
5411 delete_basic_block (b);
5412 changed = true;
5416 return changed;
5419 /* Update clone info after duplication. */
5421 static void
5422 update_clone_info (copy_body_data * id)
5424 struct cgraph_node *node;
5425 if (!id->dst_node->clones)
5426 return;
5427 for (node = id->dst_node->clones; node != id->dst_node;)
5429 /* First update replace maps to match the new body. */
5430 if (node->clone.tree_map)
5432 unsigned int i;
5433 for (i = 0; i < vec_safe_length (node->clone.tree_map); i++)
5435 struct ipa_replace_map *replace_info;
5436 replace_info = (*node->clone.tree_map)[i];
5437 walk_tree (&replace_info->old_tree, copy_tree_body_r, id, NULL);
5438 walk_tree (&replace_info->new_tree, copy_tree_body_r, id, NULL);
5441 if (node->clones)
5442 node = node->clones;
5443 else if (node->next_sibling_clone)
5444 node = node->next_sibling_clone;
5445 else
5447 while (node != id->dst_node && !node->next_sibling_clone)
5448 node = node->clone_of;
5449 if (node != id->dst_node)
5450 node = node->next_sibling_clone;
5455 /* Create a copy of a function's tree.
5456 OLD_DECL and NEW_DECL are FUNCTION_DECL tree nodes
5457 of the original function and the new copied function
5458 respectively. In case we want to replace a DECL
5459 tree with another tree while duplicating the function's
5460 body, TREE_MAP represents the mapping between these
5461 trees. If UPDATE_CLONES is set, the call_stmt fields
5462 of edges of clones of the function will be updated.
5464 If non-NULL ARGS_TO_SKIP determine function parameters to remove
5465 from new version.
5466 If SKIP_RETURN is true, the new version will return void.
5467 If non-NULL BLOCK_TO_COPY determine what basic blocks to copy.
5468 If non_NULL NEW_ENTRY determine new entry BB of the clone.
5470 void
5471 tree_function_versioning (tree old_decl, tree new_decl,
5472 vec<ipa_replace_map *, va_gc> *tree_map,
5473 bool update_clones, bitmap args_to_skip,
5474 bool skip_return, bitmap blocks_to_copy,
5475 basic_block new_entry)
5477 struct cgraph_node *old_version_node;
5478 struct cgraph_node *new_version_node;
5479 copy_body_data id;
5480 tree p;
5481 unsigned i;
5482 struct ipa_replace_map *replace_info;
5483 basic_block old_entry_block, bb;
5484 auto_vec<gimple, 10> init_stmts;
5485 tree vars = NULL_TREE;
5487 gcc_assert (TREE_CODE (old_decl) == FUNCTION_DECL
5488 && TREE_CODE (new_decl) == FUNCTION_DECL);
5489 DECL_POSSIBLY_INLINED (old_decl) = 1;
5491 old_version_node = cgraph_node::get (old_decl);
5492 gcc_checking_assert (old_version_node);
5493 new_version_node = cgraph_node::get (new_decl);
5494 gcc_checking_assert (new_version_node);
5496 /* Copy over debug args. */
5497 if (DECL_HAS_DEBUG_ARGS_P (old_decl))
5499 vec<tree, va_gc> **new_debug_args, **old_debug_args;
5500 gcc_checking_assert (decl_debug_args_lookup (new_decl) == NULL);
5501 DECL_HAS_DEBUG_ARGS_P (new_decl) = 0;
5502 old_debug_args = decl_debug_args_lookup (old_decl);
5503 if (old_debug_args)
5505 new_debug_args = decl_debug_args_insert (new_decl);
5506 *new_debug_args = vec_safe_copy (*old_debug_args);
5510 /* Output the inlining info for this abstract function, since it has been
5511 inlined. If we don't do this now, we can lose the information about the
5512 variables in the function when the blocks get blown away as soon as we
5513 remove the cgraph node. */
5514 (*debug_hooks->outlining_inline_function) (old_decl);
5516 DECL_ARTIFICIAL (new_decl) = 1;
5517 DECL_ABSTRACT_ORIGIN (new_decl) = DECL_ORIGIN (old_decl);
5518 if (DECL_ORIGIN (old_decl) == old_decl)
5519 old_version_node->used_as_abstract_origin = true;
5520 DECL_FUNCTION_PERSONALITY (new_decl) = DECL_FUNCTION_PERSONALITY (old_decl);
5522 /* Prepare the data structures for the tree copy. */
5523 memset (&id, 0, sizeof (id));
5525 /* Generate a new name for the new version. */
5526 id.statements_to_fold = new hash_set<gimple>;
5528 id.decl_map = new hash_map<tree, tree>;
5529 id.debug_map = NULL;
5530 id.src_fn = old_decl;
5531 id.dst_fn = new_decl;
5532 id.src_node = old_version_node;
5533 id.dst_node = new_version_node;
5534 id.src_cfun = DECL_STRUCT_FUNCTION (old_decl);
5535 id.blocks_to_copy = blocks_to_copy;
5537 id.copy_decl = copy_decl_no_change;
5538 id.transform_call_graph_edges
5539 = update_clones ? CB_CGE_MOVE_CLONES : CB_CGE_MOVE;
5540 id.transform_new_cfg = true;
5541 id.transform_return_to_modify = false;
5542 id.transform_parameter = false;
5543 id.transform_lang_insert_block = NULL;
5545 old_entry_block = ENTRY_BLOCK_PTR_FOR_FN
5546 (DECL_STRUCT_FUNCTION (old_decl));
5547 DECL_RESULT (new_decl) = DECL_RESULT (old_decl);
5548 DECL_ARGUMENTS (new_decl) = DECL_ARGUMENTS (old_decl);
5549 initialize_cfun (new_decl, old_decl,
5550 old_entry_block->count);
5551 if (DECL_STRUCT_FUNCTION (new_decl)->gimple_df)
5552 DECL_STRUCT_FUNCTION (new_decl)->gimple_df->ipa_pta
5553 = id.src_cfun->gimple_df->ipa_pta;
5555 /* Copy the function's static chain. */
5556 p = DECL_STRUCT_FUNCTION (old_decl)->static_chain_decl;
5557 if (p)
5558 DECL_STRUCT_FUNCTION (new_decl)->static_chain_decl =
5559 copy_static_chain (DECL_STRUCT_FUNCTION (old_decl)->static_chain_decl,
5560 &id);
5562 /* If there's a tree_map, prepare for substitution. */
5563 if (tree_map)
5564 for (i = 0; i < tree_map->length (); i++)
5566 gimple init;
5567 replace_info = (*tree_map)[i];
5568 if (replace_info->replace_p)
5570 if (!replace_info->old_tree)
5572 int i = replace_info->parm_num;
5573 tree parm;
5574 tree req_type;
5576 for (parm = DECL_ARGUMENTS (old_decl); i; parm = DECL_CHAIN (parm))
5577 i --;
5578 replace_info->old_tree = parm;
5579 req_type = TREE_TYPE (parm);
5580 if (!useless_type_conversion_p (req_type, TREE_TYPE (replace_info->new_tree)))
5582 if (fold_convertible_p (req_type, replace_info->new_tree))
5583 replace_info->new_tree = fold_build1 (NOP_EXPR, req_type, replace_info->new_tree);
5584 else if (TYPE_SIZE (req_type) == TYPE_SIZE (TREE_TYPE (replace_info->new_tree)))
5585 replace_info->new_tree = fold_build1 (VIEW_CONVERT_EXPR, req_type, replace_info->new_tree);
5586 else
5588 if (dump_file)
5590 fprintf (dump_file, " const ");
5591 print_generic_expr (dump_file, replace_info->new_tree, 0);
5592 fprintf (dump_file, " can't be converted to param ");
5593 print_generic_expr (dump_file, parm, 0);
5594 fprintf (dump_file, "\n");
5596 replace_info->old_tree = NULL;
5600 else
5601 gcc_assert (TREE_CODE (replace_info->old_tree) == PARM_DECL);
5602 if (replace_info->old_tree)
5604 init = setup_one_parameter (&id, replace_info->old_tree,
5605 replace_info->new_tree, id.src_fn,
5606 NULL,
5607 &vars);
5608 if (init)
5609 init_stmts.safe_push (init);
5613 /* Copy the function's arguments. */
5614 if (DECL_ARGUMENTS (old_decl) != NULL_TREE)
5615 DECL_ARGUMENTS (new_decl) =
5616 copy_arguments_for_versioning (DECL_ARGUMENTS (old_decl), &id,
5617 args_to_skip, &vars);
5619 DECL_INITIAL (new_decl) = remap_blocks (DECL_INITIAL (id.src_fn), &id);
5620 BLOCK_SUPERCONTEXT (DECL_INITIAL (new_decl)) = new_decl;
5622 declare_inline_vars (DECL_INITIAL (new_decl), vars);
5624 if (!vec_safe_is_empty (DECL_STRUCT_FUNCTION (old_decl)->local_decls))
5625 /* Add local vars. */
5626 add_local_variables (DECL_STRUCT_FUNCTION (old_decl), cfun, &id);
5628 if (DECL_RESULT (old_decl) == NULL_TREE)
5630 else if (skip_return && !VOID_TYPE_P (TREE_TYPE (DECL_RESULT (old_decl))))
5632 DECL_RESULT (new_decl)
5633 = build_decl (DECL_SOURCE_LOCATION (DECL_RESULT (old_decl)),
5634 RESULT_DECL, NULL_TREE, void_type_node);
5635 DECL_CONTEXT (DECL_RESULT (new_decl)) = new_decl;
5636 cfun->returns_struct = 0;
5637 cfun->returns_pcc_struct = 0;
5639 else
5641 tree old_name;
5642 DECL_RESULT (new_decl) = remap_decl (DECL_RESULT (old_decl), &id);
5643 lang_hooks.dup_lang_specific_decl (DECL_RESULT (new_decl));
5644 if (gimple_in_ssa_p (id.src_cfun)
5645 && DECL_BY_REFERENCE (DECL_RESULT (old_decl))
5646 && (old_name = ssa_default_def (id.src_cfun, DECL_RESULT (old_decl))))
5648 tree new_name = make_ssa_name (DECL_RESULT (new_decl), NULL);
5649 insert_decl_map (&id, old_name, new_name);
5650 SSA_NAME_DEF_STMT (new_name) = gimple_build_nop ();
5651 set_ssa_default_def (cfun, DECL_RESULT (new_decl), new_name);
5655 /* Set up the destination functions loop tree. */
5656 if (loops_for_fn (DECL_STRUCT_FUNCTION (old_decl)) != NULL)
5658 cfun->curr_properties &= ~PROP_loops;
5659 loop_optimizer_init (AVOID_CFG_MODIFICATIONS);
5660 cfun->curr_properties |= PROP_loops;
5663 /* Copy the Function's body. */
5664 copy_body (&id, old_entry_block->count, REG_BR_PROB_BASE,
5665 ENTRY_BLOCK_PTR_FOR_FN (cfun), EXIT_BLOCK_PTR_FOR_FN (cfun),
5666 new_entry);
5668 /* Renumber the lexical scoping (non-code) blocks consecutively. */
5669 number_blocks (new_decl);
5671 /* We want to create the BB unconditionally, so that the addition of
5672 debug stmts doesn't affect BB count, which may in the end cause
5673 codegen differences. */
5674 bb = split_edge (single_succ_edge (ENTRY_BLOCK_PTR_FOR_FN (cfun)));
5675 while (init_stmts.length ())
5676 insert_init_stmt (&id, bb, init_stmts.pop ());
5677 update_clone_info (&id);
5679 /* Remap the nonlocal_goto_save_area, if any. */
5680 if (cfun->nonlocal_goto_save_area)
5682 struct walk_stmt_info wi;
5684 memset (&wi, 0, sizeof (wi));
5685 wi.info = &id;
5686 walk_tree (&cfun->nonlocal_goto_save_area, remap_gimple_op_r, &wi, NULL);
5689 /* Clean up. */
5690 delete id.decl_map;
5691 if (id.debug_map)
5692 delete id.debug_map;
5693 free_dominance_info (CDI_DOMINATORS);
5694 free_dominance_info (CDI_POST_DOMINATORS);
5696 fold_marked_statements (0, id.statements_to_fold);
5697 delete id.statements_to_fold;
5698 fold_cond_expr_cond ();
5699 delete_unreachable_blocks_update_callgraph (&id);
5700 if (id.dst_node->definition)
5701 cgraph_edge::rebuild_references ();
5702 if (loops_state_satisfies_p (LOOPS_NEED_FIXUP))
5704 calculate_dominance_info (CDI_DOMINATORS);
5705 fix_loop_structure (NULL);
5707 update_ssa (TODO_update_ssa);
5709 /* After partial cloning we need to rescale frequencies, so they are
5710 within proper range in the cloned function. */
5711 if (new_entry)
5713 struct cgraph_edge *e;
5714 rebuild_frequencies ();
5716 new_version_node->count = ENTRY_BLOCK_PTR_FOR_FN (cfun)->count;
5717 for (e = new_version_node->callees; e; e = e->next_callee)
5719 basic_block bb = gimple_bb (e->call_stmt);
5720 e->frequency = compute_call_stmt_bb_frequency (current_function_decl,
5721 bb);
5722 e->count = bb->count;
5724 for (e = new_version_node->indirect_calls; e; e = e->next_callee)
5726 basic_block bb = gimple_bb (e->call_stmt);
5727 e->frequency = compute_call_stmt_bb_frequency (current_function_decl,
5728 bb);
5729 e->count = bb->count;
5733 free_dominance_info (CDI_DOMINATORS);
5734 free_dominance_info (CDI_POST_DOMINATORS);
5736 gcc_assert (!id.debug_stmts.exists ());
5737 pop_cfun ();
5738 return;
5741 /* EXP is CALL_EXPR present in a GENERIC expression tree. Try to integrate
5742 the callee and return the inlined body on success. */
5744 tree
5745 maybe_inline_call_in_expr (tree exp)
5747 tree fn = get_callee_fndecl (exp);
5749 /* We can only try to inline "const" functions. */
5750 if (fn && TREE_READONLY (fn) && DECL_SAVED_TREE (fn))
5752 call_expr_arg_iterator iter;
5753 copy_body_data id;
5754 tree param, arg, t;
5755 hash_map<tree, tree> decl_map;
5757 /* Remap the parameters. */
5758 for (param = DECL_ARGUMENTS (fn), arg = first_call_expr_arg (exp, &iter);
5759 param;
5760 param = DECL_CHAIN (param), arg = next_call_expr_arg (&iter))
5761 decl_map.put (param, arg);
5763 memset (&id, 0, sizeof (id));
5764 id.src_fn = fn;
5765 id.dst_fn = current_function_decl;
5766 id.src_cfun = DECL_STRUCT_FUNCTION (fn);
5767 id.decl_map = &decl_map;
5769 id.copy_decl = copy_decl_no_change;
5770 id.transform_call_graph_edges = CB_CGE_DUPLICATE;
5771 id.transform_new_cfg = false;
5772 id.transform_return_to_modify = true;
5773 id.transform_parameter = true;
5774 id.transform_lang_insert_block = NULL;
5776 /* Make sure not to unshare trees behind the front-end's back
5777 since front-end specific mechanisms may rely on sharing. */
5778 id.regimplify = false;
5779 id.do_not_unshare = true;
5781 /* We're not inside any EH region. */
5782 id.eh_lp_nr = 0;
5784 t = copy_tree_body (&id);
5786 /* We can only return something suitable for use in a GENERIC
5787 expression tree. */
5788 if (TREE_CODE (t) == MODIFY_EXPR)
5789 return TREE_OPERAND (t, 1);
5792 return NULL_TREE;
5795 /* Duplicate a type, fields and all. */
5797 tree
5798 build_duplicate_type (tree type)
5800 struct copy_body_data id;
5802 memset (&id, 0, sizeof (id));
5803 id.src_fn = current_function_decl;
5804 id.dst_fn = current_function_decl;
5805 id.src_cfun = cfun;
5806 id.decl_map = new hash_map<tree, tree>;
5807 id.debug_map = NULL;
5808 id.copy_decl = copy_decl_no_change;
5810 type = remap_type_1 (type, &id);
5812 delete id.decl_map;
5813 if (id.debug_map)
5814 delete id.debug_map;
5816 TYPE_CANONICAL (type) = type;
5818 return type;
5821 /* Unshare the entire DECL_SAVED_TREE of FN and return the remapped
5822 parameters and RESULT_DECL in PARMS and RESULT. Used by C++ constexpr
5823 evaluation. */
5825 tree
5826 copy_fn (tree fn, tree& parms, tree& result)
5828 copy_body_data id;
5829 tree param;
5830 hash_map<tree, tree> decl_map;
5832 tree *p = &parms;
5833 *p = NULL_TREE;
5835 memset (&id, 0, sizeof (id));
5836 id.src_fn = fn;
5837 id.dst_fn = current_function_decl;
5838 id.src_cfun = DECL_STRUCT_FUNCTION (fn);
5839 id.decl_map = &decl_map;
5841 id.copy_decl = copy_decl_no_change;
5842 id.transform_call_graph_edges = CB_CGE_DUPLICATE;
5843 id.transform_new_cfg = false;
5844 id.transform_return_to_modify = false;
5845 id.transform_parameter = true;
5846 id.transform_lang_insert_block = NULL;
5848 /* Make sure not to unshare trees behind the front-end's back
5849 since front-end specific mechanisms may rely on sharing. */
5850 id.regimplify = false;
5851 id.do_not_unshare = true;
5853 /* We're not inside any EH region. */
5854 id.eh_lp_nr = 0;
5856 /* Remap the parameters and result and return them to the caller. */
5857 for (param = DECL_ARGUMENTS (fn);
5858 param;
5859 param = DECL_CHAIN (param))
5861 *p = remap_decl (param, &id);
5862 p = &DECL_CHAIN (*p);
5865 if (DECL_RESULT (fn))
5866 result = remap_decl (DECL_RESULT (fn), &id);
5867 else
5868 result = NULL_TREE;
5870 return copy_tree_body (&id);